LCOV - code coverage report
Current view: top level - sys/classes/ds/impls/ghiep - dsghiep.c (source / functions) Hit Total Coverage
Test: SLEPc Lines: 641 712 90.0 %
Date: 2024-11-21 00:34:55 Functions: 17 17 100.0 %
Legend: Lines: hit not hit

          Line data    Source code
       1             : /*
       2             :    - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
       3             :    SLEPc - Scalable Library for Eigenvalue Problem Computations
       4             :    Copyright (c) 2002-, Universitat Politecnica de Valencia, Spain
       5             : 
       6             :    This file is part of SLEPc.
       7             :    SLEPc is distributed under a 2-clause BSD license (see LICENSE).
       8             :    - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
       9             : */
      10             : 
      11             : #include <slepc/private/dsimpl.h>
      12             : #include <slepcblaslapack.h>
      13             : 
      14          58 : static PetscErrorCode DSAllocate_GHIEP(DS ds,PetscInt ld)
      15             : {
      16          58 :   PetscFunctionBegin;
      17          58 :   PetscCall(DSAllocateMat_Private(ds,DS_MAT_A));
      18          58 :   PetscCall(DSAllocateMat_Private(ds,DS_MAT_B));
      19          58 :   PetscCall(DSAllocateMat_Private(ds,DS_MAT_Q));
      20          58 :   PetscCall(DSAllocateMat_Private(ds,DS_MAT_T));
      21          58 :   PetscCall(DSAllocateMat_Private(ds,DS_MAT_D));
      22          58 :   PetscCall(PetscFree(ds->perm));
      23          58 :   PetscCall(PetscMalloc1(ld,&ds->perm));
      24          58 :   PetscFunctionReturn(PETSC_SUCCESS);
      25             : }
      26             : 
      27        2721 : PetscErrorCode DSSwitchFormat_GHIEP(DS ds,PetscBool tocompact)
      28             : {
      29        2721 :   PetscReal      *T,*S;
      30        2721 :   PetscScalar    *A,*B;
      31        2721 :   PetscInt       i,n,ld;
      32             : 
      33        2721 :   PetscFunctionBegin;
      34        2721 :   PetscCall(MatDenseGetArray(ds->omat[DS_MAT_A],&A));
      35        2721 :   PetscCall(MatDenseGetArray(ds->omat[DS_MAT_B],&B));
      36        2721 :   PetscCall(DSGetArrayReal(ds,DS_MAT_T,&T));
      37        2721 :   PetscCall(DSGetArrayReal(ds,DS_MAT_D,&S));
      38        2721 :   n = ds->n;
      39        2721 :   ld = ds->ld;
      40        2721 :   if (tocompact) { /* switch from dense (arrow) to compact storage */
      41           6 :     PetscCall(PetscArrayzero(T,n));
      42           6 :     PetscCall(PetscArrayzero(T+ld,n));
      43           6 :     PetscCall(PetscArrayzero(T+2*ld,n));
      44           6 :     PetscCall(PetscArrayzero(S,n));
      45          60 :     for (i=0;i<n-1;i++) {
      46          54 :       T[i]    = PetscRealPart(A[i+i*ld]);
      47          54 :       T[ld+i] = PetscRealPart(A[i+1+i*ld]);
      48          54 :       S[i]    = PetscRealPart(B[i+i*ld]);
      49             :     }
      50           6 :     T[n-1] = PetscRealPart(A[n-1+(n-1)*ld]);
      51           6 :     S[n-1] = PetscRealPart(B[n-1+(n-1)*ld]);
      52           6 :     for (i=ds->l;i<ds->k;i++) T[2*ld+i] = PetscRealPart(A[ds->k+i*ld]);
      53             :   } else { /* switch from compact (arrow) to dense storage */
      54       88467 :     for (i=0;i<n;i++) {
      55       85752 :       PetscCall(PetscArrayzero(A+i*ld,n));
      56       85752 :       PetscCall(PetscArrayzero(B+i*ld,n));
      57             :     }
      58       85752 :     for (i=0;i<n-1;i++) {
      59       83037 :       A[i+i*ld]     = T[i];
      60       83037 :       A[i+1+i*ld]   = T[ld+i];
      61       83037 :       A[i+(i+1)*ld] = T[ld+i];
      62       83037 :       B[i+i*ld]     = S[i];
      63             :     }
      64        2715 :     A[n-1+(n-1)*ld] = T[n-1];
      65        2715 :     B[n-1+(n-1)*ld] = S[n-1];
      66       44315 :     for (i=ds->l;i<ds->k;i++) {
      67       41600 :       A[ds->k+i*ld] = T[2*ld+i];
      68       41600 :       A[i+ds->k*ld] = T[2*ld+i];
      69             :     }
      70             :   }
      71        2721 :   PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_A],&A));
      72        2721 :   PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_B],&B));
      73        2721 :   PetscCall(DSRestoreArrayReal(ds,DS_MAT_T,&T));
      74        2721 :   PetscCall(DSRestoreArrayReal(ds,DS_MAT_D,&S));
      75        2721 :   PetscFunctionReturn(PETSC_SUCCESS);
      76             : }
      77             : 
      78          18 : static PetscErrorCode DSView_GHIEP(DS ds,PetscViewer viewer)
      79             : {
      80          18 :   PetscViewerFormat format;
      81          18 :   PetscInt          i,j;
      82          18 :   PetscReal         *T,*S,value;
      83          18 :   const char        *methodname[] = {
      84             :                      "QR + Inverse Iteration",
      85             :                      "HZ method",
      86             :                      "QR"
      87             :   };
      88          18 :   const int         nmeth=PETSC_STATIC_ARRAY_LENGTH(methodname);
      89             : 
      90          18 :   PetscFunctionBegin;
      91          18 :   PetscCall(PetscViewerGetFormat(viewer,&format));
      92          18 :   if (format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) {
      93          12 :     if (ds->method<nmeth) PetscCall(PetscViewerASCIIPrintf(viewer,"solving the problem with: %s\n",methodname[ds->method]));
      94          12 :     PetscFunctionReturn(PETSC_SUCCESS);
      95             :   }
      96           6 :   if (ds->compact) {
      97           6 :     PetscCall(DSGetArrayReal(ds,DS_MAT_T,&T));
      98           6 :     PetscCall(DSGetArrayReal(ds,DS_MAT_D,&S));
      99           6 :     PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE));
     100           6 :     if (format == PETSC_VIEWER_ASCII_MATLAB) {
     101           6 :       PetscCall(PetscViewerASCIIPrintf(viewer,"%% Size = %" PetscInt_FMT " %" PetscInt_FMT "\n",ds->n,ds->n));
     102           6 :       PetscCall(PetscViewerASCIIPrintf(viewer,"zzz = zeros(%" PetscInt_FMT ",3);\n",3*ds->n));
     103           6 :       PetscCall(PetscViewerASCIIPrintf(viewer,"zzz = [\n"));
     104          51 :       for (i=0;i<ds->n;i++) PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n",i+1,i+1,(double)T[i]));
     105          45 :       for (i=0;i<ds->n-1;i++) {
     106          39 :         if (T[i+ds->ld] !=0 && i!=ds->k-1) {
     107          12 :           PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n",i+2,i+1,(double)T[i+ds->ld]));
     108          39 :           PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n",i+1,i+2,(double)T[i+ds->ld]));
     109             :         }
     110             :       }
     111          15 :       for (i = ds->l;i<ds->k;i++) {
     112           9 :         if (T[i+2*ds->ld]) {
     113           9 :           PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n",ds->k+1,i+1,(double)T[i+2*ds->ld]));
     114           9 :           PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n",i+1,ds->k+1,(double)T[i+2*ds->ld]));
     115             :         }
     116             :       }
     117           6 :       PetscCall(PetscViewerASCIIPrintf(viewer,"];\n%s = spconvert(zzz);\n",DSMatName[DS_MAT_A]));
     118             : 
     119           6 :       PetscCall(PetscViewerASCIIPrintf(viewer,"%% Size = %" PetscInt_FMT " %" PetscInt_FMT "\n",ds->n,ds->n));
     120           6 :       PetscCall(PetscViewerASCIIPrintf(viewer,"omega = zeros(%" PetscInt_FMT ",3);\n",3*ds->n));
     121           6 :       PetscCall(PetscViewerASCIIPrintf(viewer,"omega = [\n"));
     122          51 :       for (i=0;i<ds->n;i++) PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n",i+1,i+1,(double)S[i]));
     123           6 :       PetscCall(PetscViewerASCIIPrintf(viewer,"];\n%s = spconvert(omega);\n",DSMatName[DS_MAT_B]));
     124             : 
     125             :     } else {
     126           0 :       PetscCall(PetscViewerASCIIPrintf(viewer,"T\n"));
     127           0 :       for (i=0;i<ds->n;i++) {
     128           0 :         for (j=0;j<ds->n;j++) {
     129           0 :           if (i==j) value = T[i];
     130           0 :           else if (i==j+1 || j==i+1) value = T[PetscMin(i,j)+ds->ld];
     131           0 :           else if ((i<ds->k && j==ds->k) || (i==ds->k && j<ds->k)) value = T[PetscMin(i,j)+2*ds->ld];
     132             :           else value = 0.0;
     133           0 :           PetscCall(PetscViewerASCIIPrintf(viewer," %18.16e ",(double)value));
     134             :         }
     135           0 :         PetscCall(PetscViewerASCIIPrintf(viewer,"\n"));
     136             :       }
     137           0 :       PetscCall(PetscViewerASCIIPrintf(viewer,"omega\n"));
     138           0 :       for (i=0;i<ds->n;i++) {
     139           0 :         for (j=0;j<ds->n;j++) {
     140           0 :           if (i==j) value = S[i];
     141             :           else value = 0.0;
     142           0 :           PetscCall(PetscViewerASCIIPrintf(viewer," %18.16e ",(double)value));
     143             :         }
     144           0 :         PetscCall(PetscViewerASCIIPrintf(viewer,"\n"));
     145             :       }
     146             :     }
     147           6 :     PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE));
     148           6 :     PetscCall(PetscViewerFlush(viewer));
     149           6 :     PetscCall(DSRestoreArrayReal(ds,DS_MAT_T,&T));
     150           6 :     PetscCall(DSRestoreArrayReal(ds,DS_MAT_D,&S));
     151             :   } else {
     152           0 :     PetscCall(DSViewMat(ds,viewer,DS_MAT_A));
     153           0 :     PetscCall(DSViewMat(ds,viewer,DS_MAT_B));
     154             :   }
     155           6 :   if (ds->state>DS_STATE_INTERMEDIATE) PetscCall(DSViewMat(ds,viewer,DS_MAT_Q));
     156           6 :   PetscFunctionReturn(PETSC_SUCCESS);
     157             : }
     158             : 
     159        3689 : static PetscErrorCode DSVectors_GHIEP_Eigen_Some(DS ds,PetscInt *idx,PetscReal *rnorm)
     160             : {
     161        3689 :   PetscReal         b[4],M[4],*T,*S,d1,d2,s1,s2,e,scal1,scal2,wr1,wr2,wi,ep,norm;
     162        3689 :   PetscScalar       *X,Y[4],alpha,szero=0.0;
     163        3689 :   const PetscScalar *A,*B,*Q;
     164        3689 :   PetscInt          k;
     165        3689 :   PetscBLASInt      two=2,n_,ld,one=1;
     166             : #if !defined(PETSC_USE_COMPLEX)
     167        3689 :   PetscBLASInt      four=4;
     168             : #endif
     169             : 
     170        3689 :   PetscFunctionBegin;
     171        3689 :   PetscCall(MatDenseGetArrayRead(ds->omat[DS_MAT_A],&A));
     172        3689 :   PetscCall(MatDenseGetArrayRead(ds->omat[DS_MAT_B],&B));
     173        3689 :   PetscCall(MatDenseGetArrayRead(ds->omat[DS_MAT_Q],&Q));
     174        3689 :   PetscCall(MatDenseGetArray(ds->omat[DS_MAT_X],&X));
     175        3689 :   PetscCall(DSGetArrayReal(ds,DS_MAT_T,&T));
     176        3689 :   PetscCall(DSGetArrayReal(ds,DS_MAT_D,&S));
     177        3689 :   k = *idx;
     178        3689 :   PetscCall(PetscBLASIntCast(ds->n,&n_));
     179        3689 :   PetscCall(PetscBLASIntCast(ds->ld,&ld));
     180        3689 :   if (k < ds->n-1) e = (ds->compact)?T[k+ld]:PetscRealPart(A[(k+1)+ld*k]);
     181             :   else e = 0.0;
     182        3689 :   if (e == 0.0) { /* Real */
     183        3640 :     if (ds->state>=DS_STATE_CONDENSED) PetscCall(PetscArraycpy(X+k*ld,Q+k*ld,ld));
     184             :     else {
     185           0 :       PetscCall(PetscArrayzero(X+k*ds->ld,ds->ld));
     186           0 :       X[k+k*ds->ld] = 1.0;
     187             :     }
     188        3640 :     if (rnorm) *rnorm = PetscAbsScalar(X[ds->n-1+k*ld]);
     189             :   } else { /* 2x2 block */
     190          49 :     if (ds->compact) {
     191          49 :       s1 = S[k];
     192          49 :       d1 = T[k];
     193          49 :       s2 = S[k+1];
     194          49 :       d2 = T[k+1];
     195             :     } else {
     196           0 :       s1 = PetscRealPart(B[k*ld+k]);
     197           0 :       d1 = PetscRealPart(A[k+k*ld]);
     198           0 :       s2 = PetscRealPart(B[(k+1)*ld+k+1]);
     199           0 :       d2 = PetscRealPart(A[k+1+(k+1)*ld]);
     200             :     }
     201          49 :     M[0] = d1; M[1] = e; M[2] = e; M[3]= d2;
     202          49 :     b[0] = s1; b[1] = 0.0; b[2] = 0.0; b[3] = s2;
     203          49 :     ep = LAPACKlamch_("S");
     204             :     /* Compute eigenvalues of the block */
     205          49 :     PetscCallBLAS("LAPACKlag2",LAPACKlag2_(M,&two,b,&two,&ep,&scal1,&scal2,&wr1,&wr2,&wi));
     206          49 :     PetscCheck(wi!=0.0,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Real block in DSVectors_GHIEP");
     207             :     /* Complex eigenvalues */
     208          49 :     PetscCheck(scal1>=ep,PETSC_COMM_SELF,PETSC_ERR_FP,"Nearly infinite eigenvalue");
     209          49 :     wr1 /= scal1;
     210          49 :     wi  /= scal1;
     211             : #if !defined(PETSC_USE_COMPLEX)
     212          49 :     if (SlepcAbs(s1*d1-wr1,wi)<SlepcAbs(s2*d2-wr1,wi)) {
     213           7 :       Y[0] = wr1-s2*d2; Y[1] = s2*e; Y[2] = wi; Y[3] = 0.0;
     214             :     } else {
     215          42 :       Y[0] = s1*e; Y[1] = wr1-s1*d1; Y[2] = 0.0; Y[3] = wi;
     216             :     }
     217          49 :     norm = BLASnrm2_(&four,Y,&one);
     218          49 :     norm = 1.0/norm;
     219          49 :     if (ds->state >= DS_STATE_CONDENSED) {
     220          33 :       alpha = norm;
     221          33 :       PetscCallBLAS("BLASgemm",BLASgemm_("N","N",&n_,&two,&two,&alpha,Q+k*ld,&ld,Y,&two,&szero,X+k*ld,&ld));
     222          33 :       if (rnorm) *rnorm = SlepcAbsEigenvalue(X[ds->n-1+k*ld],X[ds->n-1+(k+1)*ld]);
     223             :     } else {
     224          16 :       PetscCall(PetscArrayzero(X+k*ld,2*ld));
     225          16 :       X[k*ld+k]       = Y[0]*norm;
     226          16 :       X[k*ld+k+1]     = Y[1]*norm;
     227          16 :       X[(k+1)*ld+k]   = Y[2]*norm;
     228          16 :       X[(k+1)*ld+k+1] = Y[3]*norm;
     229             :     }
     230             : #else
     231             :     if (SlepcAbs(s1*d1-wr1,wi)<SlepcAbs(s2*d2-wr1,wi)) {
     232             :       Y[0] = PetscCMPLX(wr1-s2*d2,wi);
     233             :       Y[1] = s2*e;
     234             :     } else {
     235             :       Y[0] = s1*e;
     236             :       Y[1] = PetscCMPLX(wr1-s1*d1,wi);
     237             :     }
     238             :     norm = BLASnrm2_(&two,Y,&one);
     239             :     norm = 1.0/norm;
     240             :     if (ds->state >= DS_STATE_CONDENSED) {
     241             :       alpha = norm;
     242             :       PetscCallBLAS("BLASgemv",BLASgemv_("N",&n_,&two,&alpha,Q+k*ld,&ld,Y,&one,&szero,X+k*ld,&one));
     243             :       if (rnorm) *rnorm = PetscAbsScalar(X[ds->n-1+k*ld]);
     244             :     } else {
     245             :       PetscCall(PetscArrayzero(X+k*ld,2*ld));
     246             :       X[k*ld+k]   = Y[0]*norm;
     247             :       X[k*ld+k+1] = Y[1]*norm;
     248             :     }
     249             :     X[(k+1)*ld+k]   = PetscConj(X[k*ld+k]);
     250             :     X[(k+1)*ld+k+1] = PetscConj(X[k*ld+k+1]);
     251             : #endif
     252          49 :     (*idx)++;
     253             :   }
     254        3689 :   PetscCall(MatDenseRestoreArrayRead(ds->omat[DS_MAT_A],&A));
     255        3689 :   PetscCall(MatDenseRestoreArrayRead(ds->omat[DS_MAT_B],&B));
     256        3689 :   PetscCall(MatDenseRestoreArrayRead(ds->omat[DS_MAT_Q],&Q));
     257        3689 :   PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_X],&X));
     258        3689 :   PetscCall(DSRestoreArrayReal(ds,DS_MAT_T,&T));
     259        3689 :   PetscCall(DSRestoreArrayReal(ds,DS_MAT_D,&S));
     260        3689 :   PetscFunctionReturn(PETSC_SUCCESS);
     261             : }
     262             : 
     263        3702 : static PetscErrorCode DSVectors_GHIEP(DS ds,DSMatType mat,PetscInt *k,PetscReal *rnorm)
     264             : {
     265        3702 :   PetscScalar       *Z;
     266        3702 :   const PetscScalar *A,*Q;
     267        3702 :   PetscInt          i;
     268        3702 :   PetscReal         e,*T;
     269             : 
     270        3702 :   PetscFunctionBegin;
     271        3702 :   switch (mat) {
     272        3702 :     case DS_MAT_X:
     273             :     case DS_MAT_Y:
     274        3702 :       if (k) PetscCall(DSVectors_GHIEP_Eigen_Some(ds,k,rnorm));
     275             :       else {
     276          29 :         PetscCall(MatDenseGetArrayRead(ds->omat[DS_MAT_A],&A));
     277          29 :         PetscCall(MatDenseGetArrayRead(ds->omat[DS_MAT_Q],&Q));
     278          29 :         PetscCall(MatDenseGetArray(ds->omat[mat],&Z));
     279          29 :         PetscCall(DSGetArrayReal(ds,DS_MAT_T,&T));
     280         639 :         for (i=0; i<ds->n; i++) {
     281         610 :           e = (ds->compact)?T[i+ds->ld]:PetscRealPart(A[(i+1)+ds->ld*i]);
     282         610 :           if (e == 0.0) { /* real */
     283         594 :             if (ds->state >= DS_STATE_CONDENSED) PetscCall(PetscArraycpy(Z+i*ds->ld,Q+i*ds->ld,ds->ld));
     284             :             else {
     285         594 :               PetscCall(PetscArrayzero(Z+i*ds->ld,ds->ld));
     286         594 :               Z[i+i*ds->ld] = 1.0;
     287             :             }
     288         610 :           } else PetscCall(DSVectors_GHIEP_Eigen_Some(ds,&i,rnorm));
     289             :         }
     290          29 :         PetscCall(MatDenseRestoreArrayRead(ds->omat[DS_MAT_A],&A));
     291          29 :         PetscCall(MatDenseRestoreArrayRead(ds->omat[DS_MAT_Q],&Q));
     292          29 :         PetscCall(MatDenseRestoreArray(ds->omat[mat],&Z));
     293          29 :         PetscCall(DSRestoreArrayReal(ds,DS_MAT_T,&T));
     294             :       }
     295        3702 :       break;
     296           0 :     case DS_MAT_U:
     297             :     case DS_MAT_V:
     298           0 :       SETERRQ(PetscObjectComm((PetscObject)ds),PETSC_ERR_SUP,"Not implemented yet");
     299           0 :     default:
     300           0 :       SETERRQ(PetscObjectComm((PetscObject)ds),PETSC_ERR_ARG_OUTOFRANGE,"Invalid mat parameter");
     301             :   }
     302        3702 :   PetscFunctionReturn(PETSC_SUCCESS);
     303             : }
     304             : 
     305             : /*
     306             :   Extract the eigenvalues contained in the block-diagonal of the indefinite problem.
     307             :   Only the index range n0..n1 is processed.
     308             : */
     309        2759 : PetscErrorCode DSGHIEPComplexEigs(DS ds,PetscInt n0,PetscInt n1,PetscScalar *wr,PetscScalar *wi)
     310             : {
     311        2759 :   PetscInt          k,ld;
     312        2759 :   PetscBLASInt      two=2;
     313        2759 :   const PetscScalar *A,*B;
     314        2759 :   PetscReal         *D,*T,b[4],M[4],d1,d2,s1,s2,e,scal1,scal2,ep,wr1,wr2,wi1;
     315             : 
     316        2759 :   PetscFunctionBegin;
     317        2759 :   ld = ds->ld;
     318        2759 :   PetscCall(MatDenseGetArrayRead(ds->omat[DS_MAT_A],&A));
     319        2759 :   PetscCall(MatDenseGetArrayRead(ds->omat[DS_MAT_B],&B));
     320        2759 :   PetscCall(DSGetArrayReal(ds,DS_MAT_T,&T));
     321        2759 :   PetscCall(DSGetArrayReal(ds,DS_MAT_D,&D));
     322        4591 :   for (k=n0;k<n1;k++) {
     323        1832 :     if (k < n1-1) e = (ds->compact)?T[ld+k]:PetscRealPart(A[(k+1)+ld*k]);
     324             :     else e = 0.0;
     325        1832 :     if (e==0.0) { /* real eigenvalue */
     326        1827 :       wr[k] = (ds->compact)?T[k]/D[k]:A[k+k*ld]/B[k+k*ld];
     327             : #if !defined(PETSC_USE_COMPLEX)
     328        1827 :       wi[k] = 0.0 ;
     329             : #endif
     330             :     } else { /* diagonal block */
     331           5 :       if (ds->compact) {
     332           3 :         s1 = D[k];
     333           3 :         d1 = T[k];
     334           3 :         s2 = D[k+1];
     335           3 :         d2 = T[k+1];
     336             :       } else {
     337           2 :         s1 = PetscRealPart(B[k*ld+k]);
     338           2 :         d1 = PetscRealPart(A[k+k*ld]);
     339           2 :         s2 = PetscRealPart(B[(k+1)*ld+k+1]);
     340           2 :         d2 = PetscRealPart(A[k+1+(k+1)*ld]);
     341             :       }
     342           5 :       M[0] = d1; M[1] = e; M[2] = e; M[3]= d2;
     343           5 :       b[0] = s1; b[1] = 0.0; b[2] = 0.0; b[3] = s2;
     344           5 :       ep = LAPACKlamch_("S");
     345             :       /* Compute eigenvalues of the block */
     346           5 :       PetscCallBLAS("LAPACKlag2",LAPACKlag2_(M,&two,b,&two,&ep,&scal1,&scal2,&wr1,&wr2,&wi1));
     347           5 :       PetscCheck(scal1>=ep,PETSC_COMM_SELF,PETSC_ERR_FP,"Nearly infinite eigenvalue");
     348           5 :       if (wi1==0.0) { /* Real eigenvalues */
     349           0 :         PetscCheck(scal2>=ep,PETSC_COMM_SELF,PETSC_ERR_FP,"Nearly infinite eigenvalue");
     350           0 :         wr[k] = wr1/scal1; wr[k+1] = wr2/scal2;
     351             : #if !defined(PETSC_USE_COMPLEX)
     352           0 :         wi[k] = wi[k+1] = 0.0;
     353             : #endif
     354             :       } else { /* Complex eigenvalues */
     355             : #if !defined(PETSC_USE_COMPLEX)
     356           5 :         wr[k]   = wr1/scal1;
     357           5 :         wr[k+1] = wr[k];
     358           5 :         wi[k]   = wi1/scal1;
     359           5 :         wi[k+1] = -wi[k];
     360             : #else
     361             :         wr[k]   = PetscCMPLX(wr1,wi1)/scal1;
     362             :         wr[k+1] = PetscConj(wr[k]);
     363             : #endif
     364             :       }
     365           5 :       k++;
     366             :     }
     367             :   }
     368             : #if defined(PETSC_USE_COMPLEX)
     369             :   if (wi) {
     370             :     for (k=n0;k<n1;k++) wi[k] = 0.0;
     371             :   }
     372             : #endif
     373        2759 :   PetscCall(MatDenseRestoreArrayRead(ds->omat[DS_MAT_A],&A));
     374        2759 :   PetscCall(MatDenseRestoreArrayRead(ds->omat[DS_MAT_B],&B));
     375        2759 :   PetscCall(DSRestoreArrayReal(ds,DS_MAT_T,&T));
     376        2759 :   PetscCall(DSRestoreArrayReal(ds,DS_MAT_D,&D));
     377        2759 :   PetscFunctionReturn(PETSC_SUCCESS);
     378             : }
     379             : 
     380        2759 : static PetscErrorCode DSSort_GHIEP(DS ds,PetscScalar *wr,PetscScalar *wi,PetscScalar *rr,PetscScalar *ri,PetscInt *k)
     381             : {
     382        2759 :   PetscInt       n,i,*perm;
     383        2759 :   PetscReal      *d,*e,*s;
     384             : 
     385        2759 :   PetscFunctionBegin;
     386             : #if !defined(PETSC_USE_COMPLEX)
     387        2759 :   PetscAssertPointer(wi,3);
     388             : #endif
     389        2759 :   n = ds->n;
     390        2759 :   PetscCall(DSGetArrayReal(ds,DS_MAT_T,&d));
     391        2759 :   e = d + ds->ld;
     392        2759 :   PetscCall(DSGetArrayReal(ds,DS_MAT_D,&s));
     393        2759 :   PetscCall(DSAllocateWork_Private(ds,ds->ld,ds->ld,0));
     394        2759 :   perm = ds->perm;
     395        2759 :   if (!rr) {
     396        2759 :     rr = wr;
     397        2759 :     ri = wi;
     398             :   }
     399        2759 :   PetscCall(DSSortEigenvalues_Private(ds,rr,ri,perm,PETSC_TRUE));
     400        2759 :   if (!ds->compact) PetscCall(DSSwitchFormat_GHIEP(ds,PETSC_TRUE));
     401        2759 :   PetscCall(PetscArraycpy(ds->work,wr,n));
     402       88953 :   for (i=ds->l;i<n;i++) wr[i] = *(ds->work+perm[i]);
     403             : #if !defined(PETSC_USE_COMPLEX)
     404        2759 :   PetscCall(PetscArraycpy(ds->work,wi,n));
     405       88953 :   for (i=ds->l;i<n;i++) wi[i] = *(ds->work+perm[i]);
     406             : #endif
     407        2759 :   PetscCall(PetscArraycpy(ds->rwork,s,n));
     408       88953 :   for (i=ds->l;i<n;i++) s[i] = *(ds->rwork+perm[i]);
     409        2759 :   PetscCall(PetscArraycpy(ds->rwork,d,n));
     410       88953 :   for (i=ds->l;i<n;i++) d[i] = *(ds->rwork+perm[i]);
     411        2759 :   PetscCall(PetscArraycpy(ds->rwork,e,n-1));
     412        2759 :   PetscCall(PetscArrayzero(e+ds->l,n-1-ds->l));
     413       86194 :   for (i=ds->l;i<n-1;i++) {
     414       83435 :     if (perm[i]<n-1) e[i] = *(ds->rwork+perm[i]);
     415             :   }
     416        2759 :   if (!ds->compact) PetscCall(DSSwitchFormat_GHIEP(ds,PETSC_FALSE));
     417        2759 :   PetscCall(DSPermuteColumns_Private(ds,ds->l,n,n,DS_MAT_Q,perm));
     418        2759 :   PetscCall(DSRestoreArrayReal(ds,DS_MAT_T,&d));
     419        2759 :   PetscCall(DSRestoreArrayReal(ds,DS_MAT_D,&s));
     420        2759 :   PetscFunctionReturn(PETSC_SUCCESS);
     421             : }
     422             : 
     423        2750 : static PetscErrorCode DSUpdateExtraRow_GHIEP(DS ds)
     424             : {
     425        2750 :   PetscInt          i;
     426        2750 :   PetscBLASInt      n,ld,incx=1;
     427        2750 :   PetscScalar       *A,*x,*y,one=1.0,zero=0.0;
     428        2750 :   const PetscScalar *Q;
     429        2750 :   PetscReal         *T,*b,*r,beta;
     430             : 
     431        2750 :   PetscFunctionBegin;
     432        2750 :   PetscCall(PetscBLASIntCast(ds->n,&n));
     433        2750 :   PetscCall(PetscBLASIntCast(ds->ld,&ld));
     434        2750 :   PetscCall(MatDenseGetArrayRead(ds->omat[DS_MAT_Q],&Q));
     435        2750 :   if (ds->compact) {
     436        2747 :     PetscCall(DSGetArrayReal(ds,DS_MAT_T,&T));
     437        2747 :     b = T+ld;
     438        2747 :     r = T+2*ld;
     439        2747 :     beta = b[n-1];   /* in compact, we assume all entries are zero except the last one */
     440       90645 :     for (i=0;i<n;i++) r[i] = PetscRealPart(beta*Q[n-1+i*ld]);
     441        2747 :     ds->k = n;
     442        2747 :     PetscCall(DSRestoreArrayReal(ds,DS_MAT_T,&T));
     443             :   } else {
     444           3 :     PetscCall(MatDenseGetArray(ds->omat[DS_MAT_A],&A));
     445           3 :     PetscCall(DSAllocateWork_Private(ds,2*ld,0,0));
     446           3 :     x = ds->work;
     447           3 :     y = ds->work+ld;
     448          33 :     for (i=0;i<n;i++) x[i] = PetscConj(A[n+i*ld]);
     449           3 :     PetscCallBLAS("BLASgemv",BLASgemv_("C",&n,&n,&one,Q,&ld,x,&incx,&zero,y,&incx));
     450          33 :     for (i=0;i<n;i++) A[n+i*ld] = PetscConj(y[i]);
     451           3 :     ds->k = n;
     452           3 :     PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_A],&A));
     453             :   }
     454        2750 :   PetscCall(MatDenseRestoreArrayRead(ds->omat[DS_MAT_Q],&Q));
     455        2750 :   PetscFunctionReturn(PETSC_SUCCESS);
     456             : }
     457             : 
     458             : /*
     459             :   Get eigenvectors with inverse iteration.
     460             :   The system matrix is in Hessenberg form.
     461             : */
     462        2750 : PetscErrorCode DSGHIEPInverseIteration(DS ds,PetscScalar *wr,PetscScalar *wi)
     463             : {
     464        2750 :   PetscInt          i,off;
     465        2750 :   PetscBLASInt      *select,*infoC,ld,n1,mout,info;
     466        2750 :   const PetscScalar *A,*B;
     467        2750 :   PetscScalar       *H,*X;
     468        2750 :   PetscReal         *s,*d,*e;
     469             : #if defined(PETSC_USE_COMPLEX)
     470             :   PetscInt          j;
     471             : #endif
     472             : 
     473        2750 :   PetscFunctionBegin;
     474        2750 :   PetscCall(PetscBLASIntCast(ds->ld,&ld));
     475        2750 :   PetscCall(PetscBLASIntCast(ds->n-ds->l,&n1));
     476        2750 :   PetscCall(DSAllocateWork_Private(ds,ld*ld+2*ld,ld,2*ld));
     477        2750 :   PetscCall(DSAllocateMat_Private(ds,DS_MAT_W));
     478        2750 :   PetscCall(MatDenseGetArrayRead(ds->omat[DS_MAT_A],&A));
     479        2750 :   PetscCall(MatDenseGetArrayRead(ds->omat[DS_MAT_B],&B));
     480        2750 :   PetscCall(MatDenseGetArrayWrite(ds->omat[DS_MAT_W],&H));
     481        2750 :   PetscCall(DSGetArrayReal(ds,DS_MAT_T,&d));
     482        2750 :   PetscCall(DSGetArrayReal(ds,DS_MAT_D,&s));
     483        2750 :   e = d + ld;
     484        2750 :   select = ds->iwork;
     485        2750 :   infoC = ds->iwork + ld;
     486        2750 :   off = ds->l+ds->l*ld;
     487        2750 :   if (ds->compact) {
     488        2748 :     H[off] = d[ds->l]*s[ds->l];
     489        2748 :     H[off+ld] = e[ds->l]*s[ds->l];
     490       83367 :     for (i=ds->l+1;i<ds->n-1;i++) {
     491       80619 :       H[i+(i-1)*ld] = e[i-1]*s[i];
     492       80619 :       H[i+i*ld] = d[i]*s[i];
     493       80619 :       H[i+(i+1)*ld] = e[i]*s[i];
     494             :     }
     495        2748 :     H[ds->n-1+(ds->n-2)*ld] = e[ds->n-2]*s[ds->n-1];
     496        2748 :     H[ds->n-1+(ds->n-1)*ld] = d[ds->n-1]*s[ds->n-1];
     497             :   } else {
     498           2 :     s[ds->l]  = PetscRealPart(B[off]);
     499           2 :     H[off]    = A[off]*s[ds->l];
     500           2 :     H[off+ld] = A[off+ld]*s[ds->l];
     501          18 :     for (i=ds->l+1;i<ds->n-1;i++) {
     502          16 :       s[i] = PetscRealPart(B[i+i*ld]);
     503          16 :       H[i+(i-1)*ld] = A[i+(i-1)*ld]*s[i];
     504          16 :       H[i+i*ld]     = A[i+i*ld]*s[i];
     505          16 :       H[i+(i+1)*ld] = A[i+(i+1)*ld]*s[i];
     506             :     }
     507           2 :     s[ds->n-1] = PetscRealPart(B[ds->n-1+(ds->n-1)*ld]);
     508           2 :     H[ds->n-1+(ds->n-2)*ld] = A[ds->n-1+(ds->n-2)*ld]*s[ds->n-1];
     509           2 :     H[ds->n-1+(ds->n-1)*ld] = A[ds->n-1+(ds->n-1)*ld]*s[ds->n-1];
     510             :   }
     511        2750 :   PetscCall(DSAllocateMat_Private(ds,DS_MAT_X));
     512        2750 :   PetscCall(MatDenseGetArray(ds->omat[DS_MAT_X],&X));
     513       88885 :   for (i=0;i<n1;i++) select[i] = 1;
     514             : #if !defined(PETSC_USE_COMPLEX)
     515        2750 :   PetscCallBLAS("LAPACKhsein",LAPACKhsein_("R","N","N",select,&n1,H+off,&ld,wr+ds->l,wi+ds->l,NULL,&ld,X+off,&ld,&n1,&mout,ds->work,NULL,infoC,&info));
     516             : #else
     517             :   PetscCallBLAS("LAPACKhsein",LAPACKhsein_("R","N","N",select,&n1,H+off,&ld,wr+ds->l,NULL,&ld,X+off,&ld,&n1,&mout,ds->work,ds->rwork,NULL,infoC,&info));
     518             : 
     519             :   /* Separate real and imaginary part of complex eigenvectors */
     520             :   for (j=ds->l;j<ds->n;j++) {
     521             :     if (PetscAbsReal(PetscImaginaryPart(wr[j])) > PetscAbsScalar(wr[j])*PETSC_SQRT_MACHINE_EPSILON) {
     522             :       for (i=ds->l;i<ds->n;i++) {
     523             :         X[i+(j+1)*ds->ld] = PetscImaginaryPart(X[i+j*ds->ld]);
     524             :         X[i+j*ds->ld] = PetscRealPart(X[i+j*ds->ld]);
     525             :       }
     526             :       j++;
     527             :     }
     528             :   }
     529             : #endif
     530        2750 :   SlepcCheckLapackInfo("hsein",info);
     531        2750 :   PetscCall(MatDenseRestoreArrayRead(ds->omat[DS_MAT_A],&A));
     532        2750 :   PetscCall(MatDenseRestoreArrayRead(ds->omat[DS_MAT_B],&B));
     533        2750 :   PetscCall(MatDenseRestoreArrayWrite(ds->omat[DS_MAT_W],&H));
     534        2750 :   PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_X],&X));
     535        2750 :   PetscCall(DSRestoreArrayReal(ds,DS_MAT_T,&d));
     536        2750 :   PetscCall(DSRestoreArrayReal(ds,DS_MAT_D,&s));
     537        2750 :   PetscCall(DSGHIEPOrthogEigenv(ds,DS_MAT_X,wr,wi,PETSC_TRUE));
     538        2750 :   PetscFunctionReturn(PETSC_SUCCESS);
     539             : }
     540             : 
     541             : /*
     542             :    Undo 2x2 blocks that have real eigenvalues.
     543             : */
     544           3 : PetscErrorCode DSGHIEPRealBlocks(DS ds)
     545             : {
     546           3 :   PetscInt       i;
     547           3 :   PetscReal      e,d1,d2,s1,s2,ss1,ss2,t,dd,ss;
     548           3 :   PetscReal      maxy,ep,scal1,scal2,snorm;
     549           3 :   PetscReal      *T,*D,b[4],M[4],wr1,wr2,wi;
     550           3 :   PetscScalar    *A,*B,*Q,Y[4],sone=1.0,szero=0.0;
     551           3 :   PetscBLASInt   m,two=2,ld;
     552           3 :   PetscBool      isreal;
     553             : 
     554           3 :   PetscFunctionBegin;
     555           3 :   PetscCall(PetscBLASIntCast(ds->ld,&ld));
     556           3 :   PetscCall(PetscBLASIntCast(ds->n-ds->l,&m));
     557           3 :   PetscCall(MatDenseGetArray(ds->omat[DS_MAT_A],&A));
     558           3 :   PetscCall(MatDenseGetArray(ds->omat[DS_MAT_B],&B));
     559           3 :   PetscCall(MatDenseGetArray(ds->omat[DS_MAT_Q],&Q));
     560           3 :   PetscCall(DSGetArrayReal(ds,DS_MAT_T,&T));
     561           3 :   PetscCall(DSGetArrayReal(ds,DS_MAT_D,&D));
     562           3 :   PetscCall(DSAllocateWork_Private(ds,2*m,0,0));
     563          23 :   for (i=ds->l;i<ds->n-1;i++) {
     564          20 :     e = (ds->compact)?T[ld+i]:PetscRealPart(A[(i+1)+ld*i]);
     565          20 :     if (e != 0.0) { /* 2x2 block */
     566           5 :       if (ds->compact) {
     567           1 :         s1 = D[i];
     568           1 :         d1 = T[i];
     569           1 :         s2 = D[i+1];
     570           1 :         d2 = T[i+1];
     571             :       } else {
     572           4 :         s1 = PetscRealPart(B[i*ld+i]);
     573           4 :         d1 = PetscRealPart(A[i*ld+i]);
     574           4 :         s2 = PetscRealPart(B[(i+1)*ld+i+1]);
     575           4 :         d2 = PetscRealPart(A[(i+1)*ld+i+1]);
     576             :       }
     577           5 :       isreal = PETSC_FALSE;
     578           5 :       if (s1==s2) { /* apply a Jacobi rotation to compute the eigendecomposition */
     579           0 :         dd = d1-d2;
     580           0 :         if (2*PetscAbsReal(e) <= dd) {
     581           0 :           t = 2*e/dd;
     582           0 :           t = t/(1 + PetscSqrtReal(1+t*t));
     583             :         } else {
     584           0 :           t = dd/(2*e);
     585           0 :           ss = (t>=0)?1.0:-1.0;
     586           0 :           t = ss/(PetscAbsReal(t)+PetscSqrtReal(1+t*t));
     587             :         }
     588           0 :         Y[0] = 1/PetscSqrtReal(1 + t*t); Y[3] = Y[0]; /* c */
     589           0 :         Y[1] = Y[0]*t; Y[2] = -Y[1]; /* s */
     590           0 :         wr1 = d1+t*e; wr2 = d2-t*e;
     591           0 :         ss1 = s1; ss2 = s2;
     592           0 :         isreal = PETSC_TRUE;
     593             :       } else {
     594           5 :         ss1 = 1.0; ss2 = 1.0,
     595           5 :         M[0] = d1; M[1] = e; M[2] = e; M[3]= d2;
     596           5 :         b[0] = s1; b[1] = 0.0; b[2] = 0.0; b[3] = s2;
     597           5 :         ep = LAPACKlamch_("S");
     598             : 
     599             :         /* Compute eigenvalues of the block */
     600           5 :         PetscCallBLAS("LAPACKlag2",LAPACKlag2_(M,&two,b,&two,&ep,&scal1,&scal2,&wr1,&wr2,&wi));
     601           5 :         if (wi==0.0) { /* Real eigenvalues */
     602           2 :           isreal = PETSC_TRUE;
     603           2 :           PetscCheck(scal1>=ep && scal2>=ep,PETSC_COMM_SELF,PETSC_ERR_FP,"Nearly infinite eigenvalue");
     604           2 :           wr1 /= scal1;
     605           2 :           wr2 /= scal2;
     606           2 :           if (PetscAbsReal(s1*d1-wr1)<PetscAbsReal(s2*d2-wr1)) {
     607           0 :             Y[0] = wr1-s2*d2;
     608           0 :             Y[1] = s2*e;
     609             :           } else {
     610           2 :             Y[0] = s1*e;
     611           2 :             Y[1] = wr1-s1*d1;
     612             :           }
     613             :           /* normalize with a signature*/
     614           2 :           maxy = PetscMax(PetscAbsScalar(Y[0]),PetscAbsScalar(Y[1]));
     615           2 :           scal1 = PetscRealPart(Y[0])/maxy;
     616           2 :           scal2 = PetscRealPart(Y[1])/maxy;
     617           2 :           snorm = scal1*scal1*s1 + scal2*scal2*s2;
     618           2 :           if (snorm<0) { ss1 = -1.0; snorm = -snorm; }
     619           2 :           snorm = maxy*PetscSqrtReal(snorm);
     620           2 :           Y[0] = Y[0]/snorm;
     621           2 :           Y[1] = Y[1]/snorm;
     622           2 :           if (PetscAbsReal(s1*d1-wr2)<PetscAbsReal(s2*d2-wr2)) {
     623           2 :             Y[2] = wr2-s2*d2;
     624           2 :             Y[3] = s2*e;
     625             :           } else {
     626           0 :             Y[2] = s1*e;
     627           0 :             Y[3] = wr2-s1*d1;
     628             :           }
     629           2 :           maxy = PetscMax(PetscAbsScalar(Y[2]),PetscAbsScalar(Y[3]));
     630           2 :           scal1 = PetscRealPart(Y[2])/maxy;
     631           2 :           scal2 = PetscRealPart(Y[3])/maxy;
     632           2 :           snorm = scal1*scal1*s1 + scal2*scal2*s2;
     633           2 :           if (snorm<0) { ss2 = -1.0; snorm = -snorm; }
     634           2 :           snorm = maxy*PetscSqrtReal(snorm); Y[2] = Y[2]/snorm; Y[3] = Y[3]/snorm;
     635             :         }
     636           5 :         wr1 *= ss1; wr2 *= ss2;
     637             :       }
     638           5 :       if (isreal) {
     639           2 :         if (ds->compact) {
     640           0 :           D[i]    = ss1;
     641           0 :           T[i]    = wr1;
     642           0 :           D[i+1]  = ss2;
     643           0 :           T[i+1]  = wr2;
     644           0 :           T[ld+i] = 0.0;
     645             :         } else {
     646           2 :           B[i*ld+i]       = ss1;
     647           2 :           A[i*ld+i]       = wr1;
     648           2 :           B[(i+1)*ld+i+1] = ss2;
     649           2 :           A[(i+1)*ld+i+1] = wr2;
     650           2 :           A[(i+1)+ld*i]   = 0.0;
     651           2 :           A[i+ld*(i+1)]   = 0.0;
     652             :         }
     653           2 :         PetscCallBLAS("BLASgemm",BLASgemm_("N","N",&m,&two,&two,&sone,Q+ds->l+i*ld,&ld,Y,&two,&szero,ds->work,&m));
     654           2 :         PetscCall(PetscArraycpy(Q+ds->l+i*ld,ds->work,m));
     655           2 :         PetscCall(PetscArraycpy(Q+ds->l+(i+1)*ld,ds->work+m,m));
     656             :       }
     657           5 :       i++;
     658             :     }
     659             :   }
     660           3 :   PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_A],&A));
     661           3 :   PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_B],&B));
     662           3 :   PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_Q],&Q));
     663           3 :   PetscCall(DSRestoreArrayReal(ds,DS_MAT_T,&T));
     664           3 :   PetscCall(DSRestoreArrayReal(ds,DS_MAT_D,&D));
     665           3 :   PetscFunctionReturn(PETSC_SUCCESS);
     666             : }
     667             : 
     668        2751 : static PetscErrorCode DSSolve_GHIEP_QR_II(DS ds,PetscScalar *wr,PetscScalar *wi)
     669             : {
     670        2751 :   PetscInt          i,off;
     671        2751 :   PetscBLASInt      n1,ld,one=1,info,lwork;
     672        2751 :   const PetscScalar *A,*B;
     673        2751 :   PetscScalar       *H,*Q;
     674        2751 :   PetscReal         *d,*e,*s;
     675             : #if defined(PETSC_USE_COMPLEX)
     676             :   PetscInt          j;
     677             : #endif
     678             : 
     679        2751 :   PetscFunctionBegin;
     680             : #if !defined(PETSC_USE_COMPLEX)
     681        2751 :   PetscAssertPointer(wi,3);
     682             : #endif
     683        2751 :   PetscCall(PetscBLASIntCast(ds->n-ds->l,&n1));
     684        2751 :   PetscCall(PetscBLASIntCast(ds->ld,&ld));
     685        2751 :   off = ds->l + ds->l*ld;
     686        2751 :   PetscCall(MatDenseGetArrayRead(ds->omat[DS_MAT_A],&A));
     687        2751 :   PetscCall(MatDenseGetArrayRead(ds->omat[DS_MAT_B],&B));
     688        2751 :   PetscCall(DSGetArrayReal(ds,DS_MAT_T,&d));
     689        2751 :   PetscCall(DSGetArrayReal(ds,DS_MAT_D,&s));
     690        2751 :   e = d + ld;
     691             : #if defined(PETSC_USE_DEBUG)
     692             :   /* Check signature */
     693       90684 :   for (i=0;i<ds->n;i++) {
     694       87933 :     PetscReal de = (ds->compact)?s[i]:PetscRealPart(B[i*ld+i]);
     695       87933 :     PetscCheck(de==1.0 || de==-1.0,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Diagonal elements of the signature matrix must be 1 or -1");
     696             :   }
     697             : #endif
     698             : 
     699             :   /* Quick return if possible */
     700        2751 :   if (n1 == 1) {
     701           1 :     PetscCall(MatDenseGetArray(ds->omat[DS_MAT_Q],&Q));
     702           6 :     for (i=0;i<=ds->l;i++) Q[i+i*ld] = 1.0;
     703           1 :     PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_Q],&Q));
     704           1 :     PetscCall(DSGHIEPComplexEigs(ds,0,ds->l,wr,wi));
     705           1 :     if (!ds->compact) {
     706           0 :       d[ds->l] = PetscRealPart(A[off]);
     707           0 :       s[ds->l] = PetscRealPart(B[off]);
     708             :     }
     709           1 :     PetscCall(MatDenseRestoreArrayRead(ds->omat[DS_MAT_A],&A));
     710           1 :     PetscCall(MatDenseRestoreArrayRead(ds->omat[DS_MAT_B],&B));
     711           1 :     wr[ds->l] = d[ds->l]/s[ds->l];
     712           1 :     if (wi) wi[ds->l] = 0.0;
     713           1 :     PetscCall(DSRestoreArrayReal(ds,DS_MAT_T,&d));
     714           1 :     PetscCall(DSRestoreArrayReal(ds,DS_MAT_D,&s));
     715           1 :     PetscFunctionReturn(PETSC_SUCCESS);
     716             :   }
     717             : 
     718        2750 :   PetscCall(DSAllocateWork_Private(ds,ld*ld,2*ld,ld*2));
     719        2750 :   lwork = ld*ld;
     720             : 
     721             :   /* Reduce to pseudotriadiagonal form */
     722        2750 :   PetscCall(DSIntermediate_GHIEP(ds));
     723             : 
     724             :   /* Compute Eigenvalues (QR) */
     725        2750 :   PetscCall(DSAllocateMat_Private(ds,DS_MAT_W));
     726        2750 :   PetscCall(MatDenseGetArrayWrite(ds->omat[DS_MAT_W],&H));
     727        2750 :   if (ds->compact) {
     728        2748 :     H[off]    = d[ds->l]*s[ds->l];
     729        2748 :     H[off+ld] = e[ds->l]*s[ds->l];
     730       83367 :     for (i=ds->l+1;i<ds->n-1;i++) {
     731       80619 :       H[i+(i-1)*ld] = e[i-1]*s[i];
     732       80619 :       H[i+i*ld]     = d[i]*s[i];
     733       80619 :       H[i+(i+1)*ld] = e[i]*s[i];
     734             :     }
     735        2748 :     H[ds->n-1+(ds->n-2)*ld] = e[ds->n-2]*s[ds->n-1];
     736        2748 :     H[ds->n-1+(ds->n-1)*ld] = d[ds->n-1]*s[ds->n-1];
     737             :   } else {
     738           2 :     s[ds->l]  = PetscRealPart(B[off]);
     739           2 :     H[off]    = A[off]*s[ds->l];
     740           2 :     H[off+ld] = A[off+ld]*s[ds->l];
     741          18 :     for (i=ds->l+1;i<ds->n-1;i++) {
     742          16 :       s[i] = PetscRealPart(B[i+i*ld]);
     743          16 :       H[i+(i-1)*ld] = A[i+(i-1)*ld]*s[i];
     744          16 :       H[i+i*ld]     = A[i+i*ld]*s[i];
     745          16 :       H[i+(i+1)*ld] = A[i+(i+1)*ld]*s[i];
     746             :     }
     747           2 :     s[ds->n-1] = PetscRealPart(B[ds->n-1+(ds->n-1)*ld]);
     748           2 :     H[ds->n-1+(ds->n-2)*ld] = A[ds->n-1+(ds->n-2)*ld]*s[ds->n-1];
     749           2 :     H[ds->n-1+(ds->n-1)*ld] = A[ds->n-1+(ds->n-1)*ld]*s[ds->n-1];
     750             :   }
     751             : 
     752             : #if !defined(PETSC_USE_COMPLEX)
     753        2750 :   PetscCallBLAS("LAPACKhseqr",LAPACKhseqr_("E","N",&n1,&one,&n1,H+off,&ld,wr+ds->l,wi+ds->l,NULL,&ld,ds->work,&lwork,&info));
     754             : #else
     755             :   PetscCallBLAS("LAPACKhseqr",LAPACKhseqr_("E","N",&n1,&one,&n1,H+off,&ld,wr+ds->l,NULL,&ld,ds->work,&lwork,&info));
     756             :   for (i=ds->l;i<ds->n;i++) if (PetscAbsReal(PetscImaginaryPart(wr[i]))<10*PETSC_MACHINE_EPSILON) wr[i] = PetscRealPart(wr[i]);
     757             :   /* Sort to have consecutive conjugate pairs */
     758             :   for (i=ds->l;i<ds->n;i++) {
     759             :     j=i+1;
     760             :     while (j<ds->n && (PetscAbsScalar(wr[i]-PetscConj(wr[j]))>PetscAbsScalar(wr[i])*PETSC_SQRT_MACHINE_EPSILON)) j++;
     761             :     if (j==ds->n) {
     762             :       PetscCheck(PetscAbsReal(PetscImaginaryPart(wr[i]))<PetscAbsScalar(wr[i])*PETSC_SQRT_MACHINE_EPSILON,PETSC_COMM_SELF,PETSC_ERR_LIB,"Found complex without conjugate pair");
     763             :       wr[i] = PetscRealPart(wr[i]);
     764             :     } else { /* complex eigenvalue */
     765             :       wr[j] = wr[i+1];
     766             :       if (PetscImaginaryPart(wr[i])<0) wr[i] = PetscConj(wr[i]);
     767             :       wr[i+1] = PetscConj(wr[i]);
     768             :       i++;
     769             :     }
     770             :   }
     771             : #endif
     772        2750 :   SlepcCheckLapackInfo("hseqr",info);
     773        2750 :   PetscCall(MatDenseRestoreArrayWrite(ds->omat[DS_MAT_W],&H));
     774        2750 :   PetscCall(MatDenseRestoreArrayRead(ds->omat[DS_MAT_A],&A));
     775        2750 :   PetscCall(MatDenseRestoreArrayRead(ds->omat[DS_MAT_B],&B));
     776        2750 :   PetscCall(DSRestoreArrayReal(ds,DS_MAT_T,&d));
     777        2750 :   PetscCall(DSRestoreArrayReal(ds,DS_MAT_D,&s));
     778             : 
     779             :   /* Compute Eigenvectors with Inverse Iteration */
     780        2750 :   PetscCall(DSGHIEPInverseIteration(ds,wr,wi));
     781             : 
     782             :   /* Recover eigenvalues from diagonal */
     783        2750 :   PetscCall(DSGHIEPComplexEigs(ds,0,ds->l,wr,wi));
     784             : #if defined(PETSC_USE_COMPLEX)
     785             :   if (wi) {
     786             :     for (i=ds->l;i<ds->n;i++) wi[i] = 0.0;
     787             :   }
     788             : #endif
     789        2750 :   PetscFunctionReturn(PETSC_SUCCESS);
     790             : }
     791             : 
     792           4 : static PetscErrorCode DSSolve_GHIEP_QR(DS ds,PetscScalar *wr,PetscScalar *wi)
     793             : {
     794           4 :   PetscInt          i,j,off,nwu=0,n,lw,lwr,nwru=0;
     795           4 :   PetscBLASInt      n_,ld,info,lwork,ilo,ihi;
     796           4 :   const PetscScalar *A,*B;
     797           4 :   PetscScalar       *H,*Q,*X;
     798           4 :   PetscReal         *d,*s,*scale,nrm,*rcde,*rcdv;
     799             : #if defined(PETSC_USE_COMPLEX)
     800             :   PetscInt          k;
     801             : #endif
     802             : 
     803           4 :   PetscFunctionBegin;
     804             : #if !defined(PETSC_USE_COMPLEX)
     805           4 :   PetscAssertPointer(wi,3);
     806             : #endif
     807           4 :   n = ds->n-ds->l;
     808           4 :   PetscCall(PetscBLASIntCast(n,&n_));
     809           4 :   PetscCall(PetscBLASIntCast(ds->ld,&ld));
     810           4 :   off = ds->l + ds->l*ld;
     811           4 :   PetscCall(MatDenseGetArrayRead(ds->omat[DS_MAT_A],&A));
     812           4 :   PetscCall(MatDenseGetArrayRead(ds->omat[DS_MAT_B],&B));
     813           4 :   PetscCall(DSGetArrayReal(ds,DS_MAT_T,&d));
     814           4 :   PetscCall(DSGetArrayReal(ds,DS_MAT_D,&s));
     815             : #if defined(PETSC_USE_DEBUG)
     816             :   /* Check signature */
     817          39 :   for (i=0;i<ds->n;i++) {
     818          35 :     PetscReal de = (ds->compact)?s[i]:PetscRealPart(B[i*ld+i]);
     819          35 :     PetscCheck(de==1.0 || de==-1.0,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Diagonal elements of the signature matrix must be 1 or -1");
     820             :   }
     821             : #endif
     822             : 
     823             :   /* Quick return if possible */
     824           4 :   if (n_ == 1) {
     825           1 :     PetscCall(MatDenseGetArray(ds->omat[DS_MAT_Q],&Q));
     826           6 :     for (i=0;i<=ds->l;i++) Q[i+i*ld] = 1.0;
     827           1 :     PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_Q],&Q));
     828           1 :     PetscCall(DSGHIEPComplexEigs(ds,0,ds->l,wr,wi));
     829           1 :     if (!ds->compact) {
     830           0 :       d[ds->l] = PetscRealPart(A[off]);
     831           0 :       s[ds->l] = PetscRealPart(B[off]);
     832             :     }
     833           1 :     PetscCall(MatDenseRestoreArrayRead(ds->omat[DS_MAT_A],&A));
     834           1 :     PetscCall(MatDenseRestoreArrayRead(ds->omat[DS_MAT_B],&B));
     835           1 :     wr[ds->l] = d[ds->l]/s[ds->l];
     836           1 :     if (wi) wi[ds->l] = 0.0;
     837           1 :     PetscCall(DSRestoreArrayReal(ds,DS_MAT_T,&d));
     838           1 :     PetscCall(DSRestoreArrayReal(ds,DS_MAT_D,&s));
     839           1 :     PetscFunctionReturn(PETSC_SUCCESS);
     840             :   }
     841             : 
     842           3 :   lw = 14*ld+ld*ld;
     843           3 :   lwr = 7*ld;
     844           3 :   PetscCall(DSAllocateWork_Private(ds,lw,lwr,0));
     845           3 :   scale = ds->rwork+nwru;
     846           3 :   nwru += ld;
     847           3 :   rcde = ds->rwork+nwru;
     848           3 :   nwru += ld;
     849           3 :   rcdv = ds->rwork+nwru;
     850             : 
     851             :   /* Form pseudo-symmetric matrix */
     852           3 :   H =  ds->work+nwu;
     853           3 :   nwu += n*n;
     854           3 :   PetscCall(PetscArrayzero(H,n*n));
     855           3 :   if (ds->compact) {
     856           8 :     for (i=0;i<n-1;i++) {
     857           7 :       H[i+i*n]     = s[ds->l+i]*d[ds->l+i];
     858           7 :       H[i+1+i*n]   = s[ds->l+i+1]*d[ld+ds->l+i];
     859           7 :       H[i+(i+1)*n] = s[ds->l+i]*d[ld+ds->l+i];
     860             :     }
     861           1 :     H[n-1+(n-1)*n] = s[ds->l+n-1]*d[ds->l+n-1];
     862           4 :     for (i=0;i<ds->k-ds->l;i++) {
     863           3 :       H[ds->k-ds->l+i*n] = s[ds->k]*d[2*ld+ds->l+i];
     864           3 :       H[i+(ds->k-ds->l)*n] = s[i+ds->l]*d[2*ld+ds->l+i];
     865             :     }
     866             :   } else {
     867          22 :     for (j=0;j<n;j++) {
     868         220 :       for (i=0;i<n;i++) H[i+j*n] = B[off+i+i*ld]*A[off+i+j*ld];
     869             :     }
     870             :   }
     871             : 
     872             :   /* Compute eigenpairs */
     873           3 :   PetscCall(PetscBLASIntCast(lw-nwu,&lwork));
     874           3 :   PetscCall(DSAllocateMat_Private(ds,DS_MAT_X));
     875           3 :   PetscCall(MatDenseGetArrayWrite(ds->omat[DS_MAT_X],&X));
     876             : #if !defined(PETSC_USE_COMPLEX)
     877           3 :   PetscCallBLAS("LAPACKgeevx",LAPACKgeevx_("B","N","V","N",&n_,H,&n_,wr+ds->l,wi+ds->l,NULL,&ld,X+off,&ld,&ilo,&ihi,scale,&nrm,rcde,rcdv,ds->work+nwu,&lwork,NULL,&info));
     878             : #else
     879             :   PetscCallBLAS("LAPACKgeevx",LAPACKgeevx_("B","N","V","N",&n_,H,&n_,wr+ds->l,NULL,&ld,X+off,&ld,&ilo,&ihi,scale,&nrm,rcde,rcdv,ds->work+nwu,&lwork,ds->rwork+nwru,&info));
     880             : 
     881             :   /* Sort to have consecutive conjugate pairs
     882             :      Separate real and imaginary part of complex eigenvectors*/
     883             :   for (i=ds->l;i<ds->n;i++) {
     884             :     j=i+1;
     885             :     while (j<ds->n && (PetscAbsScalar(wr[i]-PetscConj(wr[j]))>PetscAbsScalar(wr[i])*PETSC_SQRT_MACHINE_EPSILON)) j++;
     886             :     if (j==ds->n) {
     887             :       PetscCheck(PetscAbsReal(PetscImaginaryPart(wr[i]))<PetscAbsScalar(wr[i])*PETSC_SQRT_MACHINE_EPSILON,PETSC_COMM_SELF,PETSC_ERR_LIB,"Found complex without conjugate pair");
     888             :       wr[i]=PetscRealPart(wr[i]); /* real eigenvalue */
     889             :       for (k=ds->l;k<ds->n;k++) {
     890             :         X[k+i*ds->ld] = PetscRealPart(X[k+i*ds->ld]);
     891             :       }
     892             :     } else { /* complex eigenvalue */
     893             :       if (j!=i+1) {
     894             :         wr[j] = wr[i+1];
     895             :         PetscCall(PetscArraycpy(X+j*ds->ld,X+(i+1)*ds->ld,ds->ld));
     896             :       }
     897             :       if (PetscImaginaryPart(wr[i])<0) {
     898             :         wr[i] = PetscConj(wr[i]);
     899             :         for (k=ds->l;k<ds->n;k++) {
     900             :           X[k+(i+1)*ds->ld] = -PetscImaginaryPart(X[k+i*ds->ld]);
     901             :           X[k+i*ds->ld] = PetscRealPart(X[k+i*ds->ld]);
     902             :         }
     903             :       } else {
     904             :         for (k=ds->l;k<ds->n;k++) {
     905             :           X[k+(i+1)*ds->ld] = PetscImaginaryPart(X[k+i*ds->ld]);
     906             :           X[k+i*ds->ld] = PetscRealPart(X[k+i*ds->ld]);
     907             :         }
     908             :       }
     909             :       wr[i+1] = PetscConj(wr[i]);
     910             :       i++;
     911             :     }
     912             :   }
     913             : #endif
     914           3 :   SlepcCheckLapackInfo("geevx",info);
     915           3 :   PetscCall(MatDenseRestoreArrayWrite(ds->omat[DS_MAT_X],&X));
     916           3 :   PetscCall(MatDenseRestoreArrayRead(ds->omat[DS_MAT_A],&A));
     917           3 :   PetscCall(MatDenseRestoreArrayRead(ds->omat[DS_MAT_B],&B));
     918           3 :   PetscCall(DSRestoreArrayReal(ds,DS_MAT_T,&d));
     919           3 :   PetscCall(DSRestoreArrayReal(ds,DS_MAT_D,&s));
     920             : 
     921             :   /* Compute real s-orthonormal basis */
     922           3 :   PetscCall(DSGHIEPOrthogEigenv(ds,DS_MAT_X,wr,wi,PETSC_FALSE));
     923             : 
     924             :   /* Recover eigenvalues from diagonal */
     925           3 :   PetscCall(DSGHIEPComplexEigs(ds,0,ds->l,wr,wi));
     926             : #if defined(PETSC_USE_COMPLEX)
     927             :   if (wi) {
     928             :     for (i=ds->l;i<ds->n;i++) wi[i] = 0.0;
     929             :   }
     930             : #endif
     931           3 :   PetscFunctionReturn(PETSC_SUCCESS);
     932             : }
     933             : 
     934        2697 : static PetscErrorCode DSGetTruncateSize_GHIEP(DS ds,PetscInt l,PetscInt n,PetscInt *k)
     935             : {
     936        2697 :   PetscReal *T;
     937             : 
     938        2697 :   PetscFunctionBegin;
     939        2697 :   PetscCall(DSGetArrayReal(ds,DS_MAT_T,&T));
     940        2697 :   if (T[l+(*k)-1+ds->ld] !=0.0) {
     941           8 :     if (l+(*k)<n-1) (*k)++;
     942           0 :     else (*k)--;
     943             :   }
     944        2697 :   PetscCall(DSRestoreArrayReal(ds,DS_MAT_T,&T));
     945        2697 :   PetscFunctionReturn(PETSC_SUCCESS);
     946             : }
     947             : 
     948        2747 : static PetscErrorCode DSTruncate_GHIEP(DS ds,PetscInt n,PetscBool trim)
     949             : {
     950        2747 :   PetscInt    i,ld=ds->ld,l=ds->l;
     951        2747 :   PetscScalar *A;
     952        2747 :   PetscReal   *T,*b,*r,*omega;
     953             : 
     954        2747 :   PetscFunctionBegin;
     955        2747 :   if (ds->compact) {
     956        2747 :     PetscCall(DSGetArrayReal(ds,DS_MAT_T,&T));
     957        2747 :     PetscCall(DSGetArrayReal(ds,DS_MAT_D,&omega));
     958             : #if defined(PETSC_USE_DEBUG)
     959             :     /* make sure diagonal 2x2 block is not broken */
     960        2747 :     PetscCheck(ds->state<DS_STATE_CONDENSED || n==0 || n==ds->n || T[n-1+ld]==0.0,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"The given size would break a 2x2 block, call DSGetTruncateSize() first");
     961             : #endif
     962             :   }
     963        2747 :   if (trim) {
     964          50 :     if (!ds->compact && ds->extrarow) {   /* clean extra row */
     965           0 :       PetscCall(MatDenseGetArray(ds->omat[DS_MAT_A],&A));
     966           0 :       for (i=l;i<ds->n;i++) A[ds->n+i*ld] = 0.0;
     967           0 :       PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_A],&A));
     968             :     }
     969          50 :     ds->l = 0;
     970          50 :     ds->k = 0;
     971          50 :     ds->n = n;
     972          50 :     ds->t = ds->n;   /* truncated length equal to the new dimension */
     973             :   } else {
     974        2697 :     if (!ds->compact && ds->extrarow && ds->k==ds->n) {
     975             :       /* copy entries of extra row to the new position, then clean last row */
     976           0 :       PetscCall(MatDenseGetArray(ds->omat[DS_MAT_A],&A));
     977           0 :       for (i=l;i<n;i++) A[n+i*ld] = A[ds->n+i*ld];
     978           0 :       for (i=l;i<ds->n;i++) A[ds->n+i*ld] = 0.0;
     979           0 :       PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_A],&A));
     980             :     }
     981        2697 :     if (ds->compact) {
     982        2697 :       b = T+ld;
     983        2697 :       r = T+2*ld;
     984        2697 :       b[n-1] = r[n-1];
     985        2697 :       b[n] = b[ds->n];
     986        2697 :       omega[n] = omega[ds->n];
     987             :     }
     988        2697 :     ds->k = (ds->extrarow)? n: 0;
     989        2697 :     ds->t = ds->n;   /* truncated length equal to previous dimension */
     990        2697 :     ds->n = n;
     991             :   }
     992        2747 :   if (ds->compact) {
     993        2747 :     PetscCall(DSRestoreArrayReal(ds,DS_MAT_T,&T));
     994        2747 :     PetscCall(DSRestoreArrayReal(ds,DS_MAT_D,&omega));
     995             :   }
     996        2747 :   PetscFunctionReturn(PETSC_SUCCESS);
     997             : }
     998             : 
     999             : #if !defined(PETSC_HAVE_MPIUNI)
    1000           2 : static PetscErrorCode DSSynchronize_GHIEP(DS ds,PetscScalar eigr[],PetscScalar eigi[])
    1001             : {
    1002           2 :   PetscScalar    *A,*B,*Q;
    1003           2 :   PetscReal      *T,*D;
    1004           2 :   PetscInt       ld=ds->ld,l=ds->l,k=0,kr=0;
    1005           2 :   PetscMPIInt    n,rank,off=0,size,ldn,ld3,ld_;
    1006             : 
    1007           2 :   PetscFunctionBegin;
    1008           2 :   if (ds->compact) kr = 4*ld;
    1009           0 :   else k = 2*(ds->n-l)*ld;
    1010           2 :   if (ds->state>DS_STATE_RAW) k += (ds->n-l)*ld;
    1011           2 :   if (eigr) k += (ds->n-l);
    1012           2 :   if (eigi) k += (ds->n-l);
    1013           2 :   PetscCall(DSAllocateWork_Private(ds,k+kr,0,0));
    1014           2 :   PetscCall(PetscMPIIntCast(k*sizeof(PetscScalar)+kr*sizeof(PetscReal),&size));
    1015           2 :   PetscCall(PetscMPIIntCast(ds->n-l,&n));
    1016           2 :   PetscCall(PetscMPIIntCast(ld*(ds->n-l),&ldn));
    1017           2 :   PetscCall(PetscMPIIntCast(ld*3,&ld3));
    1018           2 :   PetscCall(PetscMPIIntCast(ld,&ld_));
    1019           2 :   if (ds->compact) {
    1020           2 :     PetscCall(DSGetArrayReal(ds,DS_MAT_T,&T));
    1021           2 :     PetscCall(DSGetArrayReal(ds,DS_MAT_D,&D));
    1022             :   } else {
    1023           0 :     PetscCall(MatDenseGetArray(ds->omat[DS_MAT_A],&A));
    1024           0 :     PetscCall(MatDenseGetArray(ds->omat[DS_MAT_B],&B));
    1025             :   }
    1026           2 :   if (ds->state>DS_STATE_RAW) PetscCall(MatDenseGetArray(ds->omat[DS_MAT_Q],&Q));
    1027           2 :   PetscCallMPI(MPI_Comm_rank(PetscObjectComm((PetscObject)ds),&rank));
    1028           2 :   if (!rank) {
    1029           1 :     if (ds->compact) {
    1030           1 :       PetscCallMPI(MPI_Pack(T,ld3,MPIU_REAL,ds->work,size,&off,PetscObjectComm((PetscObject)ds)));
    1031           1 :       PetscCallMPI(MPI_Pack(D,ld_,MPIU_REAL,ds->work,size,&off,PetscObjectComm((PetscObject)ds)));
    1032             :     } else {
    1033           0 :       PetscCallMPI(MPI_Pack(A+l*ld,ldn,MPIU_SCALAR,ds->work,size,&off,PetscObjectComm((PetscObject)ds)));
    1034           0 :       PetscCallMPI(MPI_Pack(B+l*ld,ldn,MPIU_SCALAR,ds->work,size,&off,PetscObjectComm((PetscObject)ds)));
    1035             :     }
    1036           1 :     if (ds->state>DS_STATE_RAW) PetscCallMPI(MPI_Pack(Q+l*ld,ldn,MPIU_SCALAR,ds->work,size,&off,PetscObjectComm((PetscObject)ds)));
    1037           1 :     if (eigr) PetscCallMPI(MPI_Pack(eigr+l,n,MPIU_SCALAR,ds->work,size,&off,PetscObjectComm((PetscObject)ds)));
    1038             : #if !defined(PETSC_USE_COMPLEX)
    1039           1 :     if (eigi) PetscCallMPI(MPI_Pack(eigi+l,n,MPIU_SCALAR,ds->work,size,&off,PetscObjectComm((PetscObject)ds)));
    1040             : #endif
    1041             :   }
    1042           4 :   PetscCallMPI(MPI_Bcast(ds->work,size,MPI_BYTE,0,PetscObjectComm((PetscObject)ds)));
    1043           2 :   if (rank) {
    1044           1 :     if (ds->compact) {
    1045           1 :       PetscCallMPI(MPI_Unpack(ds->work,size,&off,T,ld3,MPIU_REAL,PetscObjectComm((PetscObject)ds)));
    1046           1 :       PetscCallMPI(MPI_Unpack(ds->work,size,&off,D,ld_,MPIU_REAL,PetscObjectComm((PetscObject)ds)));
    1047             :     } else {
    1048           0 :       PetscCallMPI(MPI_Unpack(ds->work,size,&off,A+l*ld,ldn,MPIU_SCALAR,PetscObjectComm((PetscObject)ds)));
    1049           0 :       PetscCallMPI(MPI_Unpack(ds->work,size,&off,B+l*ld,ldn,MPIU_SCALAR,PetscObjectComm((PetscObject)ds)));
    1050             :     }
    1051           1 :     if (ds->state>DS_STATE_RAW) PetscCallMPI(MPI_Unpack(ds->work,size,&off,Q+l*ld,ldn,MPIU_SCALAR,PetscObjectComm((PetscObject)ds)));
    1052           1 :     if (eigr) PetscCallMPI(MPI_Unpack(ds->work,size,&off,eigr+l,n,MPIU_SCALAR,PetscObjectComm((PetscObject)ds)));
    1053             : #if !defined(PETSC_USE_COMPLEX)
    1054           1 :     if (eigi) PetscCallMPI(MPI_Unpack(ds->work,size,&off,eigi+l,n,MPIU_SCALAR,PetscObjectComm((PetscObject)ds)));
    1055             : #endif
    1056             :   }
    1057           2 :   if (ds->compact) {
    1058           2 :     PetscCall(DSRestoreArrayReal(ds,DS_MAT_T,&T));
    1059           2 :     PetscCall(DSRestoreArrayReal(ds,DS_MAT_D,&D));
    1060             :   } else {
    1061           0 :     PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_A],&A));
    1062           0 :     PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_B],&B));
    1063             :   }
    1064           2 :   if (ds->state>DS_STATE_RAW) PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_Q],&Q));
    1065           2 :   PetscFunctionReturn(PETSC_SUCCESS);
    1066             : }
    1067             : #endif
    1068             : 
    1069        5543 : static PetscErrorCode DSHermitian_GHIEP(DS ds,DSMatType m,PetscBool *flg)
    1070             : {
    1071        5543 :   PetscFunctionBegin;
    1072        5543 :   if ((m==DS_MAT_A && !ds->extrarow) || m==DS_MAT_B) *flg = PETSC_TRUE;
    1073        5543 :   else *flg = PETSC_FALSE;
    1074        5543 :   PetscFunctionReturn(PETSC_SUCCESS);
    1075             : }
    1076             : 
    1077             : /*MC
    1078             :    DSGHIEP - Dense Generalized Hermitian Indefinite Eigenvalue Problem.
    1079             : 
    1080             :    Level: beginner
    1081             : 
    1082             :    Notes:
    1083             :    The problem is expressed as A*X = B*X*Lambda, where both A and B are
    1084             :    real symmetric (or complex Hermitian) and possibly indefinite. Lambda
    1085             :    is a diagonal matrix whose diagonal elements are the arguments of DSSolve().
    1086             :    After solve, A is overwritten with Lambda. Note that in the case of real
    1087             :    scalars, A is overwritten with a real representation of Lambda, i.e.,
    1088             :    complex conjugate eigenvalue pairs are stored as a 2x2 block in the
    1089             :    quasi-diagonal matrix.
    1090             : 
    1091             :    In the intermediate state A is reduced to tridiagonal form and B is
    1092             :    transformed into a signature matrix. In compact storage format, these
    1093             :    matrices are stored in T and D, respectively.
    1094             : 
    1095             :    Used DS matrices:
    1096             : +  DS_MAT_A - first problem matrix
    1097             : .  DS_MAT_B - second problem matrix
    1098             : .  DS_MAT_T - symmetric tridiagonal matrix of the reduced pencil
    1099             : .  DS_MAT_D - diagonal matrix (signature) of the reduced pencil
    1100             : -  DS_MAT_Q - pseudo-orthogonal transformation that reduces (A,B) to
    1101             :    tridiagonal-diagonal form (intermediate step) or a real basis of eigenvectors
    1102             : 
    1103             :    Implemented methods:
    1104             : +  0 - QR iteration plus inverse iteration for the eigenvectors
    1105             : .  1 - HZ iteration
    1106             : -  2 - QR iteration plus pseudo-orthogonalization for the eigenvectors
    1107             : 
    1108             :    References:
    1109             : .  1. - C. Campos and J. E. Roman, "Restarted Q-Arnoldi-type methods exploiting
    1110             :    symmetry in quadratic eigenvalue problems", BIT Numer. Math. 56(4):1213-1236, 2016.
    1111             : 
    1112             : .seealso: DSCreate(), DSSetType(), DSType
    1113             : M*/
    1114          48 : SLEPC_EXTERN PetscErrorCode DSCreate_GHIEP(DS ds)
    1115             : {
    1116          48 :   PetscFunctionBegin;
    1117          48 :   ds->ops->allocate        = DSAllocate_GHIEP;
    1118          48 :   ds->ops->view            = DSView_GHIEP;
    1119          48 :   ds->ops->vectors         = DSVectors_GHIEP;
    1120          48 :   ds->ops->solve[0]        = DSSolve_GHIEP_QR_II;
    1121          48 :   ds->ops->solve[1]        = DSSolve_GHIEP_HZ;
    1122          48 :   ds->ops->solve[2]        = DSSolve_GHIEP_QR;
    1123          48 :   ds->ops->sort            = DSSort_GHIEP;
    1124             : #if !defined(PETSC_HAVE_MPIUNI)
    1125          48 :   ds->ops->synchronize     = DSSynchronize_GHIEP;
    1126             : #endif
    1127          48 :   ds->ops->gettruncatesize = DSGetTruncateSize_GHIEP;
    1128          48 :   ds->ops->truncate        = DSTruncate_GHIEP;
    1129          48 :   ds->ops->update          = DSUpdateExtraRow_GHIEP;
    1130          48 :   ds->ops->hermitian       = DSHermitian_GHIEP;
    1131          48 :   PetscFunctionReturn(PETSC_SUCCESS);
    1132             : }

Generated by: LCOV version 1.14