Actual source code: dsnep.c
slepc-main 2024-12-17
1: /*
2: - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
3: SLEPc - Scalable Library for Eigenvalue Problem Computations
4: Copyright (c) 2002-, Universitat Politecnica de Valencia, Spain
6: This file is part of SLEPc.
7: SLEPc is distributed under a 2-clause BSD license (see LICENSE).
8: - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
9: */
11: #include <slepc/private/dsimpl.h>
12: #include <slepcblaslapack.h>
14: typedef struct {
15: PetscInt nf; /* number of functions in f[] */
16: FN f[DS_NUM_EXTRA]; /* functions defining the nonlinear operator */
17: PetscInt max_mid; /* maximum minimality index */
18: PetscInt nnod; /* number of nodes for quadrature rules */
19: PetscInt spls; /* number of sampling columns for quadrature rules */
20: PetscInt Nit; /* number of refinement iterations */
21: PetscReal rtol; /* tolerance of Newton refinement */
22: RG rg; /* region for contour integral */
23: PetscLayout map; /* used to distribute work among MPI processes */
24: void *computematrixctx;
25: DSNEPMatrixFunctionFn *computematrix;
26: } DS_NEP;
28: /*
29: DSNEPComputeMatrix - Build the matrix associated with a nonlinear operator
30: T(lambda) or its derivative T'(lambda), given the parameter lambda, where
31: T(lambda) = sum_i E_i*f_i(lambda). The result is written in mat.
32: */
33: static PetscErrorCode DSNEPComputeMatrix(DS ds,PetscScalar lambda,PetscBool deriv,DSMatType mat)
34: {
35: DS_NEP *ctx = (DS_NEP*)ds->data;
36: PetscScalar *T,alpha;
37: const PetscScalar *E;
38: PetscInt i,ld,n;
39: PetscBLASInt k,inc=1;
41: PetscFunctionBegin;
42: PetscCall(PetscLogEventBegin(DS_Other,ds,0,0,0));
43: if (ctx->computematrix) PetscCall((*ctx->computematrix)(ds,lambda,deriv,mat,ctx->computematrixctx));
44: else {
45: PetscCall(DSGetDimensions(ds,&n,NULL,NULL,NULL));
46: PetscCall(DSGetLeadingDimension(ds,&ld));
47: PetscCall(PetscBLASIntCast(ld*n,&k));
48: PetscCall(MatDenseGetArray(ds->omat[mat],&T));
49: PetscCall(PetscArrayzero(T,k));
50: for (i=0;i<ctx->nf;i++) {
51: if (deriv) PetscCall(FNEvaluateDerivative(ctx->f[i],lambda,&alpha));
52: else PetscCall(FNEvaluateFunction(ctx->f[i],lambda,&alpha));
53: PetscCall(MatDenseGetArrayRead(ds->omat[DSMatExtra[i]],&E));
54: PetscCallBLAS("BLASaxpy",BLASaxpy_(&k,&alpha,E,&inc,T,&inc));
55: PetscCall(MatDenseRestoreArrayRead(ds->omat[DSMatExtra[i]],&E));
56: }
57: PetscCall(MatDenseRestoreArray(ds->omat[mat],&T));
58: }
59: PetscCall(PetscLogEventEnd(DS_Other,ds,0,0,0));
60: PetscFunctionReturn(PETSC_SUCCESS);
61: }
63: static PetscErrorCode DSAllocate_NEP(DS ds,PetscInt ld)
64: {
65: DS_NEP *ctx = (DS_NEP*)ds->data;
66: PetscInt i;
68: PetscFunctionBegin;
69: PetscCall(DSAllocateMat_Private(ds,DS_MAT_X));
70: for (i=0;i<ctx->nf;i++) PetscCall(DSAllocateMat_Private(ds,DSMatExtra[i]));
71: PetscCall(PetscFree(ds->perm));
72: PetscCall(PetscMalloc1(ld*ctx->max_mid,&ds->perm));
73: PetscFunctionReturn(PETSC_SUCCESS);
74: }
76: static PetscErrorCode DSView_NEP(DS ds,PetscViewer viewer)
77: {
78: DS_NEP *ctx = (DS_NEP*)ds->data;
79: PetscViewerFormat format;
80: PetscInt i;
81: const char *methodname[] = {
82: "Successive Linear Problems",
83: "Contour Integral"
84: };
85: const int nmeth=PETSC_STATIC_ARRAY_LENGTH(methodname);
87: PetscFunctionBegin;
88: PetscCall(PetscViewerGetFormat(viewer,&format));
89: if (format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) {
90: if (ds->method<nmeth) PetscCall(PetscViewerASCIIPrintf(viewer,"solving the problem with: %s\n",methodname[ds->method]));
91: #if defined(PETSC_USE_COMPLEX)
92: if (ds->method==1) { /* contour integral method */
93: PetscCall(PetscViewerASCIIPrintf(viewer,"number of integration points: %" PetscInt_FMT "\n",ctx->nnod));
94: PetscCall(PetscViewerASCIIPrintf(viewer,"maximum minimality index: %" PetscInt_FMT "\n",ctx->max_mid));
95: if (ctx->spls) PetscCall(PetscViewerASCIIPrintf(viewer,"number of sampling columns for quadrature: %" PetscInt_FMT "\n",ctx->spls));
96: if (ctx->Nit) PetscCall(PetscViewerASCIIPrintf(viewer,"doing iterative refinement (%" PetscInt_FMT " its, tolerance %g)\n",ctx->Nit,(double)ctx->rtol));
97: PetscCall(RGView(ctx->rg,viewer));
98: }
99: #endif
100: if (format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscCall(PetscViewerASCIIPrintf(viewer,"number of functions: %" PetscInt_FMT "\n",ctx->nf));
101: PetscFunctionReturn(PETSC_SUCCESS);
102: }
103: for (i=0;i<ctx->nf;i++) {
104: PetscCall(FNView(ctx->f[i],viewer));
105: PetscCall(DSViewMat(ds,viewer,DSMatExtra[i]));
106: }
107: if (ds->state>DS_STATE_INTERMEDIATE) PetscCall(DSViewMat(ds,viewer,DS_MAT_X));
108: PetscFunctionReturn(PETSC_SUCCESS);
109: }
111: static PetscErrorCode DSVectors_NEP(DS ds,DSMatType mat,PetscInt *j,PetscReal *rnorm)
112: {
113: PetscFunctionBegin;
114: PetscCheck(!rnorm,PetscObjectComm((PetscObject)ds),PETSC_ERR_SUP,"Not implemented yet");
115: switch (mat) {
116: case DS_MAT_X:
117: break;
118: case DS_MAT_Y:
119: SETERRQ(PetscObjectComm((PetscObject)ds),PETSC_ERR_SUP,"Not implemented yet");
120: default:
121: SETERRQ(PetscObjectComm((PetscObject)ds),PETSC_ERR_ARG_OUTOFRANGE,"Invalid mat parameter");
122: }
123: PetscFunctionReturn(PETSC_SUCCESS);
124: }
126: static PetscErrorCode DSSort_NEP(DS ds,PetscScalar *wr,PetscScalar *wi,PetscScalar *rr,PetscScalar *ri,PetscInt *dummy)
127: {
128: DS_NEP *ctx = (DS_NEP*)ds->data;
129: PetscInt n,l,i,*perm,lds;
130: PetscScalar *Q;
132: PetscFunctionBegin;
133: if (!ds->sc) PetscFunctionReturn(PETSC_SUCCESS);
134: if (!ds->method) PetscFunctionReturn(PETSC_SUCCESS); /* SLP computes just one eigenvalue */
135: n = ds->n*ctx->max_mid;
136: lds = ds->ld*ctx->max_mid;
137: l = ds->l;
138: perm = ds->perm;
139: for (i=0;i<n;i++) perm[i] = i;
140: if (rr) PetscCall(DSSortEigenvalues_Private(ds,rr,ri,perm,PETSC_FALSE));
141: else PetscCall(DSSortEigenvalues_Private(ds,wr,NULL,perm,PETSC_FALSE));
142: PetscCall(MatDenseGetArray(ds->omat[DS_MAT_Q],&Q));
143: for (i=l;i<ds->t;i++) Q[i+i*lds] = wr[perm[i]];
144: for (i=l;i<ds->t;i++) wr[i] = Q[i+i*lds];
145: PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_Q],&Q));
146: /* n != ds->n */
147: PetscCall(DSPermuteColumns_Private(ds,0,ds->t,ds->n,DS_MAT_X,perm));
148: PetscFunctionReturn(PETSC_SUCCESS);
149: }
151: #if defined(SLEPC_MISSING_LAPACK_GGEV3)
152: #define LAPGEEV "ggev"
153: #else
154: #define LAPGEEV "ggev3"
155: #endif
157: static PetscErrorCode DSSolve_NEP_SLP(DS ds,PetscScalar *wr,PetscScalar *wi)
158: {
159: PetscScalar *A,*B,*W,*X,*work,*alpha,*beta,a;
160: PetscScalar sigma,lambda,mu,re,re2,sone=1.0,szero=0.0;
161: PetscBLASInt info,n,ld,lwork,one=1,zero=0;
162: PetscInt it,pos,j,maxit=100,result;
163: PetscReal norm,tol,done=1.0;
164: #if !defined(PETSC_USE_COMPLEX)
165: PetscReal *alphai,im,im2;
166: #endif
168: PetscFunctionBegin;
169: PetscCall(PetscBLASIntCast(ds->n,&n));
170: PetscCall(PetscBLASIntCast(ds->ld,&ld));
171: PetscCall(DSAllocateMat_Private(ds,DS_MAT_A));
172: PetscCall(DSAllocateMat_Private(ds,DS_MAT_B));
173: PetscCall(DSAllocateMat_Private(ds,DS_MAT_W));
174: PetscCall(MatDenseGetArray(ds->omat[DS_MAT_A],&A));
175: PetscCall(MatDenseGetArray(ds->omat[DS_MAT_B],&B));
176: PetscCall(MatDenseGetArray(ds->omat[DS_MAT_W],&W));
177: PetscCall(MatDenseGetArray(ds->omat[DS_MAT_X],&X));
179: /* workspace query and memory allocation */
180: lwork = -1;
181: #if defined(PETSC_USE_COMPLEX)
182: PetscCallBLAS("LAPACK" LAPGEEV,LAPACKggevalt_("N","V",&n,A,&ld,B,&ld,NULL,NULL,NULL,&ld,W,&ld,&a,&lwork,NULL,&info));
183: PetscCall(PetscBLASIntCast((PetscInt)PetscRealPart(a),&lwork));
184: PetscCall(DSAllocateWork_Private(ds,lwork+2*ds->n,8*ds->n,0));
185: alpha = ds->work;
186: beta = ds->work + ds->n;
187: work = ds->work + 2*ds->n;
188: #else
189: PetscCallBLAS("LAPACK" LAPGEEV,LAPACKggevalt_("N","V",&n,A,&ld,B,&ld,NULL,NULL,NULL,NULL,&ld,W,&ld,&a,&lwork,&info));
190: PetscCall(PetscBLASIntCast((PetscInt)a,&lwork));
191: PetscCall(DSAllocateWork_Private(ds,lwork+3*ds->n,0,0));
192: alpha = ds->work;
193: beta = ds->work + ds->n;
194: alphai = ds->work + 2*ds->n;
195: work = ds->work + 3*ds->n;
196: #endif
198: sigma = 0.0;
199: if (ds->sc->comparison==SlepcCompareTargetMagnitude || ds->sc->comparison==SlepcCompareTargetReal) sigma = *(PetscScalar*)ds->sc->comparisonctx;
200: lambda = sigma;
201: tol = n*PETSC_MACHINE_EPSILON/PetscSqrtReal(PETSC_SQRT_MACHINE_EPSILON);
203: for (it=0;it<maxit;it++) {
205: /* evaluate T and T' */
206: PetscCall(DSNEPComputeMatrix(ds,lambda,PETSC_FALSE,DS_MAT_A));
207: if (it) {
208: PetscCallBLAS("BLASgemv",BLASgemv_("N",&n,&n,&sone,A,&ld,X,&one,&szero,X+ld,&one));
209: norm = BLASnrm2_(&n,X+ld,&one);
210: if (norm/PetscAbsScalar(lambda)<=tol) break;
211: }
212: PetscCall(DSNEPComputeMatrix(ds,lambda,PETSC_TRUE,DS_MAT_B));
214: /* compute eigenvalue correction mu and eigenvector u */
215: #if defined(PETSC_USE_COMPLEX)
216: PetscCallBLAS("LAPACK" LAPGEEV,LAPACKggevalt_("N","V",&n,A,&ld,B,&ld,alpha,beta,NULL,&ld,W,&ld,work,&lwork,ds->rwork,&info));
217: #else
218: PetscCallBLAS("LAPACK" LAPGEEV,LAPACKggevalt_("N","V",&n,A,&ld,B,&ld,alpha,alphai,beta,NULL,&ld,W,&ld,work,&lwork,&info));
219: #endif
220: SlepcCheckLapackInfo(LAPGEEV,info);
222: /* find smallest eigenvalue */
223: j = 0;
224: if (beta[j]==0.0) re = (PetscRealPart(alpha[j])>0.0)? PETSC_MAX_REAL: PETSC_MIN_REAL;
225: else re = alpha[j]/beta[j];
226: #if !defined(PETSC_USE_COMPLEX)
227: if (beta[j]==0.0) im = (alphai[j]>0.0)? PETSC_MAX_REAL: PETSC_MIN_REAL;
228: else im = alphai[j]/beta[j];
229: #endif
230: pos = 0;
231: for (j=1;j<n;j++) {
232: if (beta[j]==0.0) re2 = (PetscRealPart(alpha[j])>0.0)? PETSC_MAX_REAL: PETSC_MIN_REAL;
233: else re2 = alpha[j]/beta[j];
234: #if !defined(PETSC_USE_COMPLEX)
235: if (beta[j]==0.0) im2 = (alphai[j]>0.0)? PETSC_MAX_REAL: PETSC_MIN_REAL;
236: else im2 = alphai[j]/beta[j];
237: PetscCall(SlepcCompareSmallestMagnitude(re,im,re2,im2,&result,NULL));
238: #else
239: PetscCall(SlepcCompareSmallestMagnitude(re,0.0,re2,0.0,&result,NULL));
240: #endif
241: if (result > 0) {
242: re = re2;
243: #if !defined(PETSC_USE_COMPLEX)
244: im = im2;
245: #endif
246: pos = j;
247: }
248: }
250: #if !defined(PETSC_USE_COMPLEX)
251: PetscCheck(im==0.0,PETSC_COMM_SELF,PETSC_ERR_SUP,"DSNEP found a complex eigenvalue; try rerunning with complex scalars");
252: #endif
253: mu = alpha[pos]/beta[pos];
254: PetscCall(PetscArraycpy(X,W+pos*ld,n));
255: norm = BLASnrm2_(&n,X,&one);
256: PetscCallBLAS("LAPACKlascl",LAPACKlascl_("G",&zero,&zero,&norm,&done,&n,&one,X,&n,&info));
257: SlepcCheckLapackInfo("lascl",info);
259: /* correct eigenvalue approximation */
260: lambda = lambda - mu;
261: }
262: PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_A],&A));
263: PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_B],&B));
264: PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_W],&W));
265: PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_X],&X));
267: PetscCheck(it<maxit,PETSC_COMM_SELF,PETSC_ERR_CONV_FAILED,"DSNEP did not converge");
268: ds->t = 1;
269: wr[0] = lambda;
270: if (wi) wi[0] = 0.0;
271: PetscFunctionReturn(PETSC_SUCCESS);
272: }
274: #if defined(PETSC_USE_COMPLEX)
275: /*
276: Newton refinement for eigenpairs computed with contour integral.
277: k - number of eigenpairs to refine
278: wr - eigenvalues (eigenvectors are stored in DS_MAT_X)
279: */
280: static PetscErrorCode DSNEPNewtonRefine(DS ds,PetscInt k,PetscScalar *wr)
281: {
282: DS_NEP *ctx = (DS_NEP*)ds->data;
283: PetscScalar *X,*W,*U,*R,sone=1.0,szero=0.0;
284: PetscReal norm;
285: PetscInt i,j,ii,nwu=0,*p,jstart=0,jend=k;
286: const PetscInt *range;
287: PetscBLASInt n,*perm,info,ld,one=1,n1;
288: PetscMPIInt len,size,root;
289: PetscLayout map;
291: PetscFunctionBegin;
292: PetscCall(MatDenseGetArray(ds->omat[DS_MAT_X],&X));
293: PetscCall(PetscBLASIntCast(ds->n,&n));
294: PetscCall(PetscBLASIntCast(ds->ld,&ld));
295: n1 = n+1;
296: p = ds->perm;
297: PetscCall(PetscArrayzero(p,k));
298: PetscCall(DSAllocateWork_Private(ds,(n+2)*(n+1),0,n+1));
299: U = ds->work+nwu; nwu += (n+1)*(n+1);
300: R = ds->work+nwu; /*nwu += n+1;*/
301: perm = ds->iwork;
302: if (ds->pmode==DS_PARALLEL_DISTRIBUTED) {
303: PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)ds),PETSC_DECIDE,k,1,&map));
304: PetscCall(PetscLayoutGetRange(map,&jstart,&jend));
305: }
306: for (ii=0;ii<ctx->Nit;ii++) {
307: for (j=jstart;j<jend;j++) {
308: if (p[j]<2) {
309: PetscCall(DSNEPComputeMatrix(ds,wr[j],PETSC_FALSE,DS_MAT_W));
310: PetscCall(MatDenseGetArray(ds->omat[DS_MAT_W],&W));
311: PetscCallBLAS("BLASgemv",BLASgemv_("N",&n,&n,&sone,W,&ld,X+ld*j,&one,&szero,R,&one));
312: PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_W],&W));
313: norm = BLASnrm2_(&n,R,&one);
314: if (norm/PetscAbsScalar(wr[j]) > ctx->rtol) {
315: PetscCall(PetscInfo(NULL,"Refining eigenpair %" PetscInt_FMT ", residual=%g\n",j,(double)(norm/PetscAbsScalar(wr[j]))));
316: p[j] = 1;
317: R[n] = 0.0;
318: PetscCall(MatDenseGetArray(ds->omat[DS_MAT_W],&W));
319: for (i=0;i<n;i++) {
320: PetscCall(PetscArraycpy(U+i*n1,W+i*ld,n));
321: U[n+i*n1] = PetscConj(X[j*ld+i]);
322: }
323: PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_W],&W));
324: U[n+n*n1] = 0.0;
325: PetscCall(DSNEPComputeMatrix(ds,wr[j],PETSC_TRUE,DS_MAT_W));
326: PetscCall(MatDenseGetArray(ds->omat[DS_MAT_W],&W));
327: PetscCallBLAS("BLASgemv",BLASgemv_("N",&n,&n,&sone,W,&ld,X+ld*j,&one,&szero,U+n*(n+1),&one));
328: PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_W],&W));
329: /* solve system */
330: PetscCallBLAS("LAPACKgetrf",LAPACKgetrf_(&n1,&n1,U,&n1,perm,&info));
331: SlepcCheckLapackInfo("getrf",info);
332: PetscCallBLAS("LAPACKgetrs",LAPACKgetrs_("N",&n1,&one,U,&n1,perm,R,&n1,&info));
333: SlepcCheckLapackInfo("getrs",info);
334: wr[j] -= R[n];
335: for (i=0;i<n;i++) X[j*ld+i] -= R[i];
336: /* normalization */
337: norm = BLASnrm2_(&n,X+ld*j,&one);
338: for (i=0;i<n;i++) X[ld*j+i] /= norm;
339: } else p[j] = 2;
340: }
341: }
342: }
343: if (ds->pmode==DS_PARALLEL_DISTRIBUTED) { /* communicate results */
344: PetscCall(PetscMPIIntCast(k,&len));
345: PetscCallMPI(MPIU_Allreduce(MPI_IN_PLACE,p,len,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)ds)));
346: PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)ds),&size));
347: PetscCall(PetscLayoutGetRanges(map,&range));
348: for (j=0;j<k;j++) {
349: if (p[j]) { /* j-th eigenpair has been refined */
350: for (root=0;root<size;root++) if (range[root+1]>j) break;
351: PetscCall(PetscMPIIntCast(1,&len));
352: PetscCallMPI(MPI_Bcast(wr+j,len,MPIU_SCALAR,root,PetscObjectComm((PetscObject)ds)));
353: PetscCall(PetscMPIIntCast(n,&len));
354: PetscCallMPI(MPI_Bcast(X+ld*j,len,MPIU_SCALAR,root,PetscObjectComm((PetscObject)ds)));
355: }
356: }
357: PetscCall(PetscLayoutDestroy(&map));
358: }
359: PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_X],&X));
360: PetscFunctionReturn(PETSC_SUCCESS);
361: }
363: PetscErrorCode DSSolve_NEP_Contour(DS ds,PetscScalar *wr,PetscScalar *wi)
364: {
365: DS_NEP *ctx = (DS_NEP*)ds->data;
366: PetscScalar *alpha,*beta,*Q,*Z,*X,*U,*V,*W,*work,*Rc,*R,*w,*z,*zn,*S;
367: PetscScalar sone=1.0,szero=0.0,center,a;
368: PetscReal *rwork,norm,radius,vscale,rgscale,*sigma;
369: PetscBLASInt info,n,*perm,p,pp,ld,lwork,k_,rk_,colA,rowA,one=1;
370: PetscInt mid,lds,nnod=ctx->nnod,k,i,ii,jj,j,s,off,rk,nwu=0,nw,lrwork,*inside,kstart=0,kend=nnod;
371: PetscMPIInt len;
372: PetscBool isellipse;
373: PetscRandom rand;
375: PetscFunctionBegin;
376: PetscCheck(ctx->rg,PetscObjectComm((PetscObject)ds),PETSC_ERR_ORDER,"The contour solver requires a region passed with DSNEPSetRG()");
377: /* Contour parameters */
378: PetscCall(PetscObjectTypeCompare((PetscObject)ctx->rg,RGELLIPSE,&isellipse));
379: PetscCheck(isellipse,PetscObjectComm((PetscObject)ds),PETSC_ERR_SUP,"Region must be Ellipse");
380: PetscCall(RGEllipseGetParameters(ctx->rg,¢er,&radius,&vscale));
381: PetscCall(RGGetScale(ctx->rg,&rgscale));
382: if (ds->pmode==DS_PARALLEL_DISTRIBUTED) {
383: if (!ctx->map) PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)ds),PETSC_DECIDE,ctx->nnod,1,&ctx->map));
384: PetscCall(PetscLayoutGetRange(ctx->map,&kstart,&kend));
385: }
387: PetscCall(DSAllocateMat_Private(ds,DS_MAT_W)); /* size n */
388: PetscCall(DSAllocateMat_Private(ds,DS_MAT_Q)); /* size mid*n */
389: PetscCall(DSAllocateMat_Private(ds,DS_MAT_Z)); /* size mid*n */
390: PetscCall(DSAllocateMat_Private(ds,DS_MAT_U)); /* size mid*n */
391: PetscCall(DSAllocateMat_Private(ds,DS_MAT_V)); /* size mid*n */
392: PetscCall(MatDenseGetArray(ds->omat[DS_MAT_Q],&Q));
393: PetscCall(MatDenseGetArray(ds->omat[DS_MAT_Z],&Z));
394: PetscCall(MatDenseGetArray(ds->omat[DS_MAT_U],&U));
395: PetscCall(MatDenseGetArray(ds->omat[DS_MAT_V],&V));
396: mid = ctx->max_mid;
397: PetscCall(PetscBLASIntCast(ds->n,&n));
398: p = n; /* maximum number of columns for the probing matrix */
399: PetscCall(PetscBLASIntCast(ds->ld,&ld));
400: PetscCall(PetscBLASIntCast(mid*n,&rowA));
401: nw = 2*n*(p+mid)+3*nnod+2*mid*n*p;
402: lrwork = 9*mid*n;
404: /* workspace query and memory allocation */
405: lwork = -1;
406: PetscCallBLAS("LAPACK" LAPGEEV,LAPACKggevalt_("N","V",&rowA,Q,&rowA,Z,&rowA,NULL,NULL,NULL,&ld,V,&rowA,&a,&lwork,NULL,&info));
407: PetscCall(PetscBLASIntCast((PetscInt)PetscRealPart(a),&lwork));
408: PetscCall(DSAllocateWork_Private(ds,lwork+nw,lrwork,n+1));
410: sigma = ds->rwork;
411: rwork = ds->rwork+mid*n;
412: perm = ds->iwork;
413: z = ds->work+nwu; nwu += nnod; /* quadrature points */
414: zn = ds->work+nwu; nwu += nnod; /* normalized quadrature points */
415: w = ds->work+nwu; nwu += nnod; /* quadrature weights */
416: Rc = ds->work+nwu; nwu += n*p;
417: R = ds->work+nwu; nwu += n*p;
418: alpha = ds->work+nwu; nwu += mid*n;
419: beta = ds->work+nwu; nwu += mid*n;
420: S = ds->work+nwu; nwu += 2*mid*n*p;
421: work = ds->work+nwu;
423: /* Compute quadrature parameters */
424: PetscCall(RGComputeQuadrature(ctx->rg,RG_QUADRULE_TRAPEZOIDAL,nnod,z,zn,w));
426: /* Set random matrix */
427: PetscCall(PetscRandomCreate(PetscObjectComm((PetscObject)ds),&rand));
428: PetscCall(PetscRandomSetSeed(rand,0x12345678));
429: PetscCall(PetscRandomSeed(rand));
430: for (j=0;j<p;j++)
431: for (i=0;i<n;i++) PetscCall(PetscRandomGetValue(rand,Rc+i+j*n));
432: PetscCall(PetscArrayzero(S,2*mid*n*p));
433: /* Loop of integration points */
434: for (k=kstart;k<kend;k++) {
435: PetscCall(PetscInfo(NULL,"Solving integration point %" PetscInt_FMT "\n",k));
436: PetscCall(PetscArraycpy(R,Rc,p*n));
437: PetscCall(DSNEPComputeMatrix(ds,z[k],PETSC_FALSE,DS_MAT_W));
439: /* LU factorization */
440: PetscCall(MatDenseGetArray(ds->omat[DS_MAT_W],&W));
441: PetscCallBLAS("LAPACKgetrf",LAPACKgetrf_(&n,&n,W,&ld,perm,&info));
442: SlepcCheckLapackInfo("getrf",info);
443: PetscCallBLAS("LAPACKgetrs",LAPACKgetrs_("N",&n,&p,W,&ld,perm,R,&n,&info));
444: SlepcCheckLapackInfo("getrs",info);
445: PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_W],&W));
447: /* Moments computation */
448: for (s=0;s<2*ctx->max_mid;s++) {
449: off = s*n*p;
450: for (j=0;j<p;j++)
451: for (i=0;i<n;i++) S[off+i+j*n] += w[k]*R[j*n+i];
452: w[k] *= zn[k];
453: }
454: }
456: if (ds->pmode==DS_PARALLEL_DISTRIBUTED) { /* compute final S via reduction */
457: PetscCall(PetscMPIIntCast(2*mid*n*p,&len));
458: PetscCallMPI(MPIU_Allreduce(MPI_IN_PLACE,S,len,MPIU_SCALAR,MPIU_SUM,PetscObjectComm((PetscObject)ds)));
459: }
460: PetscCall(PetscBLASIntCast(ctx->spls?PetscMin(ctx->spls,n):n,&p));
461: pp = p;
462: do {
463: p = pp;
464: PetscCall(PetscBLASIntCast(mid*p,&colA));
466: PetscCall(PetscInfo(ds,"Computing SVD of size %" PetscBLASInt_FMT "x%" PetscBLASInt_FMT "\n",rowA,colA));
467: for (jj=0;jj<mid;jj++) {
468: for (ii=0;ii<mid;ii++) {
469: off = jj*p*rowA+ii*n;
470: for (j=0;j<p;j++)
471: for (i=0;i<n;i++) Q[off+j*rowA+i] = S[((jj+ii)*n+j)*n+i];
472: }
473: }
474: PetscCallBLAS("LAPACKgesvd",LAPACKgesvd_("S","S",&rowA,&colA,Q,&rowA,sigma,U,&rowA,V,&colA,work,&lwork,rwork,&info));
475: SlepcCheckLapackInfo("gesvd",info);
477: rk = colA;
478: for (i=1;i<colA;i++) if (sigma[i]/sigma[0]<PETSC_MACHINE_EPSILON*1e4) {rk = i; break;}
479: if (rk<colA || p==n) break;
480: pp *= 2;
481: } while (pp<=n);
482: PetscCall(PetscInfo(ds,"Solving generalized eigenproblem of size %" PetscInt_FMT "\n",rk));
483: for (jj=0;jj<mid;jj++) {
484: for (ii=0;ii<mid;ii++) {
485: off = jj*p*rowA+ii*n;
486: for (j=0;j<p;j++)
487: for (i=0;i<n;i++) Q[off+j*rowA+i] = S[((jj+ii+1)*n+j)*n+i];
488: }
489: }
490: PetscCall(PetscBLASIntCast(rk,&rk_));
491: PetscCallBLAS("BLASgemm",BLASgemm_("N","C",&rowA,&rk_,&colA,&sone,Q,&rowA,V,&colA,&szero,Z,&rowA));
492: PetscCallBLAS("BLASgemm",BLASgemm_("C","N",&rk_,&rk_,&rowA,&sone,U,&rowA,Z,&rowA,&szero,Q,&rk_));
493: PetscCall(PetscArrayzero(Z,n*mid*n*mid));
494: for (j=0;j<rk;j++) Z[j+j*rk_] = sigma[j];
495: PetscCallBLAS("LAPACK" LAPGEEV,LAPACKggevalt_("N","V",&rk_,Q,&rk_,Z,&rk_,alpha,beta,NULL,&ld,V,&rk_,work,&lwork,rwork,&info));
496: SlepcCheckLapackInfo(LAPGEEV,info);
497: for (i=0;i<rk;i++) wr[i] = (center+radius*alpha[i]/beta[i])*rgscale;
498: PetscCall(PetscMalloc1(rk,&inside));
499: PetscCall(RGCheckInside(ctx->rg,rk,wr,wi,inside));
500: k=0;
501: for (i=0;i<rk;i++)
502: if (inside[i]==1) inside[k++] = i;
503: /* Discard values outside region */
504: lds = ld*mid;
505: PetscCall(PetscArrayzero(Q,lds*lds));
506: PetscCall(PetscArrayzero(Z,lds*lds));
507: for (i=0;i<k;i++) Q[i+i*lds] = (center*beta[inside[i]]+radius*alpha[inside[i]])*rgscale;
508: for (i=0;i<k;i++) Z[i+i*lds] = beta[inside[i]];
509: for (i=0;i<k;i++) wr[i] = Q[i+i*lds]/Z[i+i*lds];
510: for (j=0;j<k;j++) for (i=0;i<rk;i++) V[j*rk+i] = sigma[i]*V[inside[j]*rk+i];
511: PetscCall(PetscBLASIntCast(k,&k_));
512: PetscCall(MatDenseGetArray(ds->omat[DS_MAT_X],&X));
513: PetscCallBLAS("BLASgemm",BLASgemm_("N","N",&n,&k_,&rk_,&sone,U,&rowA,V,&rk_,&szero,X,&ld));
514: /* Normalize */
515: for (j=0;j<k;j++) {
516: norm = BLASnrm2_(&n,X+ld*j,&one);
517: for (i=0;i<n;i++) X[ld*j+i] /= norm;
518: }
519: PetscCall(PetscFree(inside));
520: PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_X],&X));
521: PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_Q],&Q));
522: PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_Z],&Z));
523: PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_U],&U));
524: PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_V],&V));
526: /* Newton refinement */
527: if (ctx->Nit) PetscCall(DSNEPNewtonRefine(ds,k,wr));
528: ds->t = k;
529: PetscCall(PetscRandomDestroy(&rand));
530: PetscFunctionReturn(PETSC_SUCCESS);
531: }
532: #endif
534: #if !defined(PETSC_HAVE_MPIUNI)
535: static PetscErrorCode DSSynchronize_NEP(DS ds,PetscScalar eigr[],PetscScalar eigi[])
536: {
537: DS_NEP *ctx = (DS_NEP*)ds->data;
538: PetscInt ld=ds->ld,k=0;
539: PetscMPIInt n,n2,rank,size,off=0;
540: PetscScalar *X;
542: PetscFunctionBegin;
543: if (!ds->method) { /* SLP */
544: if (ds->state>=DS_STATE_CONDENSED) k += ds->n;
545: if (eigr) k += 1;
546: if (eigi) k += 1;
547: PetscCall(PetscMPIIntCast(1,&n));
548: PetscCall(PetscMPIIntCast(ds->n,&n2));
549: } else { /* Contour */
550: if (ds->state>=DS_STATE_CONDENSED) k += ctx->max_mid*ds->n*ld;
551: if (eigr) k += ctx->max_mid*ds->n;
552: if (eigi) k += ctx->max_mid*ds->n;
553: PetscCall(PetscMPIIntCast(ctx->max_mid*ds->n,&n));
554: PetscCall(PetscMPIIntCast(ctx->max_mid*ds->n*ld,&n2));
555: }
556: PetscCall(DSAllocateWork_Private(ds,k,0,0));
557: PetscCall(PetscMPIIntCast(k*sizeof(PetscScalar),&size));
558: if (ds->state>=DS_STATE_CONDENSED) PetscCall(MatDenseGetArray(ds->omat[DS_MAT_X],&X));
559: PetscCallMPI(MPI_Comm_rank(PetscObjectComm((PetscObject)ds),&rank));
560: if (!rank) {
561: if (ds->state>=DS_STATE_CONDENSED) PetscCallMPI(MPI_Pack(X,n2,MPIU_SCALAR,ds->work,size,&off,PetscObjectComm((PetscObject)ds)));
562: if (eigr) PetscCallMPI(MPI_Pack(eigr,n,MPIU_SCALAR,ds->work,size,&off,PetscObjectComm((PetscObject)ds)));
563: #if !defined(PETSC_USE_COMPLEX)
564: if (eigi) PetscCallMPI(MPI_Pack(eigi,n,MPIU_SCALAR,ds->work,size,&off,PetscObjectComm((PetscObject)ds)));
565: #endif
566: }
567: PetscCallMPI(MPI_Bcast(ds->work,size,MPI_BYTE,0,PetscObjectComm((PetscObject)ds)));
568: if (rank) {
569: if (ds->state>=DS_STATE_CONDENSED) PetscCallMPI(MPI_Unpack(ds->work,size,&off,X,n2,MPIU_SCALAR,PetscObjectComm((PetscObject)ds)));
570: if (eigr) PetscCallMPI(MPI_Unpack(ds->work,size,&off,eigr,n,MPIU_SCALAR,PetscObjectComm((PetscObject)ds)));
571: #if !defined(PETSC_USE_COMPLEX)
572: if (eigi) PetscCallMPI(MPI_Unpack(ds->work,size,&off,eigi,n,MPIU_SCALAR,PetscObjectComm((PetscObject)ds)));
573: #endif
574: }
575: if (ds->state>=DS_STATE_CONDENSED) PetscCall(MatDenseRestoreArray(ds->omat[DS_MAT_X],&X));
576: PetscFunctionReturn(PETSC_SUCCESS);
577: }
578: #endif
580: static PetscErrorCode DSNEPSetFN_NEP(DS ds,PetscInt n,FN fn[])
581: {
582: DS_NEP *ctx = (DS_NEP*)ds->data;
583: PetscInt i;
585: PetscFunctionBegin;
586: PetscCheck(n>0,PetscObjectComm((PetscObject)ds),PETSC_ERR_ARG_OUTOFRANGE,"Must have one or more functions, you have %" PetscInt_FMT,n);
587: PetscCheck(n<=DS_NUM_EXTRA,PetscObjectComm((PetscObject)ds),PETSC_ERR_ARG_OUTOFRANGE,"Too many functions, you specified %" PetscInt_FMT " but the limit is %d",n,DS_NUM_EXTRA);
588: if (ds->ld) PetscCall(PetscInfo(ds,"DSNEPSetFN() called after DSAllocate()\n"));
589: for (i=0;i<n;i++) PetscCall(PetscObjectReference((PetscObject)fn[i]));
590: for (i=0;i<ctx->nf;i++) PetscCall(FNDestroy(&ctx->f[i]));
591: for (i=0;i<n;i++) ctx->f[i] = fn[i];
592: ctx->nf = n;
593: PetscFunctionReturn(PETSC_SUCCESS);
594: }
596: /*@
597: DSNEPSetFN - Sets a number of functions that define the nonlinear
598: eigenproblem.
600: Collective
602: Input Parameters:
603: + ds - the direct solver context
604: . n - number of functions
605: - fn - array of functions
607: Notes:
608: The nonlinear eigenproblem is defined in terms of the split nonlinear
609: operator T(lambda) = sum_i A_i*f_i(lambda).
611: This function must be called before DSAllocate(). Then DSAllocate()
612: will allocate an extra matrix A_i per each function, that can be
613: filled in the usual way.
615: Level: advanced
617: .seealso: DSNEPGetFN(), DSAllocate()
618: @*/
619: PetscErrorCode DSNEPSetFN(DS ds,PetscInt n,FN fn[])
620: {
621: PetscInt i;
623: PetscFunctionBegin;
626: PetscAssertPointer(fn,3);
627: for (i=0;i<n;i++) {
629: PetscCheckSameComm(ds,1,fn[i],3);
630: }
631: PetscTryMethod(ds,"DSNEPSetFN_C",(DS,PetscInt,FN[]),(ds,n,fn));
632: PetscFunctionReturn(PETSC_SUCCESS);
633: }
635: static PetscErrorCode DSNEPGetFN_NEP(DS ds,PetscInt k,FN *fn)
636: {
637: DS_NEP *ctx = (DS_NEP*)ds->data;
639: PetscFunctionBegin;
640: PetscCheck(k>=0 && k<ctx->nf,PetscObjectComm((PetscObject)ds),PETSC_ERR_ARG_OUTOFRANGE,"k must be between 0 and %" PetscInt_FMT,ctx->nf-1);
641: *fn = ctx->f[k];
642: PetscFunctionReturn(PETSC_SUCCESS);
643: }
645: /*@
646: DSNEPGetFN - Gets the functions associated with the nonlinear DS.
648: Not Collective
650: Input Parameters:
651: + ds - the direct solver context
652: - k - the index of the requested function (starting in 0)
654: Output Parameter:
655: . fn - the function
657: Level: advanced
659: .seealso: DSNEPSetFN()
660: @*/
661: PetscErrorCode DSNEPGetFN(DS ds,PetscInt k,FN *fn)
662: {
663: PetscFunctionBegin;
665: PetscAssertPointer(fn,3);
666: PetscUseMethod(ds,"DSNEPGetFN_C",(DS,PetscInt,FN*),(ds,k,fn));
667: PetscFunctionReturn(PETSC_SUCCESS);
668: }
670: static PetscErrorCode DSNEPGetNumFN_NEP(DS ds,PetscInt *n)
671: {
672: DS_NEP *ctx = (DS_NEP*)ds->data;
674: PetscFunctionBegin;
675: *n = ctx->nf;
676: PetscFunctionReturn(PETSC_SUCCESS);
677: }
679: /*@
680: DSNEPGetNumFN - Returns the number of functions stored internally by
681: the DS.
683: Not Collective
685: Input Parameter:
686: . ds - the direct solver context
688: Output Parameters:
689: . n - the number of functions passed in DSNEPSetFN()
691: Level: advanced
693: .seealso: DSNEPSetFN()
694: @*/
695: PetscErrorCode DSNEPGetNumFN(DS ds,PetscInt *n)
696: {
697: PetscFunctionBegin;
699: PetscAssertPointer(n,2);
700: PetscUseMethod(ds,"DSNEPGetNumFN_C",(DS,PetscInt*),(ds,n));
701: PetscFunctionReturn(PETSC_SUCCESS);
702: }
704: static PetscErrorCode DSNEPSetMinimality_NEP(DS ds,PetscInt n)
705: {
706: DS_NEP *ctx = (DS_NEP*)ds->data;
708: PetscFunctionBegin;
709: if (n == PETSC_DECIDE || n == PETSC_DEFAULT) ctx->max_mid = 4;
710: else {
711: PetscCheck(n>0,PetscObjectComm((PetscObject)ds),PETSC_ERR_ARG_OUTOFRANGE,"The minimality value must be > 0");
712: ctx->max_mid = n;
713: }
714: PetscFunctionReturn(PETSC_SUCCESS);
715: }
717: /*@
718: DSNEPSetMinimality - Sets the maximum minimality index used internally by
719: the DSNEP.
721: Logically Collective
723: Input Parameters:
724: + ds - the direct solver context
725: - n - the maximum minimality index
727: Options Database Key:
728: . -ds_nep_minimality <n> - sets the maximum minimality index
730: Notes:
731: The maximum minimality index is used only in the contour integral method,
732: and is related to the highest momemts used in the method. The default
733: value is 1, an larger value might give better accuracy in some cases, but
734: at a higher cost.
736: Level: advanced
738: .seealso: DSNEPGetMinimality()
739: @*/
740: PetscErrorCode DSNEPSetMinimality(DS ds,PetscInt n)
741: {
742: PetscFunctionBegin;
745: PetscTryMethod(ds,"DSNEPSetMinimality_C",(DS,PetscInt),(ds,n));
746: PetscFunctionReturn(PETSC_SUCCESS);
747: }
749: static PetscErrorCode DSNEPGetMinimality_NEP(DS ds,PetscInt *n)
750: {
751: DS_NEP *ctx = (DS_NEP*)ds->data;
753: PetscFunctionBegin;
754: *n = ctx->max_mid;
755: PetscFunctionReturn(PETSC_SUCCESS);
756: }
758: /*@
759: DSNEPGetMinimality - Returns the maximum minimality index used internally by
760: the DSNEP.
762: Not Collective
764: Input Parameter:
765: . ds - the direct solver context
767: Output Parameters:
768: . n - the maximum minimality index passed in DSNEPSetMinimality()
770: Level: advanced
772: .seealso: DSNEPSetMinimality()
773: @*/
774: PetscErrorCode DSNEPGetMinimality(DS ds,PetscInt *n)
775: {
776: PetscFunctionBegin;
778: PetscAssertPointer(n,2);
779: PetscUseMethod(ds,"DSNEPGetMinimality_C",(DS,PetscInt*),(ds,n));
780: PetscFunctionReturn(PETSC_SUCCESS);
781: }
783: static PetscErrorCode DSNEPSetRefine_NEP(DS ds,PetscReal tol,PetscInt its)
784: {
785: DS_NEP *ctx = (DS_NEP*)ds->data;
787: PetscFunctionBegin;
788: if (tol == (PetscReal)PETSC_DETERMINE) {
789: ctx->rtol = PETSC_MACHINE_EPSILON/PetscSqrtReal(PETSC_SQRT_MACHINE_EPSILON);
790: } else if (tol != (PetscReal)PETSC_CURRENT) {
791: PetscCheck(tol>0.0,PetscObjectComm((PetscObject)ds),PETSC_ERR_ARG_OUTOFRANGE,"The tolerance must be > 0");
792: ctx->rtol = tol;
793: }
794: if (its == PETSC_DETERMINE) {
795: ctx->Nit = 3;
796: } else if (its != PETSC_CURRENT) {
797: PetscCheck(its>=0,PetscObjectComm((PetscObject)ds),PETSC_ERR_ARG_OUTOFRANGE,"The number of iterations must be >= 0");
798: ctx->Nit = its;
799: }
800: PetscFunctionReturn(PETSC_SUCCESS);
801: }
803: /*@
804: DSNEPSetRefine - Sets the tolerance and the number of iterations of Newton iterative
805: refinement for eigenpairs.
807: Logically Collective
809: Input Parameters:
810: + ds - the direct solver context
811: . tol - the tolerance
812: - its - the number of iterations
814: Options Database Key:
815: + -ds_nep_refine_tol <tol> - sets the tolerance
816: - -ds_nep_refine_its <its> - sets the number of Newton iterations
818: Notes:
819: Iterative refinement of eigenpairs is currently used only in the contour
820: integral method.
822: Use PETSC_CURRENT to retain the current value of any of the parameters.
823: Use PETSC_DETERMINE for either argument to assign a default value computed
824: internally.
826: Level: advanced
828: .seealso: DSNEPGetRefine()
829: @*/
830: PetscErrorCode DSNEPSetRefine(DS ds,PetscReal tol,PetscInt its)
831: {
832: PetscFunctionBegin;
836: PetscTryMethod(ds,"DSNEPSetRefine_C",(DS,PetscReal,PetscInt),(ds,tol,its));
837: PetscFunctionReturn(PETSC_SUCCESS);
838: }
840: static PetscErrorCode DSNEPGetRefine_NEP(DS ds,PetscReal *tol,PetscInt *its)
841: {
842: DS_NEP *ctx = (DS_NEP*)ds->data;
844: PetscFunctionBegin;
845: if (tol) *tol = ctx->rtol;
846: if (its) *its = ctx->Nit;
847: PetscFunctionReturn(PETSC_SUCCESS);
848: }
850: /*@
851: DSNEPGetRefine - Returns the tolerance and the number of iterations of Newton iterative
852: refinement for eigenpairs.
854: Not Collective
856: Input Parameter:
857: . ds - the direct solver context
859: Output Parameters:
860: + tol - the tolerance
861: - its - the number of iterations
863: Level: advanced
865: .seealso: DSNEPSetRefine()
866: @*/
867: PetscErrorCode DSNEPGetRefine(DS ds,PetscReal *tol,PetscInt *its)
868: {
869: PetscFunctionBegin;
871: PetscUseMethod(ds,"DSNEPGetRefine_C",(DS,PetscReal*,PetscInt*),(ds,tol,its));
872: PetscFunctionReturn(PETSC_SUCCESS);
873: }
875: static PetscErrorCode DSNEPSetIntegrationPoints_NEP(DS ds,PetscInt ip)
876: {
877: DS_NEP *ctx = (DS_NEP*)ds->data;
879: PetscFunctionBegin;
880: if (ip == PETSC_DECIDE || ip == PETSC_DEFAULT) ctx->nnod = 64;
881: else {
882: PetscCheck(ip>0,PetscObjectComm((PetscObject)ds),PETSC_ERR_ARG_OUTOFRANGE,"The number of integration points must be > 0");
883: ctx->nnod = ip;
884: }
885: PetscCall(PetscLayoutDestroy(&ctx->map)); /* need to redistribute at next solve */
886: PetscFunctionReturn(PETSC_SUCCESS);
887: }
889: /*@
890: DSNEPSetIntegrationPoints - Sets the number of integration points to be
891: used in the contour integral method.
893: Logically Collective
895: Input Parameters:
896: + ds - the direct solver context
897: - ip - the number of integration points
899: Options Database Key:
900: . -ds_nep_integration_points <ip> - sets the number of integration points
902: Notes:
903: This parameter is relevant only in the contour integral method.
905: Level: advanced
907: .seealso: DSNEPGetIntegrationPoints()
908: @*/
909: PetscErrorCode DSNEPSetIntegrationPoints(DS ds,PetscInt ip)
910: {
911: PetscFunctionBegin;
914: PetscTryMethod(ds,"DSNEPSetIntegrationPoints_C",(DS,PetscInt),(ds,ip));
915: PetscFunctionReturn(PETSC_SUCCESS);
916: }
918: static PetscErrorCode DSNEPGetIntegrationPoints_NEP(DS ds,PetscInt *ip)
919: {
920: DS_NEP *ctx = (DS_NEP*)ds->data;
922: PetscFunctionBegin;
923: *ip = ctx->nnod;
924: PetscFunctionReturn(PETSC_SUCCESS);
925: }
927: /*@
928: DSNEPGetIntegrationPoints - Returns the number of integration points used
929: in the contour integral method.
931: Not Collective
933: Input Parameter:
934: . ds - the direct solver context
936: Output Parameters:
937: . ip - the number of integration points
939: Level: advanced
941: .seealso: DSNEPSetIntegrationPoints()
942: @*/
943: PetscErrorCode DSNEPGetIntegrationPoints(DS ds,PetscInt *ip)
944: {
945: PetscFunctionBegin;
947: PetscAssertPointer(ip,2);
948: PetscUseMethod(ds,"DSNEPGetIntegrationPoints_C",(DS,PetscInt*),(ds,ip));
949: PetscFunctionReturn(PETSC_SUCCESS);
950: }
952: static PetscErrorCode DSNEPSetSamplingSize_NEP(DS ds,PetscInt p)
953: {
954: DS_NEP *ctx = (DS_NEP*)ds->data;
956: PetscFunctionBegin;
957: if (p == PETSC_DECIDE || p == PETSC_DEFAULT) ctx->spls = 0;
958: else {
959: PetscCheck(p>0,PetscObjectComm((PetscObject)ds),PETSC_ERR_ARG_OUTOFRANGE,"The sample size must be > 0");
960: PetscCheck(p>=20,PetscObjectComm((PetscObject)ds),PETSC_ERR_ARG_OUTOFRANGE,"The sample size cannot be smaller than 20");
961: ctx->spls = p;
962: }
963: PetscFunctionReturn(PETSC_SUCCESS);
964: }
966: /*@
967: DSNEPSetSamplingSize - Sets the number of sampling columns to be
968: used in the contour integral method.
970: Logically Collective
972: Input Parameters:
973: + ds - the direct solver context
974: - p - the number of columns for the sampling matrix
976: Options Database Key:
977: . -ds_nep_sampling_size <p> - sets the number of sampling columns
979: Notes:
980: This parameter is relevant only in the contour integral method.
982: Level: advanced
984: .seealso: DSNEPGetSamplingSize()
985: @*/
986: PetscErrorCode DSNEPSetSamplingSize(DS ds,PetscInt p)
987: {
988: PetscFunctionBegin;
991: PetscTryMethod(ds,"DSNEPSetSamplingSize_C",(DS,PetscInt),(ds,p));
992: PetscFunctionReturn(PETSC_SUCCESS);
993: }
995: static PetscErrorCode DSNEPGetSamplingSize_NEP(DS ds,PetscInt *p)
996: {
997: DS_NEP *ctx = (DS_NEP*)ds->data;
999: PetscFunctionBegin;
1000: *p = ctx->spls;
1001: PetscFunctionReturn(PETSC_SUCCESS);
1002: }
1004: /*@
1005: DSNEPGetSamplingSize - Returns the number of sampling columns used
1006: in the contour integral method.
1008: Not Collective
1010: Input Parameter:
1011: . ds - the direct solver context
1013: Output Parameters:
1014: . p - the number of columns for the sampling matrix
1016: Level: advanced
1018: .seealso: DSNEPSetSamplingSize()
1019: @*/
1020: PetscErrorCode DSNEPGetSamplingSize(DS ds,PetscInt *p)
1021: {
1022: PetscFunctionBegin;
1024: PetscAssertPointer(p,2);
1025: PetscUseMethod(ds,"DSNEPGetSamplingSize_C",(DS,PetscInt*),(ds,p));
1026: PetscFunctionReturn(PETSC_SUCCESS);
1027: }
1029: static PetscErrorCode DSNEPSetComputeMatrixFunction_NEP(DS ds,DSNEPMatrixFunctionFn *fun,void *ctx)
1030: {
1031: DS_NEP *dsctx = (DS_NEP*)ds->data;
1033: PetscFunctionBegin;
1034: dsctx->computematrix = fun;
1035: dsctx->computematrixctx = ctx;
1036: PetscFunctionReturn(PETSC_SUCCESS);
1037: }
1039: /*@C
1040: DSNEPSetComputeMatrixFunction - Sets a user-provided subroutine to compute
1041: the matrices T(lambda) or T'(lambda).
1043: Logically Collective
1045: Input Parameters:
1046: + ds - the direct solver context
1047: . fun - matrix function evaluation routine, see DSNEPMatrixFunctionFn for the calling sequence
1048: - ctx - a context pointer (the last parameter to the user function)
1050: Note:
1051: The result is computed as T(lambda) = sum_i E_i*f_i(lambda), and similarly
1052: for the derivative.
1054: Level: developer
1056: .seealso: DSNEPGetComputeMatrixFunction()
1057: @*/
1058: PetscErrorCode DSNEPSetComputeMatrixFunction(DS ds,DSNEPMatrixFunctionFn *fun,void *ctx)
1059: {
1060: PetscFunctionBegin;
1062: PetscTryMethod(ds,"DSNEPSetComputeMatrixFunction_C",(DS,DSNEPMatrixFunctionFn*,void*),(ds,fun,ctx));
1063: PetscFunctionReturn(PETSC_SUCCESS);
1064: }
1066: static PetscErrorCode DSNEPGetComputeMatrixFunction_NEP(DS ds,DSNEPMatrixFunctionFn **fun,void **ctx)
1067: {
1068: DS_NEP *dsctx = (DS_NEP*)ds->data;
1070: PetscFunctionBegin;
1071: if (fun) *fun = dsctx->computematrix;
1072: if (ctx) *ctx = dsctx->computematrixctx;
1073: PetscFunctionReturn(PETSC_SUCCESS);
1074: }
1076: /*@C
1077: DSNEPGetComputeMatrixFunction - Returns the user-provided callback function
1078: set in DSNEPSetComputeMatrixFunction().
1080: Not Collective
1082: Input Parameter:
1083: . ds - the direct solver context
1085: Output Parameters:
1086: + fun - the pointer to the user function
1087: - ctx - the context pointer
1089: Level: developer
1091: .seealso: DSNEPSetComputeMatrixFunction()
1092: @*/
1093: PetscErrorCode DSNEPGetComputeMatrixFunction(DS ds,DSNEPMatrixFunctionFn **fun,void **ctx)
1094: {
1095: PetscFunctionBegin;
1097: PetscUseMethod(ds,"DSNEPGetComputeMatrixFunction_C",(DS,DSNEPMatrixFunctionFn**,void**),(ds,fun,ctx));
1098: PetscFunctionReturn(PETSC_SUCCESS);
1099: }
1101: static PetscErrorCode DSNEPSetRG_NEP(DS ds,RG rg)
1102: {
1103: DS_NEP *dsctx = (DS_NEP*)ds->data;
1105: PetscFunctionBegin;
1106: PetscCall(PetscObjectReference((PetscObject)rg));
1107: PetscCall(RGDestroy(&dsctx->rg));
1108: dsctx->rg = rg;
1109: PetscFunctionReturn(PETSC_SUCCESS);
1110: }
1112: /*@
1113: DSNEPSetRG - Associates a region object to the DSNEP solver.
1115: Collective
1117: Input Parameters:
1118: + ds - the direct solver context
1119: - rg - the region context
1121: Notes:
1122: The region is used only in the contour integral method, and
1123: should enclose the wanted eigenvalues.
1125: Level: developer
1127: .seealso: DSNEPGetRG()
1128: @*/
1129: PetscErrorCode DSNEPSetRG(DS ds,RG rg)
1130: {
1131: PetscFunctionBegin;
1133: if (rg) {
1135: PetscCheckSameComm(ds,1,rg,2);
1136: }
1137: PetscTryMethod(ds,"DSNEPSetRG_C",(DS,RG),(ds,rg));
1138: PetscFunctionReturn(PETSC_SUCCESS);
1139: }
1141: static PetscErrorCode DSNEPGetRG_NEP(DS ds,RG *rg)
1142: {
1143: DS_NEP *ctx = (DS_NEP*)ds->data;
1145: PetscFunctionBegin;
1146: if (!ctx->rg) {
1147: PetscCall(RGCreate(PetscObjectComm((PetscObject)ds),&ctx->rg));
1148: PetscCall(PetscObjectIncrementTabLevel((PetscObject)ctx->rg,(PetscObject)ds,1));
1149: PetscCall(RGSetOptionsPrefix(ctx->rg,((PetscObject)ds)->prefix));
1150: PetscCall(RGAppendOptionsPrefix(ctx->rg,"ds_nep_"));
1151: PetscCall(PetscObjectSetOptions((PetscObject)ctx->rg,((PetscObject)ds)->options));
1152: }
1153: *rg = ctx->rg;
1154: PetscFunctionReturn(PETSC_SUCCESS);
1155: }
1157: /*@
1158: DSNEPGetRG - Obtain the region object associated to the DSNEP solver.
1160: Collective
1162: Input Parameter:
1163: . ds - the direct solver context
1165: Output Parameter:
1166: . rg - the region context
1168: Level: developer
1170: .seealso: DSNEPSetRG()
1171: @*/
1172: PetscErrorCode DSNEPGetRG(DS ds,RG *rg)
1173: {
1174: PetscFunctionBegin;
1176: PetscAssertPointer(rg,2);
1177: PetscUseMethod(ds,"DSNEPGetRG_C",(DS,RG*),(ds,rg));
1178: PetscFunctionReturn(PETSC_SUCCESS);
1179: }
1181: static PetscErrorCode DSSetFromOptions_NEP(DS ds,PetscOptionItems *PetscOptionsObject)
1182: {
1183: PetscInt k;
1184: PetscBool flg;
1185: #if defined(PETSC_USE_COMPLEX)
1186: PetscReal r;
1187: PetscBool flg1;
1188: DS_NEP *ctx = (DS_NEP*)ds->data;
1189: #endif
1191: PetscFunctionBegin;
1192: PetscOptionsHeadBegin(PetscOptionsObject,"DS NEP Options");
1194: PetscCall(PetscOptionsInt("-ds_nep_minimality","Maximum minimality index","DSNEPSetMinimality",4,&k,&flg));
1195: if (flg) PetscCall(DSNEPSetMinimality(ds,k));
1197: PetscCall(PetscOptionsInt("-ds_nep_integration_points","Number of integration points","DSNEPSetIntegrationPoints",64,&k,&flg));
1198: if (flg) PetscCall(DSNEPSetIntegrationPoints(ds,k));
1200: PetscCall(PetscOptionsInt("-ds_nep_sampling_size","Number of sampling columns","DSNEPSetSamplingSize",0,&k,&flg));
1201: if (flg) PetscCall(DSNEPSetSamplingSize(ds,k));
1203: #if defined(PETSC_USE_COMPLEX)
1204: r = ctx->rtol;
1205: PetscCall(PetscOptionsReal("-ds_nep_refine_tol","Refinement tolerance","DSNEPSetRefine",ctx->rtol,&r,&flg1));
1206: k = ctx->Nit;
1207: PetscCall(PetscOptionsInt("-ds_nep_refine_its","Number of iterative refinement iterations","DSNEPSetRefine",ctx->Nit,&k,&flg));
1208: if (flg1||flg) PetscCall(DSNEPSetRefine(ds,r,k));
1210: if (ds->method==1) {
1211: if (!ctx->rg) PetscCall(DSNEPGetRG(ds,&ctx->rg));
1212: PetscCall(RGSetFromOptions(ctx->rg));
1213: }
1214: #endif
1216: PetscOptionsHeadEnd();
1217: PetscFunctionReturn(PETSC_SUCCESS);
1218: }
1220: static PetscErrorCode DSDestroy_NEP(DS ds)
1221: {
1222: DS_NEP *ctx = (DS_NEP*)ds->data;
1223: PetscInt i;
1225: PetscFunctionBegin;
1226: for (i=0;i<ctx->nf;i++) PetscCall(FNDestroy(&ctx->f[i]));
1227: PetscCall(RGDestroy(&ctx->rg));
1228: PetscCall(PetscLayoutDestroy(&ctx->map));
1229: PetscCall(PetscFree(ds->data));
1230: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPSetFN_C",NULL));
1231: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPGetFN_C",NULL));
1232: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPGetNumFN_C",NULL));
1233: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPGetMinimality_C",NULL));
1234: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPSetMinimality_C",NULL));
1235: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPGetRefine_C",NULL));
1236: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPSetRefine_C",NULL));
1237: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPGetIntegrationPoints_C",NULL));
1238: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPSetIntegrationPoints_C",NULL));
1239: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPGetSamplingSize_C",NULL));
1240: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPSetSamplingSize_C",NULL));
1241: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPSetRG_C",NULL));
1242: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPGetRG_C",NULL));
1243: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPSetComputeMatrixFunction_C",NULL));
1244: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPGetComputeMatrixFunction_C",NULL));
1245: PetscFunctionReturn(PETSC_SUCCESS);
1246: }
1248: static PetscErrorCode DSMatGetSize_NEP(DS ds,DSMatType t,PetscInt *rows,PetscInt *cols)
1249: {
1250: DS_NEP *ctx = (DS_NEP*)ds->data;
1252: PetscFunctionBegin;
1253: *rows = ds->n;
1254: if (t==DS_MAT_Q || t==DS_MAT_Z || t==DS_MAT_U || t==DS_MAT_V) *rows *= ctx->max_mid;
1255: *cols = ds->n;
1256: if (t==DS_MAT_Q || t==DS_MAT_Z || t==DS_MAT_U || t==DS_MAT_V || t==DS_MAT_X || t==DS_MAT_Y) *cols *= ctx->max_mid;
1257: PetscFunctionReturn(PETSC_SUCCESS);
1258: }
1260: /*MC
1261: DSNEP - Dense Nonlinear Eigenvalue Problem.
1263: Level: beginner
1265: Notes:
1266: The problem is expressed as T(lambda)*x = 0, where T(lambda) is a
1267: parameter-dependent matrix written as T(lambda) = sum_i E_i*f_i(lambda).
1268: The eigenvalues lambda are the arguments returned by DSSolve()..
1270: The coefficient matrices E_i are the extra matrices of the DS, and
1271: the scalar functions f_i are passed via DSNEPSetFN(). Optionally, a
1272: callback function to fill the E_i matrices can be set with
1273: DSNEPSetComputeMatrixFunction().
1275: Used DS matrices:
1276: + DS_MAT_Ex - coefficient matrices of the split form of T(lambda)
1277: . DS_MAT_X - eigenvectors
1278: . DS_MAT_A - (workspace) T(lambda) evaluated at a given lambda (SLP only)
1279: . DS_MAT_B - (workspace) T'(lambda) evaluated at a given lambda (SLP only)
1280: . DS_MAT_Q - (workspace) left Hankel matrix (contour only)
1281: . DS_MAT_Z - (workspace) right Hankel matrix (contour only)
1282: . DS_MAT_U - (workspace) left singular vectors (contour only)
1283: . DS_MAT_V - (workspace) right singular vectors (contour only)
1284: - DS_MAT_W - (workspace) auxiliary matrix of size nxn
1286: Implemented methods:
1287: + 0 - Successive Linear Problems (SLP), computes just one eigenpair
1288: - 1 - Contour integral, computes all eigenvalues inside a region
1290: .seealso: DSCreate(), DSSetType(), DSType, DSNEPSetFN(), DSNEPSetComputeMatrixFunction()
1291: M*/
1292: SLEPC_EXTERN PetscErrorCode DSCreate_NEP(DS ds)
1293: {
1294: DS_NEP *ctx;
1296: PetscFunctionBegin;
1297: PetscCall(PetscNew(&ctx));
1298: ds->data = (void*)ctx;
1299: ctx->max_mid = 4;
1300: ctx->nnod = 64;
1301: ctx->Nit = 3;
1302: ctx->rtol = PETSC_MACHINE_EPSILON/PetscSqrtReal(PETSC_SQRT_MACHINE_EPSILON);
1304: ds->ops->allocate = DSAllocate_NEP;
1305: ds->ops->setfromoptions = DSSetFromOptions_NEP;
1306: ds->ops->view = DSView_NEP;
1307: ds->ops->vectors = DSVectors_NEP;
1308: ds->ops->solve[0] = DSSolve_NEP_SLP;
1309: #if defined(PETSC_USE_COMPLEX)
1310: ds->ops->solve[1] = DSSolve_NEP_Contour;
1311: #endif
1312: ds->ops->sort = DSSort_NEP;
1313: #if !defined(PETSC_HAVE_MPIUNI)
1314: ds->ops->synchronize = DSSynchronize_NEP;
1315: #endif
1316: ds->ops->destroy = DSDestroy_NEP;
1317: ds->ops->matgetsize = DSMatGetSize_NEP;
1319: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPSetFN_C",DSNEPSetFN_NEP));
1320: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPGetFN_C",DSNEPGetFN_NEP));
1321: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPGetNumFN_C",DSNEPGetNumFN_NEP));
1322: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPGetMinimality_C",DSNEPGetMinimality_NEP));
1323: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPSetMinimality_C",DSNEPSetMinimality_NEP));
1324: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPGetRefine_C",DSNEPGetRefine_NEP));
1325: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPSetRefine_C",DSNEPSetRefine_NEP));
1326: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPGetIntegrationPoints_C",DSNEPGetIntegrationPoints_NEP));
1327: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPSetIntegrationPoints_C",DSNEPSetIntegrationPoints_NEP));
1328: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPGetSamplingSize_C",DSNEPGetSamplingSize_NEP));
1329: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPSetSamplingSize_C",DSNEPSetSamplingSize_NEP));
1330: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPSetRG_C",DSNEPSetRG_NEP));
1331: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPGetRG_C",DSNEPGetRG_NEP));
1332: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPSetComputeMatrixFunction_C",DSNEPSetComputeMatrixFunction_NEP));
1333: PetscCall(PetscObjectComposeFunction((PetscObject)ds,"DSNEPGetComputeMatrixFunction_C",DSNEPGetComputeMatrixFunction_NEP));
1334: PetscFunctionReturn(PETSC_SUCCESS);
1335: }