Actual source code: telescope.c

petsc-master 2019-11-16
Report Typos and Errors

  2:  #include <petsc/private/petscimpl.h>
  3:  #include <petsc/private/matimpl.h>
  4:  #include <petsc/private/pcimpl.h>
  5:  #include <petscksp.h>
  6:  #include <petscdm.h>
  7: #include "../src/ksp/pc/impls/telescope/telescope.h"

  9: static PetscBool  cited = PETSC_FALSE; /* flag handed to PetscCitationsRegister() together with citation[] in PCApply_Telescope() */
 10: static const char citation[] = /* BibTeX entry for the PASC '16 paper "Extreme-Scale Multigrid Components within PETSc" */
 11: "@inproceedings{MaySananRuppKnepleySmith2016,\n"
 12: "  title     = {Extreme-Scale Multigrid Components within PETSc},\n"
 13: "  author    = {Dave A. May and Patrick Sanan and Karl Rupp and Matthew G. Knepley and Barry F. Smith},\n"
 14: "  booktitle = {Proceedings of the Platform for Advanced Scientific Computing Conference},\n"
 15: "  series    = {PASC '16},\n"
 16: "  isbn      = {978-1-4503-4126-4},\n"
 17: "  location  = {Lausanne, Switzerland},\n"
 18: "  pages     = {5:1--5:12},\n"
 19: "  articleno = {5},\n"
 20: "  numpages  = {12},\n"
 21: "  url       = {https://doi.acm.org/10.1145/2929908.2929913},\n"
 22: "  doi       = {10.1145/2929908.2929913},\n"
 23: "  acmid     = {2929913},\n"
 24: "  publisher = {ACM},\n"
 25: "  address   = {New York, NY, USA},\n"
 26: "  keywords  = {GPU, HPC, agglomeration, coarse-level solver, multigrid, parallel computing, preconditioning},\n"
 27: "  year      = {2016}\n"
 28: "}\n";

 30: /*
 31:  default setup mode

 33:  [1a] scatter to (FORWARD)
 34:  x(comm) -> xtmp(comm)
 35:  [1b] local copy (to) ranks with color = 0
 36:  xred(subcomm) <- xtmp
 37:  
 38:  [2] solve on sub KSP to obtain yred(subcomm)

 40:  [3a] local copy (from) ranks with color = 0
 41:  yred(subcomm) --> xtmp
 42:  [3b] scatter from (REVERSE)
 43:  xtmp(comm) -> y(comm)
 44: */

 46: /*
 47:   Collective[comm_f]
 48:   Notes
 49:    * Using comm_f = MPI_COMM_NULL will result in an error
 50:    * Using comm_c = MPI_COMM_NULL is valid. If all instances of comm_c are NULL the subcomm is not valid.
 51:    * If any non NULL comm_c communicator cannot map any of its ranks to comm_f, the subcomm is not valid.
 52: */
 53: PetscErrorCode PCTelescopeTestValidSubcomm(MPI_Comm comm_f,MPI_Comm comm_c,PetscBool *isvalid)
 54: {
 55:   PetscInt       valid = 1;
 56:   MPI_Group      group_f,group_c;
 58:   PetscMPIInt    count,k,size_f = 0,size_c = 0,size_c_sum = 0;
 59:   PetscMPIInt    *ranks_f,*ranks_c;

 62:   if (comm_f == MPI_COMM_NULL) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"comm_f cannot be MPI_COMM_NULL");

 64:   MPI_Comm_group(comm_f,&group_f);
 65:   if (comm_c != MPI_COMM_NULL) {
 66:     MPI_Comm_group(comm_c,&group_c);
 67:   }

 69:   MPI_Comm_size(comm_f,&size_f);
 70:   if (comm_c != MPI_COMM_NULL) {
 71:     MPI_Comm_size(comm_c,&size_c);
 72:   }

 74:   /* check not all comm_c's are NULL */
 75:   size_c_sum = size_c;
 76:   MPI_Allreduce(MPI_IN_PLACE,&size_c_sum,1,MPI_INT,MPI_SUM,comm_f);
 77:   if (size_c_sum == 0) valid = 0;

 79:   /* check we can map at least 1 rank in comm_c to comm_f */
 80:   PetscMalloc1(size_f,&ranks_f);
 81:   PetscMalloc1(size_c,&ranks_c);
 82:   for (k=0; k<size_f; k++) ranks_f[k] = MPI_UNDEFINED;
 83:   for (k=0; k<size_c; k++) ranks_c[k] = k;

 85:   /*
 86:    MPI_Group_translate_ranks() returns a non-zero exit code if any rank cannot be translated.
 87:    I do not want the code to terminate immediately if this occurs, rather I want to throw 
 88:    the error later (during PCSetUp_Telescope()) via SETERRQ() with a message indicating 
 89:    that comm_c is not a valid sub-communicator.
 90:    Hence I purposefully do not call CHKERRQ() after MPI_Group_translate_ranks().
 91:   */
 92:   count = 0;
 93:   if (comm_c != MPI_COMM_NULL) {
 94:     (void)MPI_Group_translate_ranks(group_c,size_c,ranks_c,group_f,ranks_f);
 95:     for (k=0; k<size_f; k++) {
 96:       if (ranks_f[k] == MPI_UNDEFINED) {
 97:         count++;
 98:       }
 99:     }
100:   }
101:   if (count == size_f) valid = 0;

103:   MPI_Allreduce(MPI_IN_PLACE,&valid,1,MPIU_INT,MPI_MIN,comm_f);
104:   if (valid == 1) *isvalid = PETSC_TRUE;
105:   else *isvalid = PETSC_FALSE;

107:   PetscFree(ranks_f);
108:   PetscFree(ranks_c);
109:   MPI_Group_free(&group_f);
110:   if (comm_c != MPI_COMM_NULL) {
111:     MPI_Group_free(&group_c);
112:   }
113:   return(0);
114: }

116: DM private_PCTelescopeGetSubDM(PC_Telescope sred)
117: {
118:   DM subdm = NULL;

120:   if (!PCTelescope_isActiveRank(sred)) { subdm = NULL; }
121:   else {
122:     switch (sred->sr_type) {
123:     case TELESCOPE_DEFAULT: subdm = NULL;
124:       break;
125:     case TELESCOPE_DMDA:    subdm = ((PC_Telescope_DMDACtx*)sred->dm_ctx)->dmrepart;
126:       break;
127:     case TELESCOPE_DMPLEX:  subdm = NULL;
128:       break;
129:     case TELESCOPE_COARSEDM: if (sred->ksp) { KSPGetDM(sred->ksp,&subdm); }
130:       break;
131:     }
132:   }
133:   return(subdm);
134: }

136: PetscErrorCode PCTelescopeSetUp_default(PC pc,PC_Telescope sred)
137: {
139:   PetscInt       m,M,bs,st,ed;
140:   Vec            x,xred,yred,xtmp;
141:   Mat            B;
142:   MPI_Comm       comm,subcomm;
143:   VecScatter     scatter;
144:   IS             isin;

147:   PetscInfo(pc,"PCTelescope: setup (default)\n");
148:   comm = PetscSubcommParent(sred->psubcomm);
149:   subcomm = PetscSubcommChild(sred->psubcomm);

151:   PCGetOperators(pc,NULL,&B);
152:   MatGetSize(B,&M,NULL);
153:   MatGetBlockSize(B,&bs);
154:   MatCreateVecs(B,&x,NULL);

156:   xred = NULL;
157:   m    = 0;
158:   if (PCTelescope_isActiveRank(sred)) {
159:     VecCreate(subcomm,&xred);
160:     VecSetSizes(xred,PETSC_DECIDE,M);
161:     VecSetBlockSize(xred,bs);
162:     VecSetFromOptions(xred);
163:     VecGetLocalSize(xred,&m);
164:   }

166:   yred = NULL;
167:   if (PCTelescope_isActiveRank(sred)) {
168:     VecDuplicate(xred,&yred);
169:   }

171:   VecCreate(comm,&xtmp);
172:   VecSetSizes(xtmp,m,PETSC_DECIDE);
173:   VecSetBlockSize(xtmp,bs);
174:   VecSetType(xtmp,((PetscObject)x)->type_name);

176:   if (PCTelescope_isActiveRank(sred)) {
177:     VecGetOwnershipRange(xred,&st,&ed);
178:     ISCreateStride(comm,(ed-st),st,1,&isin);
179:   } else {
180:     VecGetOwnershipRange(x,&st,&ed);
181:     ISCreateStride(comm,0,st,1,&isin);
182:   }
183:   ISSetBlockSize(isin,bs);

185:   VecScatterCreate(x,isin,xtmp,NULL,&scatter);

187:   sred->isin    = isin;
188:   sred->scatter = scatter;
189:   sred->xred    = xred;
190:   sred->yred    = yred;
191:   sred->xtmp    = xtmp;
192:   VecDestroy(&x);
193:   return(0);
194: }

196: PetscErrorCode PCTelescopeMatCreate_default(PC pc,PC_Telescope sred,MatReuse reuse,Mat *A)
197: {
199:   MPI_Comm       comm,subcomm;
200:   Mat            Bred,B;
201:   PetscInt       nr,nc;
202:   IS             isrow,iscol;
203:   Mat            Blocal,*_Blocal;

206:   PetscInfo(pc,"PCTelescope: updating the redundant preconditioned operator (default)\n");
207:   PetscObjectGetComm((PetscObject)pc,&comm);
208:   subcomm = PetscSubcommChild(sred->psubcomm);
209:   PCGetOperators(pc,NULL,&B);
210:   MatGetSize(B,&nr,&nc);
211:   isrow = sred->isin;
212:   ISCreateStride(comm,nc,0,1,&iscol);
213:   MatCreateSubMatrices(B,1,&isrow,&iscol,MAT_INITIAL_MATRIX,&_Blocal);
214:   Blocal = *_Blocal;
215:   PetscFree(_Blocal);
216:   Bred = NULL;
217:   if (PCTelescope_isActiveRank(sred)) {
218:     PetscInt mm;

220:     if (reuse != MAT_INITIAL_MATRIX) { Bred = *A; }

222:     MatGetSize(Blocal,&mm,NULL);
223:     MatCreateMPIMatConcatenateSeqMat(subcomm,Blocal,mm,reuse,&Bred);
224:   }
225:   *A = Bred;
226:   ISDestroy(&iscol);
227:   MatDestroy(&Blocal);
228:   return(0);
229: }

231: static PetscErrorCode PCTelescopeSubNullSpaceCreate_Telescope(PC pc,PC_Telescope sred,MatNullSpace nullspace,MatNullSpace *sub_nullspace)
232: {
234:   PetscBool      has_const;
235:   const Vec      *vecs;
236:   Vec            *sub_vecs = NULL;
237:   PetscInt       i,k,n = 0;
238:   MPI_Comm       subcomm;

241:   subcomm = PetscSubcommChild(sred->psubcomm);
242:   MatNullSpaceGetVecs(nullspace,&has_const,&n,&vecs);

244:   if (PCTelescope_isActiveRank(sred)) {
245:     if (n) {
246:       VecDuplicateVecs(sred->xred,n,&sub_vecs);
247:     }
248:   }

250:   /* copy entries */
251:   for (k=0; k<n; k++) {
252:     const PetscScalar *x_array;
253:     PetscScalar       *LA_sub_vec;
254:     PetscInt          st,ed;

256:     /* pull in vector x->xtmp */
257:     VecScatterBegin(sred->scatter,vecs[k],sred->xtmp,INSERT_VALUES,SCATTER_FORWARD);
258:     VecScatterEnd(sred->scatter,vecs[k],sred->xtmp,INSERT_VALUES,SCATTER_FORWARD);
259:     if (sub_vecs) {
260:       /* copy vector entries into xred */
261:       VecGetArrayRead(sred->xtmp,&x_array);
262:       if (sub_vecs[k]) {
263:         VecGetOwnershipRange(sub_vecs[k],&st,&ed);
264:         VecGetArray(sub_vecs[k],&LA_sub_vec);
265:         for (i=0; i<ed-st; i++) {
266:           LA_sub_vec[i] = x_array[i];
267:         }
268:         VecRestoreArray(sub_vecs[k],&LA_sub_vec);
269:       }
270:       VecRestoreArrayRead(sred->xtmp,&x_array);
271:     }
272:   }

274:   if (PCTelescope_isActiveRank(sred)) {
275:     /* create new (near) nullspace for redundant object */
276:     MatNullSpaceCreate(subcomm,has_const,n,sub_vecs,sub_nullspace);
277:     VecDestroyVecs(n,&sub_vecs);
278:     if (nullspace->remove) SETERRQ(PetscObjectComm((PetscObject)pc),PETSC_ERR_SUP,"Propagation of custom remove callbacks not supported when propagating (near) nullspaces with PCTelescope");
279:     if (nullspace->rmctx) SETERRQ(PetscObjectComm((PetscObject)pc),PETSC_ERR_SUP,"Propagation of custom remove callback context not supported when propagating (near) nullspaces with PCTelescope");
280:   }
281:   return(0);
282: }

284: static PetscErrorCode PCTelescopeMatNullSpaceCreate_default(PC pc,PC_Telescope sred,Mat sub_mat)
285: {
287:   Mat            B;

290:   PCGetOperators(pc,NULL,&B);
291:   /* Propagate the nullspace if it exists */
292:   {
293:     MatNullSpace nullspace,sub_nullspace;
294:     MatGetNullSpace(B,&nullspace);
295:     if (nullspace) {
296:       PetscInfo(pc,"PCTelescope: generating nullspace (default)\n");
297:       PCTelescopeSubNullSpaceCreate_Telescope(pc,sred,nullspace,&sub_nullspace);
298:       if (PCTelescope_isActiveRank(sred)) {
299:         MatSetNullSpace(sub_mat,sub_nullspace);
300:         MatNullSpaceDestroy(&sub_nullspace);
301:       }
302:     }
303:   }
304:   /* Propagate the near nullspace if it exists */
305:   {
306:     MatNullSpace nearnullspace,sub_nearnullspace;
307:     MatGetNearNullSpace(B,&nearnullspace);
308:     if (nearnullspace) {
309:       PetscInfo(pc,"PCTelescope: generating near nullspace (default)\n");
310:       PCTelescopeSubNullSpaceCreate_Telescope(pc,sred,nearnullspace,&sub_nearnullspace);
311:       if (PCTelescope_isActiveRank(sred)) {
312:         MatSetNearNullSpace(sub_mat,sub_nearnullspace);
313:         MatNullSpaceDestroy(&sub_nearnullspace);
314:       }
315:     }
316:   }
317:   return(0);
318: }

320: static PetscErrorCode PCView_Telescope(PC pc,PetscViewer viewer)
321: {
322:   PC_Telescope   sred = (PC_Telescope)pc->data;
324:   PetscBool      iascii,isstring;
325:   PetscViewer    subviewer;

328:   PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);
329:   PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERSTRING,&isstring);
330:   if (iascii) {
331:     {
332:       MPI_Comm    comm,subcomm;
333:       PetscMPIInt comm_size,subcomm_size;
334:       DM          dm = NULL,subdm = NULL;

336:       PCGetDM(pc,&dm);
337:       subdm = private_PCTelescopeGetSubDM(sred);

339:       if (sred->psubcomm) {
340:         comm = PetscSubcommParent(sred->psubcomm);
341:         subcomm = PetscSubcommChild(sred->psubcomm);
342:         MPI_Comm_size(comm,&comm_size);
343:         MPI_Comm_size(subcomm,&subcomm_size);

345:         PetscViewerASCIIPushTab(viewer);
346:         PetscViewerASCIIPrintf(viewer,"petsc subcomm: parent comm size reduction factor = %D\n",sred->redfactor);
347:         PetscViewerASCIIPrintf(viewer,"petsc subcomm: parent_size = %d , subcomm_size = %d\n",(int)comm_size,(int)subcomm_size);
348:         switch (sred->subcommtype) {
349:         case PETSC_SUBCOMM_INTERLACED :
350:           PetscViewerASCIIPrintf(viewer,"petsc subcomm: type = interlaced\n",sred->subcommtype);
351:           break;
352:         case PETSC_SUBCOMM_CONTIGUOUS :
353:           PetscViewerASCIIPrintf(viewer,"petsc subcomm type = contiguous\n",sred->subcommtype);
354:           break;
355:         default :
356:           SETERRQ(PetscObjectComm((PetscObject)pc),PETSC_ERR_SUP,"General subcomm type not supported by PCTelescope");
357:         }
358:         PetscViewerASCIIPopTab(viewer);
359:       } else {
360:         PetscObjectGetComm((PetscObject)pc,&comm);
361:         subcomm = sred->subcomm;
362:         if (!PCTelescope_isActiveRank(sred)) {
363:           subcomm = PETSC_COMM_SELF;
364:         }

366:         PetscViewerASCIIPushTab(viewer);
367:         PetscViewerASCIIPrintf(viewer,"subcomm: using user provided sub-communicator\n");
368:         PetscViewerASCIIPopTab(viewer);
369:       }

371:       PetscViewerGetSubViewer(viewer,subcomm,&subviewer);
372:       if (PCTelescope_isActiveRank(sred)) {
373:         PetscViewerASCIIPushTab(subviewer);

375:         if (dm && sred->ignore_dm) {
376:           PetscViewerASCIIPrintf(subviewer,"ignoring DM\n");
377:         }
378:         if (sred->ignore_kspcomputeoperators) {
379:           PetscViewerASCIIPrintf(subviewer,"ignoring KSPComputeOperators\n");
380:         }
381:         switch (sred->sr_type) {
382:         case TELESCOPE_DEFAULT:
383:           PetscViewerASCIIPrintf(subviewer,"setup type: default\n");
384:           break;
385:         case TELESCOPE_DMDA:
386:           PetscViewerASCIIPrintf(subviewer,"setup type: DMDA auto-repartitioning\n");
387:           DMView_DA_Short(subdm,subviewer);
388:           break;
389:         case TELESCOPE_DMPLEX:
390:           PetscViewerASCIIPrintf(subviewer,"setup type: DMPLEX auto-repartitioning\n");
391:           break;
392:         case TELESCOPE_COARSEDM:
393:           PetscViewerASCIIPrintf(subviewer,"setup type: coarse DM\n");
394:           break;
395:         }

397:         if (dm) {
398:           PetscObject obj = (PetscObject)dm;
399:           PetscViewerASCIIPrintf(subviewer,"Parent DM object:");
400:           PetscViewerASCIIUseTabs(subviewer,PETSC_FALSE);
401:           if (obj->type_name) { PetscViewerASCIIPrintf(subviewer," type = %s;",obj->type_name); }
402:           if (obj->name) { PetscViewerASCIIPrintf(subviewer," name = %s;",obj->name); }
403:           if (obj->prefix) { PetscViewerASCIIPrintf(subviewer," prefix = %s",obj->prefix); }
404:           PetscViewerASCIIPrintf(subviewer,"\n");
405:           PetscViewerASCIIUseTabs(subviewer,PETSC_TRUE);
406:         } else {
407:           PetscViewerASCIIPrintf(subviewer,"Parent DM object: NULL\n");
408:         }
409:         if (subdm) {
410:           PetscObject obj = (PetscObject)subdm;
411:           PetscViewerASCIIPrintf(subviewer,"Sub DM object:");
412:           PetscViewerASCIIUseTabs(subviewer,PETSC_FALSE);
413:           if (obj->type_name) { PetscViewerASCIIPrintf(subviewer," type = %s;",obj->type_name); }
414:           if (obj->name) { PetscViewerASCIIPrintf(subviewer," name = %s;",obj->name); }
415:           if (obj->prefix) { PetscViewerASCIIPrintf(subviewer," prefix = %s",obj->prefix); }
416:           PetscViewerASCIIPrintf(subviewer,"\n");
417:           PetscViewerASCIIUseTabs(subviewer,PETSC_TRUE);
418:         } else {
419:           PetscViewerASCIIPrintf(subviewer,"Sub DM object: NULL\n");
420:         }
421: 
422:         KSPView(sred->ksp,subviewer);
423:         PetscViewerASCIIPopTab(subviewer);
424:       }
425:       PetscViewerRestoreSubViewer(viewer,subcomm,&subviewer);
426:     }
427:   }
428:   return(0);
429: }

431: static PetscErrorCode PCSetUp_Telescope(PC pc)
432: {
433:   PC_Telescope    sred = (PC_Telescope)pc->data;
434:   PetscErrorCode  ierr;
435:   MPI_Comm        comm,subcomm=0;
436:   PCTelescopeType sr_type;

439:   PetscObjectGetComm((PetscObject)pc,&comm);

441:   /* Determine type of setup/update */
442:   if (!pc->setupcalled) {
443:     PetscBool has_dm,same;
444:     DM        dm;

446:     sr_type = TELESCOPE_DEFAULT;
447:     has_dm = PETSC_FALSE;
448:     PCGetDM(pc,&dm);
449:     if (dm) { has_dm = PETSC_TRUE; }
450:     if (has_dm) {
451:       /* check for dmda */
452:       PetscObjectTypeCompare((PetscObject)dm,DMDA,&same);
453:       if (same) {
454:         PetscInfo(pc,"PCTelescope: found DMDA\n");
455:         sr_type = TELESCOPE_DMDA;
456:       }
457:       /* check for dmplex */
458:       PetscObjectTypeCompare((PetscObject)dm,DMPLEX,&same);
459:       if (same) {
460:         PetscInfo(pc,"PCTelescope: found DMPLEX\n");
461:         sr_type = TELESCOPE_DMPLEX;
462:       }

464:       if (sred->use_coarse_dm) {
465:         PetscInfo(pc,"PCTelescope: using coarse DM\n");
466:         sr_type = TELESCOPE_COARSEDM;
467:       }

469:       if (sred->ignore_dm) {
470:         PetscInfo(pc,"PCTelescope: ignoring DM\n");
471:         sr_type = TELESCOPE_DEFAULT;
472:       }
473:     }
474:     sred->sr_type = sr_type;
475:   } else {
476:     sr_type = sred->sr_type;
477:   }

479:   /* set function pointers for repartition setup, matrix creation/update, matrix (near) nullspace, and reset functionality */
480:   switch (sr_type) {
481:   case TELESCOPE_DEFAULT:
482:     sred->pctelescope_setup_type              = PCTelescopeSetUp_default;
483:     sred->pctelescope_matcreate_type          = PCTelescopeMatCreate_default;
484:     sred->pctelescope_matnullspacecreate_type = PCTelescopeMatNullSpaceCreate_default;
485:     sred->pctelescope_reset_type              = NULL;
486:     break;
487:   case TELESCOPE_DMDA:
488:     pc->ops->apply                            = PCApply_Telescope_dmda;
489:     pc->ops->applyrichardson                  = PCApplyRichardson_Telescope_dmda;
490:     sred->pctelescope_setup_type              = PCTelescopeSetUp_dmda;
491:     sred->pctelescope_matcreate_type          = PCTelescopeMatCreate_dmda;
492:     sred->pctelescope_matnullspacecreate_type = PCTelescopeMatNullSpaceCreate_dmda;
493:     sred->pctelescope_reset_type              = PCReset_Telescope_dmda;
494:     break;
495:   case TELESCOPE_DMPLEX: SETERRQ(comm,PETSC_ERR_SUP,"Support for DMPLEX is currently not available");
496:     break;
497:   case TELESCOPE_COARSEDM:
498:     pc->ops->apply                            = PCApply_Telescope_CoarseDM;
499:     pc->ops->applyrichardson                  = PCApplyRichardson_Telescope_CoarseDM;
500:     sred->pctelescope_setup_type              = PCTelescopeSetUp_CoarseDM;
501:     sred->pctelescope_matcreate_type          = NULL;
502:     sred->pctelescope_matnullspacecreate_type = NULL; /* PCTelescopeMatNullSpaceCreate_CoarseDM; */
503:     sred->pctelescope_reset_type              = PCReset_Telescope_CoarseDM;
504:     break;
505:   default: SETERRQ(comm,PETSC_ERR_SUP,"Support only provided for: repartitioning an operator; repartitioning a DMDA; or using a coarse DM");
506:     break;
507:   }

509:   /* subcomm definition */
510:   if (!pc->setupcalled) {
511:     if ((sr_type == TELESCOPE_DEFAULT) || (sr_type == TELESCOPE_DMDA)) {
512:       if (!sred->psubcomm) {
513:         PetscSubcommCreate(comm,&sred->psubcomm);
514:         PetscSubcommSetNumber(sred->psubcomm,sred->redfactor);
515:         PetscSubcommSetType(sred->psubcomm,sred->subcommtype);
516:         PetscLogObjectMemory((PetscObject)pc,sizeof(PetscSubcomm));
517:         sred->subcomm = PetscSubcommChild(sred->psubcomm);
518:       }
519:     } else { /* query PC for DM, check communicators */
520:       DM          dm,dm_coarse_partition = NULL;
521:       MPI_Comm    comm_fine,comm_coarse_partition = MPI_COMM_NULL;
522:       PetscMPIInt csize_fine=0,csize_coarse_partition=0,cs[2],csg[2],cnt=0;
523:       PetscBool   isvalidsubcomm;

525:       PCGetDM(pc,&dm);
526:       comm_fine = PetscObjectComm((PetscObject)dm);
527:       DMGetCoarseDM(dm,&dm_coarse_partition);
528:       if (dm_coarse_partition) { cnt = 1; }
529:       MPI_Allreduce(MPI_IN_PLACE,&cnt,1,MPI_INT,MPI_SUM,comm_fine);
530:       if (cnt == 0) SETERRQ(comm_fine,PETSC_ERR_SUP,"Zero instances of a coarse DM were found");

532:       MPI_Comm_size(comm_fine,&csize_fine);
533:       if (dm_coarse_partition) {
534:         comm_coarse_partition = PetscObjectComm((PetscObject)dm_coarse_partition);
535:         MPI_Comm_size(comm_coarse_partition,&csize_coarse_partition);
536:       }

538:       cs[0] = csize_fine;
539:       cs[1] = csize_coarse_partition;
540:       MPI_Allreduce(cs,csg,2,MPI_INT,MPI_MAX,comm_fine);
541:       if (csg[0] == csg[1]) SETERRQ(comm_fine,PETSC_ERR_SUP,"Coarse DM uses the same size communicator as the parent DM attached to the PC");

543:       PCTelescopeTestValidSubcomm(comm_fine,comm_coarse_partition,&isvalidsubcomm);
544:       if (!isvalidsubcomm) SETERRQ(comm_fine,PETSC_ERR_SUP,"Coarse DM communicator is not a sub-communicator of parentDM->comm");
545:       sred->subcomm = comm_coarse_partition;
546:     }
547:   }
548:   subcomm = sred->subcomm;

550:   /* internal KSP */
551:   if (!pc->setupcalled) {
552:     const char *prefix;

554:     if (PCTelescope_isActiveRank(sred)) {
555:       KSPCreate(subcomm,&sred->ksp);
556:       KSPSetErrorIfNotConverged(sred->ksp,pc->erroriffailure);
557:       PetscObjectIncrementTabLevel((PetscObject)sred->ksp,(PetscObject)pc,1);
558:       PetscLogObjectParent((PetscObject)pc,(PetscObject)sred->ksp);
559:       KSPSetType(sred->ksp,KSPPREONLY);
560:       PCGetOptionsPrefix(pc,&prefix);
561:       KSPSetOptionsPrefix(sred->ksp,prefix);
562:       KSPAppendOptionsPrefix(sred->ksp,"telescope_");
563:     }
564:   }

566:   /* setup */
567:   if (!pc->setupcalled && sred->pctelescope_setup_type) {
568:     sred->pctelescope_setup_type(pc,sred);
569:   }
570:   /* update */
571:   if (!pc->setupcalled) {
572:     if (sred->pctelescope_matcreate_type) {
573:       sred->pctelescope_matcreate_type(pc,sred,MAT_INITIAL_MATRIX,&sred->Bred);
574:     }
575:     if (sred->pctelescope_matnullspacecreate_type) {
576:       sred->pctelescope_matnullspacecreate_type(pc,sred,sred->Bred);
577:     }
578:   } else {
579:     if (sred->pctelescope_matcreate_type) {
580:       sred->pctelescope_matcreate_type(pc,sred,MAT_REUSE_MATRIX,&sred->Bred);
581:     }
582:   }

584:   /* common - no construction */
585:   if (PCTelescope_isActiveRank(sred)) {
586:     KSPSetOperators(sred->ksp,sred->Bred,sred->Bred);
587:     if (pc->setfromoptionscalled && !pc->setupcalled){
588:       KSPSetFromOptions(sred->ksp);
589:     }
590:   }
591:   return(0);
592: }

594: static PetscErrorCode PCApply_Telescope(PC pc,Vec x,Vec y)
595: {
596:   PC_Telescope      sred = (PC_Telescope)pc->data;
597:   PetscErrorCode    ierr;
598:   Vec               xtmp,xred,yred;
599:   PetscInt          i,st,ed;
600:   VecScatter        scatter;
601:   PetscScalar       *array;
602:   const PetscScalar *x_array;

605:   PetscCitationsRegister(citation,&cited);

607:   xtmp    = sred->xtmp;
608:   scatter = sred->scatter;
609:   xred    = sred->xred;
610:   yred    = sred->yred;

612:   /* pull in vector x->xtmp */
613:   VecScatterBegin(scatter,x,xtmp,INSERT_VALUES,SCATTER_FORWARD);
614:   VecScatterEnd(scatter,x,xtmp,INSERT_VALUES,SCATTER_FORWARD);

616:   /* copy vector entries into xred */
617:   VecGetArrayRead(xtmp,&x_array);
618:   if (xred) {
619:     PetscScalar *LA_xred;
620:     VecGetOwnershipRange(xred,&st,&ed);
621:     VecGetArray(xred,&LA_xred);
622:     for (i=0; i<ed-st; i++) {
623:       LA_xred[i] = x_array[i];
624:     }
625:     VecRestoreArray(xred,&LA_xred);
626:   }
627:   VecRestoreArrayRead(xtmp,&x_array);
628:   /* solve */
629:   if (PCTelescope_isActiveRank(sred)) {
630:     KSPSolve(sred->ksp,xred,yred);
631:     KSPCheckSolve(sred->ksp,pc,yred);
632:   }
633:   /* return vector */
634:   VecGetArray(xtmp,&array);
635:   if (yred) {
636:     const PetscScalar *LA_yred;
637:     VecGetOwnershipRange(yred,&st,&ed);
638:     VecGetArrayRead(yred,&LA_yred);
639:     for (i=0; i<ed-st; i++) {
640:       array[i] = LA_yred[i];
641:     }
642:     VecRestoreArrayRead(yred,&LA_yred);
643:   }
644:   VecRestoreArray(xtmp,&array);
645:   VecScatterBegin(scatter,xtmp,y,INSERT_VALUES,SCATTER_REVERSE);
646:   VecScatterEnd(scatter,xtmp,y,INSERT_VALUES,SCATTER_REVERSE);
647:   return(0);
648: }

650: static PetscErrorCode PCApplyRichardson_Telescope(PC pc,Vec x,Vec y,Vec w,PetscReal rtol,PetscReal abstol, PetscReal dtol,PetscInt its,PetscBool zeroguess,PetscInt *outits,PCRichardsonConvergedReason *reason)
651: {
652:   PC_Telescope      sred = (PC_Telescope)pc->data;
653:   PetscErrorCode    ierr;
654:   Vec               xtmp,yred;
655:   PetscInt          i,st,ed;
656:   VecScatter        scatter;
657:   const PetscScalar *x_array;
658:   PetscBool         default_init_guess_value;

661:   xtmp    = sred->xtmp;
662:   scatter = sred->scatter;
663:   yred    = sred->yred;

665:   if (its > 1) SETERRQ(PetscObjectComm((PetscObject)pc),PETSC_ERR_SUP,"PCApplyRichardson_Telescope only supports max_it = 1");
666:   *reason = (PCRichardsonConvergedReason)0;

668:   if (!zeroguess) {
669:     PetscInfo(pc,"PCTelescope: Scattering y for non-zero initial guess\n");
670:     /* pull in vector y->xtmp */
671:     VecScatterBegin(scatter,y,xtmp,INSERT_VALUES,SCATTER_FORWARD);
672:     VecScatterEnd(scatter,y,xtmp,INSERT_VALUES,SCATTER_FORWARD);

674:     /* copy vector entries into xred */
675:     VecGetArrayRead(xtmp,&x_array);
676:     if (yred) {
677:       PetscScalar *LA_yred;
678:       VecGetOwnershipRange(yred,&st,&ed);
679:       VecGetArray(yred,&LA_yred);
680:       for (i=0; i<ed-st; i++) {
681:         LA_yred[i] = x_array[i];
682:       }
683:       VecRestoreArray(yred,&LA_yred);
684:     }
685:     VecRestoreArrayRead(xtmp,&x_array);
686:   }

688:   if (PCTelescope_isActiveRank(sred)) {
689:     KSPGetInitialGuessNonzero(sred->ksp,&default_init_guess_value);
690:     if (!zeroguess) KSPSetInitialGuessNonzero(sred->ksp,PETSC_TRUE);
691:   }

693:   PCApply_Telescope(pc,x,y);

695:   if (PCTelescope_isActiveRank(sred)) {
696:     KSPSetInitialGuessNonzero(sred->ksp,default_init_guess_value);
697:   }

699:   if (!*reason) *reason = PCRICHARDSON_CONVERGED_ITS;
700:   *outits = 1;
701:   return(0);
702: }

704: static PetscErrorCode PCReset_Telescope(PC pc)
705: {
706:   PC_Telescope   sred = (PC_Telescope)pc->data;

709:   ISDestroy(&sred->isin);
710:   VecScatterDestroy(&sred->scatter);
711:   VecDestroy(&sred->xred);
712:   VecDestroy(&sred->yred);
713:   VecDestroy(&sred->xtmp);
714:   MatDestroy(&sred->Bred);
715:   KSPReset(sred->ksp);
716:   if (sred->pctelescope_reset_type) {
717:     sred->pctelescope_reset_type(pc);
718:   }
719:   return(0);
720: }

722: static PetscErrorCode PCDestroy_Telescope(PC pc)
723: {
724:   PC_Telescope   sred = (PC_Telescope)pc->data;

728:   PCReset_Telescope(pc);
729:   KSPDestroy(&sred->ksp);
730:   PetscSubcommDestroy(&sred->psubcomm);
731:   PetscFree(sred->dm_ctx);
732:   PetscFree(pc->data);
733:   return(0);
734: }

736: static PetscErrorCode PCSetFromOptions_Telescope(PetscOptionItems *PetscOptionsObject,PC pc)
737: {
738:   PC_Telescope     sred = (PC_Telescope)pc->data;
739:   PetscErrorCode   ierr;
740:   MPI_Comm         comm;
741:   PetscMPIInt      size;
742:   PetscBool        flg;
743:   PetscSubcommType subcommtype;

746:   PetscObjectGetComm((PetscObject)pc,&comm);
747:   MPI_Comm_size(comm,&size);
748:   PetscOptionsHead(PetscOptionsObject,"Telescope options");
749:   PetscOptionsEnum("-pc_telescope_subcomm_type","Subcomm type (interlaced or contiguous)","PCTelescopeSetSubcommType",PetscSubcommTypes,(PetscEnum)sred->subcommtype,(PetscEnum*)&subcommtype,&flg);
750:   if (flg) {
751:     PCTelescopeSetSubcommType(pc,subcommtype);
752:   }
753:   PetscOptionsInt("-pc_telescope_reduction_factor","Factor to reduce comm size by","PCTelescopeSetReductionFactor",sred->redfactor,&sred->redfactor,0);
754:   if (sred->redfactor > size) SETERRQ(comm,PETSC_ERR_ARG_WRONG,"-pc_telescope_reduction_factor <= comm size");
755:   PetscOptionsBool("-pc_telescope_ignore_dm","Ignore any DM attached to the PC","PCTelescopeSetIgnoreDM",sred->ignore_dm,&sred->ignore_dm,0);
756:   PetscOptionsBool("-pc_telescope_ignore_kspcomputeoperators","Ignore method used to compute A","PCTelescopeSetIgnoreKSPComputeOperators",sred->ignore_kspcomputeoperators,&sred->ignore_kspcomputeoperators,0);
757:   PetscOptionsBool("-pc_telescope_use_coarse_dm","Define sub-communicator from the coarse DM","PCTelescopeSetUseCoarseDM",sred->use_coarse_dm,&sred->use_coarse_dm,0);
758:   PetscOptionsTail();
759:   return(0);
760: }

 762: /* PC implementation-specific APIs */

764: static PetscErrorCode PCTelescopeGetKSP_Telescope(PC pc,KSP *ksp)
765: {
766:   PC_Telescope red = (PC_Telescope)pc->data;
768:   if (ksp) *ksp = red->ksp;
769:   return(0);
770: }

772: static PetscErrorCode PCTelescopeGetSubcommType_Telescope(PC pc,PetscSubcommType *subcommtype)
773: {
774:   PC_Telescope red = (PC_Telescope)pc->data;
776:   if (subcommtype) *subcommtype = red->subcommtype;
777:   return(0);
778: }

780: static PetscErrorCode PCTelescopeSetSubcommType_Telescope(PC pc,PetscSubcommType subcommtype)
781: {
782:   PC_Telescope     red = (PC_Telescope)pc->data;

785:   if (pc->setupcalled) SETERRQ(PetscObjectComm((PetscObject)pc),PETSC_ERR_ARG_WRONGSTATE,"You cannot change the subcommunicator type for PCTelescope after it has been set up.");
786:   red->subcommtype = subcommtype;
787:   return(0);
788: }

790: static PetscErrorCode PCTelescopeGetReductionFactor_Telescope(PC pc,PetscInt *fact)
791: {
792:   PC_Telescope red = (PC_Telescope)pc->data;
794:   if (fact) *fact = red->redfactor;
795:   return(0);
796: }

798: static PetscErrorCode PCTelescopeSetReductionFactor_Telescope(PC pc,PetscInt fact)
799: {
800:   PC_Telescope     red = (PC_Telescope)pc->data;
801:   PetscMPIInt      size;
802:   PetscErrorCode   ierr;

805:   MPI_Comm_size(PetscObjectComm((PetscObject)pc),&size);
806:   if (fact <= 0) SETERRQ1(PetscObjectComm((PetscObject)pc),PETSC_ERR_ARG_WRONG,"Reduction factor of telescoping PC %D must be positive",fact);
807:   if (fact > size) SETERRQ1(PetscObjectComm((PetscObject)pc),PETSC_ERR_ARG_WRONG,"Reduction factor of telescoping PC %D must be <= comm.size",fact);
808:   red->redfactor = fact;
809:   return(0);
810: }

812: static PetscErrorCode PCTelescopeGetIgnoreDM_Telescope(PC pc,PetscBool *v)
813: {
814:   PC_Telescope red = (PC_Telescope)pc->data;
816:   if (v) *v = red->ignore_dm;
817:   return(0);
818: }

820: static PetscErrorCode PCTelescopeSetIgnoreDM_Telescope(PC pc,PetscBool v)
821: {
822:   PC_Telescope red = (PC_Telescope)pc->data;
824:   red->ignore_dm = v;
825:   return(0);
826: }

828: static PetscErrorCode PCTelescopeGetUseCoarseDM_Telescope(PC pc,PetscBool *v)
829: {
830:   PC_Telescope red = (PC_Telescope)pc->data;
832:   if (v) *v = red->use_coarse_dm;
833:   return(0);
834: }

836: static PetscErrorCode PCTelescopeSetUseCoarseDM_Telescope(PC pc,PetscBool v)
837: {
838:   PC_Telescope red = (PC_Telescope)pc->data;
840:   red->use_coarse_dm = v;
841:   return(0);
842: }

844: static PetscErrorCode PCTelescopeGetIgnoreKSPComputeOperators_Telescope(PC pc,PetscBool *v)
845: {
846:   PC_Telescope red = (PC_Telescope)pc->data;
848:   if (v) *v = red->ignore_kspcomputeoperators;
849:   return(0);
850: }

852: static PetscErrorCode PCTelescopeSetIgnoreKSPComputeOperators_Telescope(PC pc,PetscBool v)
853: {
854:   PC_Telescope red = (PC_Telescope)pc->data;
856:   red->ignore_kspcomputeoperators = v;
857:   return(0);
858: }

860: static PetscErrorCode PCTelescopeGetDM_Telescope(PC pc,DM *dm)
861: {
862:   PC_Telescope red = (PC_Telescope)pc->data;
864:   *dm = private_PCTelescopeGetSubDM(red);
865:   return(0);
866: }

868: /*@
869:  PCTelescopeGetKSP - Gets the KSP created by the telescoping PC.

871:  Not Collective

873:  Input Parameter:
874: .  pc - the preconditioner context

876:  Output Parameter:
877: .  subksp - the KSP defined on the smaller set of processes

879:  Level: advanced

881: @*/
882: PetscErrorCode PCTelescopeGetKSP(PC pc,KSP *subksp)
883: {
886:   PetscUseMethod(pc,"PCTelescopeGetKSP_C",(PC,KSP*),(pc,subksp));
887:   return(0);
888: }

890: /*@
891:  PCTelescopeGetReductionFactor - Gets the factor by which the original number of processes has been reduced.

893:  Not Collective

895:  Input Parameter:
896: .  pc - the preconditioner context

898:  Output Parameter:
899: .  fact - the reduction factor

901:  Level: advanced

903: @*/
904: PetscErrorCode PCTelescopeGetReductionFactor(PC pc,PetscInt *fact)
905: {
908:   PetscUseMethod(pc,"PCTelescopeGetReductionFactor_C",(PC,PetscInt*),(pc,fact));
909:   return(0);
910: }

912: /*@
913:  PCTelescopeSetReductionFactor - Sets the factor by which the original number of processes will be reduced.

915:  Not Collective

917:  Input Parameters:
918: +  pc - the preconditioner context
919: -  fact - the reduction factor

923:  Level: advanced

925: @*/
926: PetscErrorCode PCTelescopeSetReductionFactor(PC pc,PetscInt fact)
927: {
930:   PetscTryMethod(pc,"PCTelescopeSetReductionFactor_C",(PC,PetscInt),(pc,fact));
931:   return(0);
932: }

934: /*@
935:  PCTelescopeGetIgnoreDM - Get the flag indicating if any DM attached to the PC will be used.

937:  Not Collective

939:  Input Parameter:
940: .  pc - the preconditioner context

942:  Output Parameter:
943: .  v - the flag

945:  Level: advanced

947: @*/
948: PetscErrorCode PCTelescopeGetIgnoreDM(PC pc,PetscBool *v)
949: {
952:   PetscUseMethod(pc,"PCTelescopeGetIgnoreDM_C",(PC,PetscBool*),(pc,v));
953:   return(0);
954: }

956: /*@
957:  PCTelescopeSetIgnoreDM - Set a flag to ignore any DM attached to the PC.

959:  Not Collective

961:  Input Parameters:
962: +  pc - the preconditioner context
963: -  v - Use PETSC_TRUE to ignore any DM

967:  Level: advanced

969: @*/
970: PetscErrorCode PCTelescopeSetIgnoreDM(PC pc,PetscBool v)
971: {
974:   PetscTryMethod(pc,"PCTelescopeSetIgnoreDM_C",(PC,PetscBool),(pc,v));
975:   return(0);
976: }

978: /*@
979:  PCTelescopeGetUseCoarseDM - Get the flag indicating if the coarse DM attached to DM associated with the PC will be used.

981:  Not Collective

983:  Input Parameter:
984: .  pc - the preconditioner context

986:  Output Parameter:
987: .  v - the flag

989:  Level: advanced

991: @*/
992: PetscErrorCode PCTelescopeGetUseCoarseDM(PC pc,PetscBool *v)
993: {
996:   PetscUseMethod(pc,"PCTelescopeGetUseCoarseDM_C",(PC,PetscBool*),(pc,v));
997:   return(0);
998: }

1000: /*@
1001:  PCTelescopeSetUseCoarseDM - Set a flag to query the DM attached to the PC if it also has a coarse DM

1003:  Not Collective

1005:  Input Parameters:
1006: +  pc - the preconditioner context
1007: -  v - Use PETSC_FALSE to ignore any coarse DM

1011:  Notes:
1012:  When you have specified to use a coarse DM, the communicator used to create the sub-KSP within PCTelescope
1013:  will be that of the coarse DM. Hence the flags -pc_telescope_reduction_factor and
1014:  -pc_telescope_subcomm_type will no longer have any meaning.
1015:  It is required that the communicator associated with the parent (fine) and the coarse DM are of different sizes.
1016:  An error will occur if the size of the communicator associated with the coarse DM
1017:  is the same as that of the parent DM.
1018:  Furthermore, it is required that the communicator on the coarse DM is a sub-communicator of the parent.
1019:  This will be checked at the time the preconditioner is setup and an error will occur if
1020:  the coarse DM does not define a sub-communicator of that used by the parent DM.

1022:  The particular Telescope setup invoked when using a coarse DM is agnostic with respect to the type of
1023:  the DM used (e.g. it supports DMSHELL, DMPLEX, etc).

1025:  Support is currently only provided for the case when you are using KSPSetComputeOperators()

1027:  The user is required to compose a function with the parent DM to facilitate the transfer of fields (Vec) between the different decompositions defined by the fine and coarse DMs.
1028:  In the user code, this is achieved via
1029: .vb
1030:    {
1031:      DM dm_fine;
1032:      PetscObjectCompose((PetscObject)dm_fine,"PCTelescopeFieldScatter",your_field_scatter_method);
1033:    }
1034: .ve
1035:  The signature of the user provided field scatter method is
1036: .vb
1037:    PetscErrorCode your_field_scatter_method(DM dm_fine,Vec x_fine,ScatterMode mode,DM dm_coarse,Vec x_coarse);
1038: .ve
1039:  The user must provide support for both mode = SCATTER_FORWARD and mode = SCATTER_REVERSE.
1040:  SCATTER_FORWARD implies the direction of transfer is from the parent (fine) DM to the coarse DM.

1042:  Optionally, the user may also compose a function with the parent DM to facilitate the transfer
1043:  of state variables between the fine and coarse DMs.
1044:  In the context of a finite element discretization, an example state variable might be
1045:  values associated with quadrature points within each element.
1046:  A user provided state scatter method is composed via
1047: .vb
1048:    {
1049:      DM dm_fine;
1050:      PetscObjectCompose((PetscObject)dm_fine,"PCTelescopeStateScatter",your_state_scatter_method);
1051:    }
1052: .ve
1053:  The signature of the user provided state scatter method is
1054: .vb
1055:    PetscErrorCode your_state_scatter_method(DM dm_fine,ScatterMode mode,DM dm_coarse);
1056: .ve
1057:  SCATTER_FORWARD implies the direction of transfer is from the fine DM to the coarse DM.
1058:  The user is only required to support mode = SCATTER_FORWARD.
1059:  No assumption is made about the data type of the state variables.
1060:  These must be managed by the user and must be accessible from the DM.

1062:  Care must be taken in defining the user context passed to KSPSetComputeOperators() which is to be
1063:  associated with the sub-KSP residing within PCTelescope.
1064:  In general, PCTelescope assumes that the context on the fine and coarse DM used with
1065:  KSPSetComputeOperators() should be "similar" in type or origin.
1066:  Specifically the following rules are used to infer what context on the sub-KSP should be.

1068:  First the contexts from the KSP and the fine and coarse DMs are retrieved.
1069:  Note that the special case of a DMSHELL context is queried.

1071: .vb
1072:    DMKSPGetComputeOperators(dm_fine,&dmfine_kspfunc,&dmfine_kspctx);
1073:    DMGetApplicationContext(dm_fine,&dmfine_appctx);
1074:    DMShellGetContext(dm_fine,&dmfine_shellctx);

1076:    DMGetApplicationContext(dm_coarse,&dmcoarse_appctx);
1077:    DMShellGetContext(dm_coarse,&dmcoarse_shellctx);
1078: .ve

1080:  The following rules are then enforced:

1082:  1. If dmfine_kspctx = NULL, then we provide a NULL pointer as the context for the sub-KSP:
1083:  KSPSetComputeOperators(sub_ksp,dmfine_kspfunc,NULL);

1085:  2. If dmfine_kspctx != NULL and dmfine_kspctx == dmfine_appctx,
1086:  check that dmcoarse_appctx is also non-NULL. If this is true, then:
1087:  KSPSetComputeOperators(sub_ksp,dmfine_kspfunc,dmcoarse_appctx);

1089:  3. If dmfine_kspctx != NULL and dmfine_kspctx == dmfine_shellctx,
1090:  check that dmcoarse_shellctx is also non-NULL. If this is true, then:
1091:  KSPSetComputeOperators(sub_ksp,dmfine_kspfunc,dmcoarse_shellctx);

1093:  If none of the above three tests passed, then PCTelescope cannot safely determine what
1094:  context should be provided to KSPSetComputeOperators() for use with the sub-KSP.
1095:  In this case, an additional mechanism is provided via a composed function which will return
1096:  the actual context to be used. To use this feature you must compose the "getter" function
1097:  with the coarse DM, e.g.
1098: .vb
1099:    {
1100:      DM dm_coarse;
1101:      PetscObjectCompose((PetscObject)dm_coarse,"PCTelescopeGetCoarseDMKSPContext",your_coarse_context_getter);
1102:    }
1103: .ve
1104:  The signature of the user provided method is
1105: .vb
1106:    PetscErrorCode your_coarse_context_getter(DM dm_coarse,void **your_kspcontext);
1107: .ve

1109:  Level: advanced

1111: @*/
1112: PetscErrorCode PCTelescopeSetUseCoarseDM(PC pc,PetscBool v)
1113: {
1116:   PetscTryMethod(pc,"PCTelescopeSetUseCoarseDM_C",(PC,PetscBool),(pc,v));
1117:   return(0);
1118: }

1120: /*@
1121:  PCTelescopeGetIgnoreKSPComputeOperators - Get the flag indicating if KSPComputeOperators will be used.

1123:  Not Collective

1125:  Input Parameter:
1126: .  pc - the preconditioner context

1128:  Output Parameter:
1129: .  v - the flag

1131:  Level: advanced

1133: @*/
1134: PetscErrorCode PCTelescopeGetIgnoreKSPComputeOperators(PC pc,PetscBool *v)
1135: {
1138:   PetscUseMethod(pc,"PCTelescopeGetIgnoreKSPComputeOperators_C",(PC,PetscBool*),(pc,v));
1139:   return(0);
1140: }

1142: /*@
1143:  PCTelescopeSetIgnoreKSPComputeOperators - Set a flag to ignore KSPComputeOperators.

1145:  Not Collective

1147:  Input Parameters:
1148: +  pc - the preconditioner context
1149: -  v - Use PETSC_TRUE to ignore the method (if defined) set via KSPSetComputeOperators on pc

1153:  Level: advanced

1155: @*/
1156: PetscErrorCode PCTelescopeSetIgnoreKSPComputeOperators(PC pc,PetscBool v)
1157: {
1160:   PetscTryMethod(pc,"PCTelescopeSetIgnoreKSPComputeOperators_C",(PC,PetscBool),(pc,v));
1161:   return(0);
1162: }

1164: /*@
1165:  PCTelescopeGetDM - Get the re-partitioned DM attached to the sub KSP.

1167:  Not Collective

1169:  Input Parameter:
1170: .  pc - the preconditioner context

1172:  Output Parameter:
1173: .  subdm - The re-partitioned DM

1175:  Level: advanced

1177: @*/
1178: PetscErrorCode PCTelescopeGetDM(PC pc,DM *subdm)
1179: {
1182:   PetscUseMethod(pc,"PCTelescopeGetDM_C",(PC,DM*),(pc,subdm));
1183:   return(0);
1184: }

1186: /*@
1187:  PCTelescopeSetSubcommType - set subcommunicator type (interlaced or contiguous)

1189:  Logically Collective

1191:  Input Parameters:
1192: +  pc - the preconditioner context
1193: -  subcommtype - the subcommunicator type (see PetscSubcommType)

1195:  Level: advanced

1197: .seealso: PetscSubcommType, PetscSubcomm, PCTELESCOPE
1198: @*/
1199: PetscErrorCode PCTelescopeSetSubcommType(PC pc, PetscSubcommType subcommtype)
1200: {
1203:   PetscTryMethod(pc,"PCTelescopeSetSubcommType_C",(PC,PetscSubcommType),(pc,subcommtype));
1204:   return(0);
1205: }

1207: /*@
1208:  PCTelescopeGetSubcommType - Get the subcommunicator type (interlaced or contiguous)

1210:  Not Collective

1212:  Input Parameter:
1213: .  pc - the preconditioner context

1215:  Output Parameter:
1216: .  subcommtype - the subcommunicator type (see PetscSubcommType)

1218:  Level: advanced

1220: .seealso: PetscSubcomm, PetscSubcommType, PCTELESCOPE
1221: @*/
1222: PetscErrorCode PCTelescopeGetSubcommType(PC pc, PetscSubcommType *subcommtype)
1223: {
1226:   PetscUseMethod(pc,"PCTelescopeGetSubcommType_C",(PC,PetscSubcommType*),(pc,subcommtype));
1227:   return(0);
1228: }

1230: /* -------------------------------------------------------------------------------------*/
1231: /*MC
1232:    PCTELESCOPE - Runs a KSP solver on a sub-communicator. MPI ranks not in the sub-communicator are idle during the solve.

1234:    Options Database:
1235: +  -pc_telescope_reduction_factor <r> - factor to reduce the communicator size by. e.g. with 64 MPI ranks and r=4, the new sub-communicator will have 64/4 = 16 ranks.
1236: .  -pc_telescope_ignore_dm  - flag to indicate whether an attached DM should be ignored.
1237: .  -pc_telescope_subcomm_type <interlaced,contiguous> - defines the selection of MPI ranks on the sub-communicator. see PetscSubcomm for more information.
1238: .  -pc_telescope_ignore_kspcomputeoperators - flag to indicate whether KSPSetComputeOperators should be used on the sub-KSP.
1239: -  -pc_telescope_use_coarse_dm - flag to indicate whether the coarse DM should be used to define the sub-communicator.

1241:    Level: advanced

1243:    Notes:
1244:    Assuming that the parent preconditioner (PC) is defined on a communicator c, this implementation
1245:    creates a child sub-communicator (c') containing fewer MPI ranks than the original parent preconditioner (PC).
1246:    The preconditioner is deemed telescopic as it only calls KSPSolve() on a single
1247:    sub-communicator, in contrast with PCREDUNDANT which calls KSPSolve() on N sub-communicators.
1248:    This means there will be MPI ranks which will be idle during the application of this preconditioner.
1249:    Additionally, in comparison with PCREDUNDANT, PCTELESCOPE can utilize an attached DM.

1251:    The default type of the sub KSP (the KSP defined on c') is PREONLY.

1253:    There are three setup mechanisms for PCTelescope. Features supported by each type are described below.
1254:    In the following, we will refer to the operators B and B', these are the Bmat provided to the KSP on the
1255:    communicators c and c' respectively.

1257:    [1] Default setup
1258:    The sub-communicator c' is created via PetscSubcommCreate().
1259:    Explicitly defined nullspace and near nullspace vectors will be propagated from B to B'.
1260:    Currently there is no support for defining nullspaces via a user supplied method (e.g. as passed to MatNullSpaceSetFunction()).
1261:    No support is provided for KSPSetComputeOperators().
1262:    Currently there is no support for the flag -pc_use_amat.

1264:    [2] DM aware setup
1265:    If a DM is attached to the PC, it is re-partitioned on the sub-communicator c'.
1266:    c' is created via PetscSubcommCreate().
1267:    Both the Bmat operator and the right hand side vector are permuted into the new DOF ordering defined by the re-partitioned DM.
1268:    Currently only support for re-partitioning a DMDA is provided.
1269:    Any explicitly defined nullspace or near nullspace vectors attached to the original Bmat operator (B) are extracted, re-partitioned and set on the re-partitioned Bmat operator (B').
1270:    Currently there is no support for defining nullspaces via a user supplied method (e.g. as passed to MatNullSpaceSetFunction()).
1271:    Support is provided for KSPSetComputeOperators(). The user provided function and context is propagated to the sub KSP.
1272:    This is fragile since the user must ensure that their user context is valid for use on c'.
1273:    Currently there is no support for the flag -pc_use_amat.

1275:    [3] Coarse DM setup
1276:    If a DM (dmfine) is attached to the PC, dmfine is queried for a "coarse" DM (call this dmcoarse) via DMGetCoarseDM().
1277:    PCTELESCOPE will interpret the coarse DM as being defined on a sub-communicator of c.
1278:    The communicator associated with dmcoarse will define the c' to be used within PCTELESCOPE.
1279:    PCTELESCOPE will check that c' is in fact a sub-communicator of c. If it is not, an error will be reported.
1280:    The intention of this setup type is that PCTELESCOPE will use an existing (e.g. user defined) communicator hierarchy, say as would be
1281:    available with using multi-grid on unstructured meshes.
1282:    This setup will not use the command line options -pc_telescope_reduction_factor or -pc_telescope_subcomm_type.
1283:    Any explicitly defined nullspace or near nullspace vectors attached to the original Bmat operator (B) are extracted, scattered into the correct ordering consistent with dmcoarse and set on B'.
1284:    Currently there is no support for defining nullspaces via a user supplied method (e.g. as passed to MatNullSpaceSetFunction()).
1285:    There is no general method to permute field orderings, hence only KSPSetComputeOperators() is supported.
1286:    The user must use PetscObjectComposeFunction() with dmfine to define the method to scatter fields from dmfine to dmcoarse.
1287:    Propagation of the user context for KSPSetComputeOperators() on the sub KSP is attempted by querying the DM contexts associated with dmfine and dmcoarse. Alternatively, the user may use PetscObjectComposeFunction() with dmcoarse to define a method which will return the appropriate user context for KSPSetComputeOperators().
1288:    Currently there is no support for the flag -pc_use_amat.
1289:    This setup can be invoked by the option -pc_telescope_use_coarse_dm or by calling PCTelescopeSetUseCoarseDM(pc,PETSC_TRUE);
1290:    Further information about the user-provided methods required by this setup type is described in PCTelescopeSetUseCoarseDM().

1292:    Developer Notes:
1293:    During PCSetup, the B operator is scattered onto c'.
1294:    Within PCApply, the RHS vector (x) is scattered into a redundant vector, xred (defined on c').
1295:    Then, KSPSolve() is executed on the c' communicator.

1297:    The communicator used within the telescoping preconditioner is defined by a PetscSubcomm using the INTERLACED 
1298:    creation routine by default (this can be changed with -pc_telescope_subcomm_type). We run the sub KSP on only the ranks within the communicator which have a color equal to zero.

1300:    The telescoping preconditioner is aware of nullspaces and near nullspaces which are attached to the B operator.
1301:    In the case where B has a (near) nullspace attached, the (near) nullspace vectors are extracted from B and mapped into
1302:    a new (near) nullspace, defined on the sub-communicator, which is attached to B' (the B operator which was scattered to c')

1304:    The telescoping preconditioner can re-partition an attached DM if it is a DMDA (2D or 3D -
1305:    support for 1D DMDAs is not provided). If a DMDA is found, a topologically equivalent DMDA is created on c'
1306:    and this new DM is attached to the sub KSP. The design of telescope is such that it should be possible to extend support
1307:    for re-partitioning to other DMs (e.g. DMPLEX). The user can supply a flag to ignore attached DMs.
1308:    Alternatively, user-provided re-partitioned DMs can be used via -pc_telescope_use_coarse_dm.

1310:    With the default setup mode, B' is defined by fusing rows (in order) associated with MPI ranks common to c and c'.

1312:    When a DMDA is attached to the parent preconditioner, B' is defined by: (i) performing a symmetric permutation of B
1313:    into the ordering defined by the DMDA on c', (ii) extracting the local chunks via MatCreateSubMatrices(), (iii) fusing the
1314:    local (sequential) matrices defined on the ranks common to c and c' into B' using MatCreateMPIMatConcatenateSeqMat()

1316:    Limitations/improvements include the following.
1317:    VecPlaceArray() could be used within PCApply() to improve efficiency and reduce memory usage.
1318:    A unified mechanism to query for user contexts as required by KSPSetComputeOperators() and MatNullSpaceSetFunction().

1320:    The symmetric permutation used when a DMDA is encountered is performed via explicitly assembling a permutation matrix P,
1321:    and performing P^T.A.P. Possibly it might be more efficient to use MatPermute(). We opted to use P^T.A.P as it appears
1322:    VecPermute() does not provide support for the use case required here. By computing P, one can permute both the operator and RHS in a
1323:    consistent manner.

1325:    Mapping of vectors (default setup mode) is performed in the following way.
1326:    Suppose the parent communicator size was 4, and we set a reduction factor of 2; this would give a comm size on c' of 2.
1327:    Using the interlaced creation routine, the ranks in c with color = 0 will be rank 0 and 2.
1328:    We perform the scatter to the sub-communicator in the following way.
1329:    [1] Given a vector x defined on communicator c

1331: .vb
1332:    rank(c)  local values of x
1333:    ------- ----------------------------------------
1334:         0   [  0.0,  1.0,  2.0,  3.0,  4.0,  5.0 ]
1335:         1   [  6.0,  7.0,  8.0,  9.0, 10.0, 11.0 ]
1336:         2   [ 12.0, 13.0, 14.0, 15.0, 16.0, 17.0 ]
1337:         3   [ 18.0, 19.0, 20.0, 21.0, 22.0, 23.0 ]
1338: .ve

1340:    scatter into xtmp defined also on comm c, so that we have the following values

1342: .vb
1343:    rank(c)  local values of xtmp
1344:    ------- ----------------------------------------------------------------------------
1345:         0   [  0.0,  1.0,  2.0,  3.0,  4.0,  5.0,  6.0,  7.0,  8.0,  9.0, 10.0, 11.0 ]
1346:         1   [ ]
1347:         2   [ 12.0, 13.0, 14.0, 15.0, 16.0, 17.0, 18.0, 19.0, 20.0, 21.0, 22.0, 23.0 ]
1348:         3   [ ]
1349: .ve

1351:    The entries on rank 1 and 3 (ranks which do not have a color = 0 in c') have no values


1354:    [2] Copy the values from ranks 0, 2 (indices with respect to comm c) into the vector xred which is defined on communicator c'.
1355:    Ranks 0 and 2 are the only ranks in the subcomm which have a color = 0.

1357: .vb
1358:    rank(c')  local values of xred
1359:    -------- ----------------------------------------------------------------------------
1360:          0   [  0.0,  1.0,  2.0,  3.0,  4.0,  5.0,  6.0,  7.0,  8.0,  9.0, 10.0, 11.0 ]
1361:          1   [ 12.0, 13.0, 14.0, 15.0, 16.0, 17.0, 18.0, 19.0, 20.0, 21.0, 22.0, 23.0 ]
1362: .ve

1364:   Contributed by Dave May

1366:   Reference:
1367:   Dave A. May, Patrick Sanan, Karl Rupp, Matthew G. Knepley, and Barry F. Smith, "Extreme-Scale Multigrid Components within PETSc". 2016. In Proceedings of the Platform for Advanced Scientific Computing Conference (PASC '16). DOI: 10.1145/2929908.2929913

1369: .seealso:  PCTelescopeGetKSP(), PCTelescopeGetDM(), PCTelescopeGetReductionFactor(), PCTelescopeSetReductionFactor(), PCTelescopeGetIgnoreDM(), PCTelescopeSetIgnoreDM(), PCREDUNDANT
1370: M*/
1371: PETSC_EXTERN PetscErrorCode PCCreate_Telescope(PC pc)
1372: {
1373:   PetscErrorCode       ierr;
1374:   struct _PC_Telescope *sred;

1377:   PetscNewLog(pc,&sred);
1378:   sred->psubcomm       = NULL;
1379:   sred->subcommtype    = PETSC_SUBCOMM_INTERLACED;
1380:   sred->subcomm        = MPI_COMM_NULL;
1381:   sred->redfactor      = 1;
1382:   sred->ignore_dm      = PETSC_FALSE;
1383:   sred->ignore_kspcomputeoperators = PETSC_FALSE;
1384:   sred->use_coarse_dm  = PETSC_FALSE;
1385:   pc->data             = (void*)sred;

1387:   pc->ops->apply           = PCApply_Telescope;
1388:   pc->ops->applytranspose  = NULL;
1389:   pc->ops->applyrichardson = PCApplyRichardson_Telescope;
1390:   pc->ops->setup           = PCSetUp_Telescope;
1391:   pc->ops->destroy         = PCDestroy_Telescope;
1392:   pc->ops->reset           = PCReset_Telescope;
1393:   pc->ops->setfromoptions  = PCSetFromOptions_Telescope;
1394:   pc->ops->view            = PCView_Telescope;

1396:   sred->pctelescope_setup_type              = PCTelescopeSetUp_default;
1397:   sred->pctelescope_matcreate_type          = PCTelescopeMatCreate_default;
1398:   sred->pctelescope_matnullspacecreate_type = PCTelescopeMatNullSpaceCreate_default;
1399:   sred->pctelescope_reset_type              = NULL;

1401:   PetscObjectComposeFunction((PetscObject)pc,"PCTelescopeGetKSP_C",PCTelescopeGetKSP_Telescope);
1402:   PetscObjectComposeFunction((PetscObject)pc,"PCTelescopeGetSubcommType_C",PCTelescopeGetSubcommType_Telescope);
1403:   PetscObjectComposeFunction((PetscObject)pc,"PCTelescopeSetSubcommType_C",PCTelescopeSetSubcommType_Telescope);
1404:   PetscObjectComposeFunction((PetscObject)pc,"PCTelescopeGetReductionFactor_C",PCTelescopeGetReductionFactor_Telescope);
1405:   PetscObjectComposeFunction((PetscObject)pc,"PCTelescopeSetReductionFactor_C",PCTelescopeSetReductionFactor_Telescope);
1406:   PetscObjectComposeFunction((PetscObject)pc,"PCTelescopeGetIgnoreDM_C",PCTelescopeGetIgnoreDM_Telescope);
1407:   PetscObjectComposeFunction((PetscObject)pc,"PCTelescopeSetIgnoreDM_C",PCTelescopeSetIgnoreDM_Telescope);
1408:   PetscObjectComposeFunction((PetscObject)pc,"PCTelescopeGetIgnoreKSPComputeOperators_C",PCTelescopeGetIgnoreKSPComputeOperators_Telescope);
1409:   PetscObjectComposeFunction((PetscObject)pc,"PCTelescopeSetIgnoreKSPComputeOperators_C",PCTelescopeSetIgnoreKSPComputeOperators_Telescope);
1410:   PetscObjectComposeFunction((PetscObject)pc,"PCTelescopeGetDM_C",PCTelescopeGetDM_Telescope);
1411:   PetscObjectComposeFunction((PetscObject)pc,"PCTelescopeGetUseCoarseDM_C",PCTelescopeGetUseCoarseDM_Telescope);
1412:   PetscObjectComposeFunction((PetscObject)pc,"PCTelescopeSetUseCoarseDM_C",PCTelescopeSetUseCoarseDM_Telescope);
1413:   return(0);
1414: }