Actual source code: init.c

petsc-master 2018-02-24
Report Typos and Errors
  1: /*

  3:    This file defines part of the initialization of PETSc

  5:   This file uses regular malloc and free because it cannot know
  6:   what malloc is being used until it has already processed the input.
  7: */

  9:  #include <petscsys.h>
 10:  #include <petsc/private/petscimpl.h>
 11:  #include <petscvalgrind.h>
 12:  #include <petscviewer.h>

 14: #if defined(PETSC_HAVE_SYS_SYSINFO_H)
 15: #include <sys/sysinfo.h>
 16: #endif
 17: #if defined(PETSC_HAVE_UNISTD_H)
 18: #include <unistd.h>
 19: #endif
 20: #if defined(PETSC_HAVE_CUDA)
 21: #include <cuda_runtime.h>
 22: #endif

 24: #if defined(PETSC_HAVE_VIENNACL)
 25: PETSC_EXTERN PetscErrorCode PetscViennaCLInit(); /* defined outside this file section; called at the end of PetscOptionsCheckInitial_Private() */
 26: #endif

 28: /* ------------------------Nasty global variables -------------------------------*/
 29: /*
 30:      Indicates if PETSc started up MPI, or it was
 31:    already started before PETSc was initialized.
 32: */
 33: PetscBool   PetscBeganMPI         = PETSC_FALSE;
 34: PetscBool   PetscInitializeCalled = PETSC_FALSE; /* presumably set by PetscInitialize(); not modified in this part of the file - confirm */
 35: PetscBool   PetscFinalizeCalled   = PETSC_FALSE; /* presumably set by PetscFinalize(); not modified in this part of the file - confirm */
 36: PetscBool   PetscCUDAInitialized  = PETSC_FALSE; /* set to PETSC_TRUE by PetscOptionsCheckInitial_Private() once the CUDA device has been selected */

 38: PetscMPIInt PetscGlobalRank       = -1; /* -1 until assigned; the assignment is not in this part of the file */
 39: PetscMPIInt PetscGlobalSize       = -1; /* -1 until assigned; the assignment is not in this part of the file */

 41: #if defined(PETSC_HAVE_COMPLEX)
 42: #if defined(PETSC_COMPLEX_INSTANTIATE)
 43: template <> class std::complex<double>; /* instantiate complex template class */
 44: #endif
 45: #if !defined(PETSC_HAVE_MPI_C_DOUBLE_COMPLEX)
 46: MPI_Datatype MPIU_C_DOUBLE_COMPLEX; /* defined here only when the MPI implementation lacks MPI_C_DOUBLE_COMPLEX (see the guard above) */
 47: MPI_Datatype MPIU_C_COMPLEX;
 48: #endif

 50: /*MC
 51:    PETSC_i - the imaginary number i

 53:    Synopsis:
 54:    #include <petscsys.h>
 55:    PetscComplex PETSC_i;

 57:    Level: beginner

 59:    Note:
 60:    Complex numbers are automatically available if PETSc located a working complex implementation

 62: .seealso: PetscRealPart(), PetscImaginaryPart(), PetscRealPartComplex(), PetscImaginaryPartComplex()
 63: M*/
 64: PetscComplex PETSC_i;
 65: #endif
 66: #if defined(PETSC_USE_REAL___FLOAT128)
 67: MPI_Datatype MPIU___FLOAT128 = 0; /* 0 until the datatype is created; creation is not in this part of the file */
 68: #if defined(PETSC_HAVE_COMPLEX)
 69: MPI_Datatype MPIU___COMPLEX128 = 0;
 70: #endif
 71: #elif defined(PETSC_USE_REAL___FP16)
 72: MPI_Datatype MPIU___FP16 = 0;
 73: #endif
 74: MPI_Datatype MPIU_2SCALAR = 0;
 75: #if defined(PETSC_USE_64BIT_INDICES) || !defined(MPI_2INT)
 76: MPI_Datatype MPIU_2INT = 0; /* only defined for 64 bit indices or when MPI supplies no MPI_2INT (see the guard above) */
 77: #endif
 78: MPI_Datatype MPIU_BOOL;
 79: MPI_Datatype MPIU_ENUM;

 81: /*
 82:        Function that is called to display all error messages
 83: */
 84: PetscErrorCode (*PetscErrorPrintf)(const char [],...)          = PetscErrorPrintfDefault;
 85: PetscErrorCode (*PetscHelpPrintf)(MPI_Comm,const char [],...)  = PetscHelpPrintfDefault; /* used below to print the version and -help text */
 86: #if defined(PETSC_HAVE_MATLAB_ENGINE)
 87: PetscErrorCode (*PetscVFPrintf)(FILE*,const char[],va_list)    = PetscVFPrintf_Matlab; /* default differs when the MATLAB engine is configured */
 88: #else
 89: PetscErrorCode (*PetscVFPrintf)(FILE*,const char[],va_list)    = PetscVFPrintfDefault;
 90: #endif
 91: /*
 92:   This is needed to turn on/off GPU synchronization
      These flags are assigned in PetscOptionsCheckInitial_Private(): each defaults to
      true when -log_summary or -log_view is given and can be overridden with
      -cusp_synchronize, -viennacl_synchronize or -cuda_synchronize respectively.
 93: */
 94: PetscBool PetscCUSPSynchronize = PETSC_FALSE;
 95: PetscBool PetscViennaCLSynchronize = PETSC_FALSE;
 96: PetscBool PetscCUDASynchronize = PETSC_FALSE;

 98: /* ------------------------------------------------------------------------------*/
 99: /*
100:    Optional file where all PETSc output from various prints is saved
       It is opened through PetscOpenHistoryFile() when the -history option is given
       (see PetscOptionsCheckInitial_Private()) and stays NULL otherwise.
101: */
102: FILE *petsc_history = NULL;

104: PetscErrorCode  PetscOpenHistoryFile(const char filename[],FILE **fd)
105: {
107:   PetscMPIInt    rank,size;
108:   char           pfile[PETSC_MAX_PATH_LEN],pname[PETSC_MAX_PATH_LEN],fname[PETSC_MAX_PATH_LEN],date[64];
109:   char           version[256];

112:   MPI_Comm_rank(PETSC_COMM_WORLD,&rank);
113:   if (!rank) {
114:     char        arch[10];
115:     int         err;

117:     PetscGetArchType(arch,10);
118:     PetscGetDate(date,64);
119:     PetscGetVersion(version,256);
120:     MPI_Comm_size(PETSC_COMM_WORLD,&size);
121:     if (filename) {
122:       PetscFixFilename(filename,fname);
123:     } else {
124:       PetscGetHomeDirectory(pfile,240);
125:       PetscStrcat(pfile,"/.petschistory");
126:       PetscFixFilename(pfile,fname);
127:     }

129:     *fd = fopen(fname,"a");
130:     if (!fd) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_FILE_OPEN,"Cannot open file: %s",fname);

132:     PetscFPrintf(PETSC_COMM_SELF,*fd,"---------------------------------------------------------\n");
133:     PetscFPrintf(PETSC_COMM_SELF,*fd,"%s %s\n",version,date);
134:     PetscGetProgramName(pname,PETSC_MAX_PATH_LEN);
135:     PetscFPrintf(PETSC_COMM_SELF,*fd,"%s on a %s, %d proc. with options:\n",pname,arch,size);
136:     PetscFPrintf(PETSC_COMM_SELF,*fd,"---------------------------------------------------------\n");

138:     err = fflush(*fd);
139:     if (err) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SYS,"fflush() failed on file");
140:   }
141:   return(0);
142: }

144: PetscErrorCode  PetscCloseHistoryFile(FILE **fd)
145: {
147:   PetscMPIInt    rank;
148:   char           date[64];
149:   int            err;

152:   MPI_Comm_rank(PETSC_COMM_WORLD,&rank);
153:   if (!rank) {
154:     PetscGetDate(date,64);
155:     PetscFPrintf(PETSC_COMM_SELF,*fd,"---------------------------------------------------------\n");
156:     PetscFPrintf(PETSC_COMM_SELF,*fd,"Finished at %s\n",date);
157:     PetscFPrintf(PETSC_COMM_SELF,*fd,"---------------------------------------------------------\n");
158:     err  = fflush(*fd);
159:     if (err) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SYS,"fflush() failed on file");
160:     err = fclose(*fd);
161:     if (err) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SYS,"fclose() failed on file");
162:   }
163:   return(0);
164: }

166: /* ------------------------------------------------------------------------------*/

168: /*
169:    This is ugly and probably belongs somewhere else, but I want to
170:   be able to put a true MPI abort error handler with command line args.

172:     This is so MPI errors in the debugger will leave all the stack
173:   frames. The default MPI_Abort() cleans up and exits, thus providing no useful information
174:   in the debugger hence we call abort() instead of MPI_Abort().
175: */

177: void Petsc_MPI_AbortOnError(MPI_Comm *comm,PetscMPIInt *flag)
178: {
180:   (*PetscErrorPrintf)("MPI error %d\n",*flag);
181:   abort();
182: }

184: void Petsc_MPI_DebuggerOnError(MPI_Comm *comm,PetscMPIInt *flag)
185: {

189:   (*PetscErrorPrintf)("MPI error %d\n",*flag);
190:   PetscAttachDebugger();
191:   if (ierr) MPI_Abort(*comm,*flag); /* hopeless so get out */
192: }

194: /*@C
195:    PetscEnd - Calls PetscFinalize() and then ends the program. This is useful if one
196:      wishes a clean exit somewhere deep in the program.

198:    Collective on PETSC_COMM_WORLD

200:    Options Database Keys are the same as for PetscFinalize()

202:    Level: advanced

204:    Note:
205:    See PetscInitialize() for more general runtime options.

207: .seealso: PetscInitialize(), PetscOptionsView(), PetscMallocDump(), PetscMPIDump(), PetscFinalize()
208: @*/
209: PetscErrorCode  PetscEnd(void)
210: {
212:   PetscFinalize();
213:   exit(0);
214:   return 0;
215: }

217: PetscBool PetscOptionsPublish = PETSC_FALSE; /* set from the -saws_options option in PetscOptionsCheckInitial_Private() */
218: extern PetscErrorCode PetscSetUseTrMalloc_Private(void);
219: extern PetscErrorCode PetscSetUseHBWMalloc_Private(void);
220: extern PetscBool      petscsetmallocvisited; /* tested below before a different malloc implementation is selected */
221: static char           emacsmachinename[256]; /* receives the -on_error_emacs value and is passed as context to PetscEmacsClientErrorHandler; file scope presumably so the pointer stays valid - confirm */

/* Optional hooks installed with PetscSetHelpVersionFunctions(); when non-null they are
   called before PETSc prints its own version banner / help text. */
223: PetscErrorCode (*PetscExternalVersionFunction)(MPI_Comm) = 0;
224: PetscErrorCode (*PetscExternalHelpFunction)(MPI_Comm)    = 0;

226: /*@C
227:    PetscSetHelpVersionFunctions - Sets functions that print help and version information
228:    before the PETSc help and version information is printed. Must call BEFORE PetscInitialize().
229:    This routine enables a "higher-level" package that uses PETSc to print its messages first.

231:    Input Parameter:
232: +  help - the help function (may be NULL)
233: -  version - the version function (may be NULL)

235:    Level: developer

237:    Concepts: package help message

239: @*/
240: PetscErrorCode  PetscSetHelpVersionFunctions(PetscErrorCode (*help)(MPI_Comm),PetscErrorCode (*version)(MPI_Comm))
241: {
243:   PetscExternalHelpFunction    = help;
244:   PetscExternalVersionFunction = version;
245:   return(0);
246: }

248: #if defined(PETSC_USE_LOG)
249: extern PetscBool   PetscObjectsLog;
250: #endif

252: PetscErrorCode  PetscOptionsCheckInitial_Private(void)
253: {
254:   char              string[64],mname[PETSC_MAX_PATH_LEN],*f;
255:   MPI_Comm          comm = PETSC_COMM_WORLD;
256:   PetscBool         flg1 = PETSC_FALSE,flg2 = PETSC_FALSE,flg3 = PETSC_FALSE,flag;
257:   PetscErrorCode    ierr;
258:   PetscReal         si;
259:   PetscInt          intensity;
260:   int               i;
261:   PetscMPIInt       rank;
262:   char              version[256],helpoptions[256];
263: #if !defined(PETSC_HAVE_THREADSAFETY)
264:   PetscReal         logthreshold;
265: #endif
266: #if defined(PETSC_USE_LOG)
267:   PetscViewerFormat format;
268:   PetscBool         flg4 = PETSC_FALSE;
269: #endif

272:   MPI_Comm_rank(comm,&rank);

274: #if !defined(PETSC_HAVE_THREADSAFETY)
275:   /*
276:       Setup the memory management; support for tracing malloc() usage
277:   */
278:   PetscOptionsHasName(NULL,NULL,"-malloc_log",&flg3);
279:   logthreshold = 0.0;
280:   PetscOptionsGetReal(NULL,NULL,"-malloc_log_threshold",&logthreshold,&flg1);
281:   if (flg1) flg3 = PETSC_TRUE;
282: #if defined(PETSC_USE_DEBUG)
283:   PetscOptionsGetBool(NULL,NULL,"-malloc",&flg1,&flg2);
284:   if ((!flg2 || flg1) && !petscsetmallocvisited) {
285:     if (flg2 || !(PETSC_RUNNING_ON_VALGRIND)) {
286:       /* turn off default -malloc if valgrind is being used */
287:       PetscSetUseTrMalloc_Private();
288:     }
289:   }
290: #else
291:   PetscOptionsGetBool(NULL,NULL,"-malloc_dump",&flg1,NULL);
292:   PetscOptionsGetBool(NULL,NULL,"-malloc",&flg2,NULL);
293:   if (flg1 || flg2 || flg3) {PetscSetUseTrMalloc_Private();}
294: #endif
295:   if (flg3) {
296:     PetscMallocSetDumpLogThreshold((PetscLogDouble)logthreshold);
297:   }
298:   PetscOptionsGetBool(NULL,NULL,"-malloc_coalesce",&flg1,&flg2);
299:   if (flg2) {PetscMallocSetCoalesce(flg1);}
300:   flg1 = PETSC_FALSE;
301:   PetscOptionsGetBool(NULL,NULL,"-malloc_debug",&flg1,NULL);
302:   if (flg1) {
303:     PetscSetUseTrMalloc_Private();
304:     PetscMallocDebug(PETSC_TRUE);
305:   }
306:   flg1 = PETSC_FALSE;
307:   PetscOptionsGetBool(NULL,NULL,"-malloc_test",&flg1,NULL);
308: #if defined(PETSC_USE_DEBUG)
309:   if (flg1 && !PETSC_RUNNING_ON_VALGRIND) {
310:     PetscSetUseTrMalloc_Private();
311:     PetscMallocSetDumpLog();
312:     PetscMallocDebug(PETSC_TRUE);
313:   }
314: #endif
315:   flg1 = PETSC_FALSE;
316:   PetscOptionsGetBool(NULL,NULL,"-malloc_hbw",&flg1,NULL);
317:   /* ignore this option if malloc is already set */
318:   if (flg1 && !petscsetmallocvisited) {PetscSetUseHBWMalloc_Private();}

320:   flg1 = PETSC_FALSE;
321:   PetscOptionsGetBool(NULL,NULL,"-malloc_info",&flg1,NULL);
322:   if (!flg1) {
323:     flg1 = PETSC_FALSE;
324:     PetscOptionsGetBool(NULL,NULL,"-memory_view",&flg1,NULL);
325:   }
326:   if (flg1) {
327:     PetscMemorySetGetMaximumUsage();
328:   }
329: #endif

331: #if defined(PETSC_USE_LOG)
332:   PetscOptionsHasName(NULL,NULL,"-objects_dump",&PetscObjectsLog);
333: #endif

335:   /*
336:       Set the display variable for graphics
337:   */
338:   PetscSetDisplay();

340:   /*
341:       Print the PETSc version information
342:   */
343:   PetscOptionsHasName(NULL,NULL,"-v",&flg1);
344:   PetscOptionsHasName(NULL,NULL,"-version",&flg2);
345:   PetscOptionsHasName(NULL,NULL,"-help",&flg3);
346:   if (flg1 || flg2 || flg3) {

348:     /*
349:        Print "higher-level" package version message
350:     */
351:     if (PetscExternalVersionFunction) {
352:       (*PetscExternalVersionFunction)(comm);
353:     }

355:     PetscGetVersion(version,256);
356:     (*PetscHelpPrintf)(comm,"--------------------------------------------------------------------------\n");
357:     (*PetscHelpPrintf)(comm,"%s\n",version);
358:     (*PetscHelpPrintf)(comm,"%s",PETSC_AUTHOR_INFO);
359:     (*PetscHelpPrintf)(comm,"See docs/changes/index.html for recent updates.\n");
360:     (*PetscHelpPrintf)(comm,"See docs/faq.html for problems.\n");
361:     (*PetscHelpPrintf)(comm,"See docs/manualpages/index.html for help. \n");
362:     (*PetscHelpPrintf)(comm,"Libraries linked from %s\n",PETSC_LIB_DIR);
363:     (*PetscHelpPrintf)(comm,"--------------------------------------------------------------------------\n");
364:   }

366:   /*
367:        Print "higher-level" package help message
368:   */
369:   if (flg3) {
370:     if (PetscExternalHelpFunction) {
371:       (*PetscExternalHelpFunction)(comm);
372:     }
373:   }

375:   PetscOptionsGetString(NULL,NULL,"-help",helpoptions,sizeof(helpoptions),&flg1);
376:   if (flg1) {
377:     PetscStrcmp(helpoptions,"intro",&flg2);
378:     if (flg2) {
379:       PetscOptionsDestroyDefault();
380:       PetscFreeMPIResources();
381:       MPI_Finalize();
382:       exit(0);
383:     }
384:   }

386:   /*
387:       Setup the error handling
388:   */
389:   flg1 = PETSC_FALSE;
390:   PetscOptionsGetBool(NULL,NULL,"-on_error_abort",&flg1,NULL);
391:   if (flg1) {
392:     MPI_Comm_set_errhandler(comm,MPI_ERRORS_ARE_FATAL);
393:     PetscPushErrorHandler(PetscAbortErrorHandler,0);
394:   }
395:   flg1 = PETSC_FALSE;
396:   PetscOptionsGetBool(NULL,NULL,"-on_error_mpiabort",&flg1,NULL);
397:   if (flg1) { PetscPushErrorHandler(PetscMPIAbortErrorHandler,0);}
398:   flg1 = PETSC_FALSE;
399:   PetscOptionsGetBool(NULL,NULL,"-mpi_return_on_error",&flg1,NULL);
400:   if (flg1) {
401:     MPI_Comm_set_errhandler(comm,MPI_ERRORS_RETURN);
402:   }
403:   flg1 = PETSC_FALSE;
404:   PetscOptionsGetBool(NULL,NULL,"-no_signal_handler",&flg1,NULL);
405:   if (!flg1) {PetscPushSignalHandler(PetscSignalHandlerDefault,(void*)0);}
406:   flg1 = PETSC_FALSE;
407:   PetscOptionsGetBool(NULL,NULL,"-fp_trap",&flg1,NULL);
408:   if (flg1) {PetscSetFPTrap(PETSC_FP_TRAP_ON);}
409:   PetscOptionsGetInt(NULL,NULL,"-check_pointer_intensity",&intensity,&flag);

412:   /*
413:       Setup debugger information
414:   */
415:   PetscSetDefaultDebugger();
416:   PetscOptionsGetString(NULL,NULL,"-on_error_attach_debugger",string,64,&flg1);
417:   if (flg1) {
418:     MPI_Errhandler err_handler;

420:     PetscSetDebuggerFromString(string);
421:     MPI_Comm_create_errhandler((MPI_Handler_function*)Petsc_MPI_DebuggerOnError,&err_handler);
422:     MPI_Comm_set_errhandler(comm,err_handler);
423:     PetscPushErrorHandler(PetscAttachDebuggerErrorHandler,0);
424:   }
425:   PetscOptionsGetString(NULL,NULL,"-debug_terminal",string,64,&flg1);
426:   if (flg1) { PetscSetDebugTerminal(string); }
427:   PetscOptionsGetString(NULL,NULL,"-start_in_debugger",string,64,&flg1);
428:   PetscOptionsGetString(NULL,NULL,"-stop_for_debugger",string,64,&flg2);
429:   if (flg1 || flg2) {
430:     PetscMPIInt    size;
431:     PetscInt       lsize,*nodes;
432:     MPI_Errhandler err_handler;
433:     /*
434:        we have to make sure that all processors have opened
435:        connections to all other processors, otherwise once the
436:        debugger has stated it is likely to receive a SIGUSR1
437:        and kill the program.
438:     */
439:     MPI_Comm_size(comm,&size);
440:     if (size > 2) {
441:       PetscMPIInt dummy = 0;
442:       MPI_Status  status;
443:       for (i=0; i<size; i++) {
444:         if (rank != i) {
445:           MPI_Send(&dummy,1,MPI_INT,i,109,comm);
446:         }
447:       }
448:       for (i=0; i<size; i++) {
449:         if (rank != i) {
450:           MPI_Recv(&dummy,1,MPI_INT,i,109,comm,&status);
451:         }
452:       }
453:     }
454:     /* check if this processor node should be in debugger */
455:     PetscMalloc1(size,&nodes);
456:     lsize = size;
457:     PetscOptionsGetIntArray(NULL,NULL,"-debugger_nodes",nodes,&lsize,&flag);
458:     if (flag) {
459:       for (i=0; i<lsize; i++) {
460:         if (nodes[i] == rank) { flag = PETSC_FALSE; break; }
461:       }
462:     }
463:     if (!flag) {
464:       PetscSetDebuggerFromString(string);
465:       PetscPushErrorHandler(PetscAbortErrorHandler,0);
466:       if (flg1) {
467:         PetscAttachDebugger();
468:       } else {
469:         PetscStopForDebugger();
470:       }
471:       MPI_Comm_create_errhandler((MPI_Handler_function*)Petsc_MPI_AbortOnError,&err_handler);
472:       MPI_Comm_set_errhandler(comm,err_handler);
473:     }
474:     PetscFree(nodes);
475:   }

477:   PetscOptionsGetString(NULL,NULL,"-on_error_emacs",emacsmachinename,128,&flg1);
478:   if (flg1 && !rank) {PetscPushErrorHandler(PetscEmacsClientErrorHandler,emacsmachinename);}

480:   /*
481:         Setup profiling and logging
482:   */
483: #if defined(PETSC_USE_INFO)
484:   {
485:     char logname[PETSC_MAX_PATH_LEN]; logname[0] = 0;
486:     PetscOptionsGetString(NULL,NULL,"-info",logname,250,&flg1);
487:     if (flg1 && logname[0]) {
488:       PetscInfoAllow(PETSC_TRUE,logname);
489:     } else if (flg1) {
490:       PetscInfoAllow(PETSC_TRUE,NULL);
491:     }
492:   }
493: #endif
494: #if defined(PETSC_USE_LOG)
495:   mname[0] = 0;
496:   PetscOptionsGetString(NULL,NULL,"-history",mname,PETSC_MAX_PATH_LEN,&flg1);
497:   if (flg1) {
498:     if (mname[0]) {
499:       PetscOpenHistoryFile(mname,&petsc_history);
500:     } else {
501:       PetscOpenHistoryFile(NULL,&petsc_history);
502:     }
503:   }
504: #if defined(PETSC_HAVE_MPE)
505:   flg1 = PETSC_FALSE;
506:   PetscOptionsHasName(NULL,NULL,"-log_mpe",&flg1);
507:   if (flg1) {PetscLogMPEBegin();}
508: #endif
509:   flg1 = PETSC_FALSE;
510:   flg3 = PETSC_FALSE;
511:   PetscOptionsGetBool(NULL,NULL,"-log_all",&flg1,NULL);
512:   PetscOptionsHasName(NULL,NULL,"-log_summary",&flg3);
513:   if (flg1)                      { PetscLogAllBegin(); }
514:   else if (flg3)                 { PetscLogDefaultBegin();}

516:   PetscOptionsGetString(NULL,NULL,"-log_trace",mname,250,&flg1);
517:   if (flg1) {
518:     char name[PETSC_MAX_PATH_LEN],fname[PETSC_MAX_PATH_LEN];
519:     FILE *file;
520:     if (mname[0]) {
521:       sprintf(name,"%s.%d",mname,rank);
522:       PetscFixFilename(name,fname);
523:       file = fopen(fname,"w");
524:       if (!file) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_FILE_OPEN,"Unable to open trace file: %s",fname);
525:     } else file = PETSC_STDOUT;
526:     PetscLogTraceBegin(file);
527:   }

529:   PetscOptionsGetViewer(comm,NULL,"-log_view",NULL,&format,&flg4);
530:   if (flg4) {
531:     if (format == PETSC_VIEWER_ASCII_XML){
532:       PetscLogNestedBegin();
533:     } else {
534:       PetscLogDefaultBegin();
535:     }
536:   }
537: #endif

539:   PetscOptionsGetBool(NULL,NULL,"-saws_options",&PetscOptionsPublish,NULL);


542: #if defined(PETSC_HAVE_CUDA)
543:   PetscOptionsHasName(NULL,NULL,"-cuda_show_devices",&flg1);
544:   if (flg1) {
545:     struct cudaDeviceProp prop;
546:     int                   devCount;
547:     PetscInt              device;
548:     cudaError_t           err = cudaSuccess;

550:     err = cudaGetDeviceCount(&devCount);
551:     if (err != cudaSuccess) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SYS,"error in cudaGetDeviceCount %s",cudaGetErrorString(err));
552:     for (device = 0; device < devCount; ++device) {
553:       err = cudaGetDeviceProperties(&prop, (int)device);
554:       if (err != cudaSuccess) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SYS,"error in cudaGetDeviceProperties %s",cudaGetErrorString(err));
555:       PetscPrintf(comm, "CUDA device %D: %s\n", device, prop.name);
556:     }
557:   }
558:   if (!PetscCUDAInitialized) {
559:     PetscMPIInt size;
560:     MPI_Comm_size(comm,&size);
561:     if (size>1) {
562:       int         devCount;
563:       PetscInt    device;
564:       PetscMPIInt rank;
565:       cudaError_t err = cudaSuccess;

567:       /* check to see if we force multiple ranks to hit the same GPU */
568:       PetscOptionsGetInt(NULL,NULL,"-cuda_set_device", &device, &flg1);
569:       if (flg1) {
570:         err = cudaSetDevice((int)device);
571:         if (err != cudaSuccess) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SYS,"error in cudaSetDevice %s",cudaGetErrorString(err));
572:       } else {
573:         /* we're not using the same GPU on multiple MPI threads. So try to allocated different   GPUs to different processes */

575:         /* First get the device count */
576:         err   = cudaGetDeviceCount(&devCount);
577:         if (err != cudaSuccess) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SYS,"error in cudaGetDeviceCount %s",cudaGetErrorString(err));

579:         /* next determine the rank and then set the device via a mod */
580:         MPI_Comm_rank(comm,&rank);
581:         device = rank % devCount;
582:         err    = cudaSetDevice((int)device);
583:         if (err != cudaSuccess) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SYS,"error in cudaSetDevice %s",cudaGetErrorString(err));
584:       }

586:       /* set the device flags so that it can map host memory ... do NOT throw exception on err!=cudaSuccess
587:        multiple devices may try to set the flags on the same device. So long as one of them succeeds, things
588:        are ok. */
589:       err = cudaSetDeviceFlags(cudaDeviceMapHost);
590:       if (err != cudaSuccess) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SYS,"error in cudaSetDeviceFlags %s",cudaGetErrorString(err));
591:     } else {
592:       PetscInt    device;
593:       cudaError_t err = cudaSuccess;

595:       /* the code below works for serial GPU simulations */
596:       PetscOptionsGetInt(NULL,NULL,"-cuda_set_device", &device, &flg1);
597:       if (flg1) {
598:         err = cudaSetDevice((int)device);
599:         if (err != cudaSuccess) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SYS,"error in cudaSetDevice %s",cudaGetErrorString(err));
600:       }

602:       /* set the device flags so that it can map host memory ... here, we error check. */
603:       err = cudaSetDeviceFlags(cudaDeviceMapHost);
604:       if (err != cudaSuccess) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SYS,"error in cudaSetDeviceFlags %s",cudaGetErrorString(err));
605:     }

607:     PetscCUDAInitialized = PETSC_TRUE;
608:   }
609: #endif


612:   /*
613:        Print basic help message
614:   */
615:   PetscOptionsHasName(NULL,NULL,"-help",&flg1);
616:   if (flg1) {
617:     (*PetscHelpPrintf)(comm,"Options for all PETSc programs:\n");
618:     (*PetscHelpPrintf)(comm," -help: prints help method for each option\n");
619:     (*PetscHelpPrintf)(comm," -on_error_abort: cause an abort when an error is detected. Useful \n ");
620:     (*PetscHelpPrintf)(comm,"       only when run in the debugger\n");
621:     (*PetscHelpPrintf)(comm," -on_error_attach_debugger [gdb,dbx,xxgdb,ups,noxterm]\n");
622:     (*PetscHelpPrintf)(comm,"       start the debugger in new xterm\n");
623:     (*PetscHelpPrintf)(comm,"       unless noxterm is given\n");
624:     (*PetscHelpPrintf)(comm," -start_in_debugger [gdb,dbx,xxgdb,ups,noxterm]\n");
625:     (*PetscHelpPrintf)(comm,"       start all processes in the debugger\n");
626:     (*PetscHelpPrintf)(comm," -on_error_emacs <machinename>\n");
627:     (*PetscHelpPrintf)(comm,"    emacs jumps to error file\n");
628:     (*PetscHelpPrintf)(comm," -debugger_nodes [n1,n2,..] Nodes to start in debugger\n");
629:     (*PetscHelpPrintf)(comm," -debugger_pause [m] : delay (in seconds) to attach debugger\n");
630:     (*PetscHelpPrintf)(comm," -stop_for_debugger : prints message on how to attach debugger manually\n");
631:     (*PetscHelpPrintf)(comm,"                      waits the delay for you to attach\n");
632:     (*PetscHelpPrintf)(comm," -display display: Location where X window graphics and debuggers are displayed\n");
633:     (*PetscHelpPrintf)(comm," -no_signal_handler: do not trap error signals\n");
634:     (*PetscHelpPrintf)(comm," -mpi_return_on_error: MPI returns error code, rather than abort on internal error\n");
635:     (*PetscHelpPrintf)(comm," -fp_trap: stop on floating point exceptions\n");
636:     (*PetscHelpPrintf)(comm,"           note on IBM RS6000 this slows run greatly\n");
637:     (*PetscHelpPrintf)(comm," -malloc_dump <optional filename>: dump list of unfreed memory at conclusion\n");
638:     (*PetscHelpPrintf)(comm," -malloc: use our error checking malloc\n");
639:     (*PetscHelpPrintf)(comm," -malloc no: don't use error checking malloc\n");
640:     (*PetscHelpPrintf)(comm," -malloc_info: prints total memory usage\n");
641:     (*PetscHelpPrintf)(comm," -malloc_log: keeps log of all memory allocations\n");
642:     (*PetscHelpPrintf)(comm," -malloc_debug: enables extended checking for memory corruption\n");
643:     (*PetscHelpPrintf)(comm," -options_table: dump list of options inputted\n");
644:     (*PetscHelpPrintf)(comm," -options_left: dump list of unused options\n");
645:     (*PetscHelpPrintf)(comm," -options_left no: don't dump list of unused options\n");
646:     (*PetscHelpPrintf)(comm," -tmp tmpdir: alternative /tmp directory\n");
647:     (*PetscHelpPrintf)(comm," -shared_tmp: tmp directory is shared by all processors\n");
648:     (*PetscHelpPrintf)(comm," -not_shared_tmp: each processor has separate tmp directory\n");
649:     (*PetscHelpPrintf)(comm," -memory_view: print memory usage at end of run\n");
650: #if defined(PETSC_USE_LOG)
651:     (*PetscHelpPrintf)(comm," -get_total_flops: total flops over all processors\n");
652:     (*PetscHelpPrintf)(comm," -log_view [:filename:[format]]: logging objects and events\n");
653:     (*PetscHelpPrintf)(comm," -log_trace [filename]: prints trace of all PETSc calls\n");
654: #if defined(PETSC_HAVE_MPE)
655:     (*PetscHelpPrintf)(comm," -log_mpe: Also create logfile viewable through Jumpshot\n");
656: #endif
657:     (*PetscHelpPrintf)(comm," -info <optional filename>: print informative messages about the calculations\n");
658: #endif
659:     (*PetscHelpPrintf)(comm," -v: prints PETSc version number and release date\n");
660:     (*PetscHelpPrintf)(comm," -options_file <file>: reads options from file\n");
661:     (*PetscHelpPrintf)(comm," -petsc_sleep n: sleeps n seconds before running program\n");
662:     (*PetscHelpPrintf)(comm,"-----------------------------------------------\n");
663:   }

665: #if defined(PETSC_HAVE_POPEN)
666:   {
667:   char machine[128];
668:   PetscOptionsGetString(NULL,NULL,"-popen_machine",machine,128,&flg1);
669:   if (flg1) {
670:     PetscPOpenSetMachine(machine);
671:   }
672:   }
673: #endif

675:   PetscOptionsGetReal(NULL,NULL,"-petsc_sleep",&si,&flg1);
676:   if (flg1) {
677:     PetscSleep(si);
678:   }

680:   PetscOptionsGetString(NULL,NULL,"-info_exclude",mname,PETSC_MAX_PATH_LEN,&flg1);
681:   if (flg1) {
682:     PetscStrstr(mname,"null",&f);
683:     if (f) {
684:       PetscInfoDeactivateClass(0);
685:     }
686:   }

688: #if defined(PETSC_HAVE_CUSP) || defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_VECCUDA)
689:   PetscOptionsHasName(NULL,NULL,"-log_summary",&flg3);
690:   if (!flg3) {
691:     PetscOptionsHasName(NULL,NULL,"-log_view",&flg3);
692:   }
693: #endif
694: #if defined(PETSC_HAVE_CUSP)
695:   PetscOptionsGetBool(NULL,NULL,"-cusp_synchronize",&flg3,NULL);
696:   PetscCUSPSynchronize = flg3;
697: #elif defined(PETSC_HAVE_VIENNACL)
698:   PetscOptionsGetBool(NULL,NULL,"-viennacl_synchronize",&flg3,NULL);
699:   PetscViennaCLSynchronize = flg3;
700: #elif defined(PETSC_HAVE_VECCUDA)
701:   PetscOptionsGetBool(NULL,NULL,"-cuda_synchronize",&flg3,NULL);
702:   PetscCUDASynchronize = flg3;
703: #endif

705: #if defined(PETSC_HAVE_VIENNACL)
706:   PetscViennaCLInit();
707: #endif

709:   return(0);
710: }