1e5c89e4eSSatish Balay /* 2e5c89e4eSSatish Balay 3e5c89e4eSSatish Balay This file defines part of the initialization of PETSc 4e5c89e4eSSatish Balay 5f2d66bcaSShri Abhyankar This file uses regular malloc and free because it cannot know 6e5c89e4eSSatish Balay what malloc is being used until it has already processed the input. 7e5c89e4eSSatish Balay */ 8ef386f4bSSatish Balay 9ef386f4bSSatish Balay #include <petscsys.h> /*I "petscsys.h" I*/ 10f67a399dSBarry Smith #include <petsc/private/petscimpl.h> 11022afb99SBarry Smith #include <petscvalgrind.h> 12665c2dedSJed Brown #include <petscviewer.h> 13*fdc842d1SBarry Smith #if defined(PETSC_USE_LOG) 14*fdc842d1SBarry Smith PETSC_INTERN PetscErrorCode PetscLogInitialize(void); 15*fdc842d1SBarry Smith #endif 16ef386f4bSSatish Balay 17ba61063dSBarry Smith #if defined(PETSC_HAVE_SYS_SYSINFO_H) 1851d315f7SKerry Stevens #include <sys/sysinfo.h> 19ba61063dSBarry Smith #endif 20121deb67SSatish Balay #if defined(PETSC_HAVE_UNISTD_H) 2151d315f7SKerry Stevens #include <unistd.h> 22121deb67SSatish Balay #endif 23d9b72601SDominic Meiser #if defined(PETSC_HAVE_CUDA) 24d9b72601SDominic Meiser #include <cuda_runtime.h> 25*fdc842d1SBarry Smith extern PetscErrorCode PetscCUBLASInitializeHandle(void); 26d9b72601SDominic Meiser #endif 27555d055bSBarry Smith 28f0a7718cSKarl Rupp #if defined(PETSC_HAVE_VIENNACL) 29f0a7718cSKarl Rupp PETSC_EXTERN PetscErrorCode PetscViennaCLInit(); 30f0a7718cSKarl Rupp #endif 31f0a7718cSKarl Rupp 32e5c89e4eSSatish Balay /* ------------------------Nasty global variables -------------------------------*/ 33e5c89e4eSSatish Balay /* 34e5c89e4eSSatish Balay Indicates if PETSc started up MPI, or it was 35e5c89e4eSSatish Balay already started before PETSc was initialized. 36e5c89e4eSSatish Balay */ 370cbf60d0SJose E. Roman PetscBool PetscBeganMPI = PETSC_FALSE; 380cbf60d0SJose E. Roman PetscBool PetscInitializeCalled = PETSC_FALSE; 390cbf60d0SJose E. 
Roman PetscBool PetscFinalizeCalled = PETSC_FALSE; 40bffec52eSKarl Rupp PetscBool PetscCUDAInitialized = PETSC_FALSE; 41d6f2c3cbSBarry Smith 427087cfbeSBarry Smith PetscMPIInt PetscGlobalRank = -1; 437087cfbeSBarry Smith PetscMPIInt PetscGlobalSize = -1; 44ba61063dSBarry Smith 4550f81f78SJed Brown #if defined(PETSC_HAVE_COMPLEX) 46e5c89e4eSSatish Balay #if defined(PETSC_COMPLEX_INSTANTIATE) 47e5c89e4eSSatish Balay template <> class std::complex<double>; /* instantiate complex template class */ 48e5c89e4eSSatish Balay #endif 492c876bd9SBarry Smith #if !defined(PETSC_HAVE_MPI_C_DOUBLE_COMPLEX) 50500d8756SSatish Balay MPI_Datatype MPIU_C_DOUBLE_COMPLEX; 51500d8756SSatish Balay MPI_Datatype MPIU_C_COMPLEX; 522c876bd9SBarry Smith #endif 538619c96cSJed Brown 548619c96cSJed Brown /*MC 558619c96cSJed Brown PETSC_i - the imaginary number i 568619c96cSJed Brown 578619c96cSJed Brown Synopsis: 588619c96cSJed Brown #include <petscsys.h> 598619c96cSJed Brown PetscComplex PETSC_i; 608619c96cSJed Brown 618619c96cSJed Brown Level: beginner 628619c96cSJed Brown 638619c96cSJed Brown Note: 648cd53115SBarry Smith Complex numbers are automatically available if PETSc located a working complex implementation 658619c96cSJed Brown 668619c96cSJed Brown .seealso: PetscRealPart(), PetscImaginaryPart(), PetscRealPartComplex(), PetscImaginaryPartComplex() 678619c96cSJed Brown M*/ 6850f81f78SJed Brown PetscComplex PETSC_i; 69e5c89e4eSSatish Balay #endif 70ce63c4c1SBarry Smith #if defined(PETSC_USE_REAL___FLOAT128) 71c90a1750SBarry Smith MPI_Datatype MPIU___FLOAT128 = 0; 727c2de775SJed Brown #if defined(PETSC_HAVE_COMPLEX) 738c764dc5SJose Roman MPI_Datatype MPIU___COMPLEX128 = 0; 748c764dc5SJose Roman #endif 75570b7f6dSBarry Smith #elif defined(PETSC_USE_REAL___FP16) 76570b7f6dSBarry Smith MPI_Datatype MPIU___FP16 = 0; 77c90a1750SBarry Smith #endif 787087cfbeSBarry Smith MPI_Datatype MPIU_2SCALAR = 0; 7944041f26SJed Brown #if defined(PETSC_USE_64BIT_INDICES) || !defined(MPI_2INT) 807087cfbeSBarry 
MPI_Datatype MPIU_2INT = 0;
#endif
MPI_Datatype MPIU_BOOL;
MPI_Datatype MPIU_ENUM;
MPI_Datatype MPIU_FORTRANADDR;
MPI_Datatype MPIU_SIZE_T;

/*
       Function that is called to display all error messages
*/
PetscErrorCode (*PetscErrorPrintf)(const char [],...)          = PetscErrorPrintfDefault;
PetscErrorCode (*PetscHelpPrintf)(MPI_Comm,const char [],...)  = PetscHelpPrintfDefault;
PetscErrorCode (*PetscVFPrintf)(FILE*,const char[],va_list)    = PetscVFPrintfDefault;
/*
  This is needed to turn on/off GPU synchronization
*/
PetscBool PetscViennaCLSynchronize = PETSC_FALSE;
PetscBool PetscCUDASynchronize     = PETSC_FALSE;

/* ------------------------------------------------------------------------------*/
/*
   Optional file where all PETSc output from various prints is saved
*/
PETSC_INTERN FILE *petsc_history;
FILE *petsc_history = NULL;

/*
   PetscOpenHistoryFile - On rank 0 of PETSC_COMM_WORLD, opens the history file in append
   mode and writes a banner containing the PETSc version, the date, the program name,
   the architecture and the number of processes. All other ranks do nothing and leave
   *fd untouched.

   Input Parameter:
.  filename - name of the history file; if NULL, ".petschistory" in the home directory is used

   Output Parameter:
.  fd - on rank 0, the opened file

   Errors:
   PETSC_ERR_FILE_OPEN if the file cannot be opened, PETSC_ERR_SYS if fflush() fails.
*/
PetscErrorCode  PetscOpenHistoryFile(const char filename[],FILE **fd)
{
  PetscErrorCode ierr;
  PetscMPIInt    rank,size;
  char           pfile[PETSC_MAX_PATH_LEN],pname[PETSC_MAX_PATH_LEN],fname[PETSC_MAX_PATH_LEN],date[64];
  char           version[256];

  PetscFunctionBegin;
  ierr = MPI_Comm_rank(PETSC_COMM_WORLD,&rank);CHKERRQ(ierr);
  if (!rank) {
    char        arch[10];
    int         err;

    ierr = PetscGetArchType(arch,10);CHKERRQ(ierr);
    ierr = PetscGetDate(date,64);CHKERRQ(ierr);
    ierr = PetscGetVersion(version,256);CHKERRQ(ierr);
    ierr = MPI_Comm_size(PETSC_COMM_WORLD,&size);CHKERRQ(ierr);
    if (filename) {
      ierr = PetscFixFilename(filename,fname);CHKERRQ(ierr);
    } else {
      /* only 240 characters are requested so that the suffix appended below always fits in pfile */
      ierr = PetscGetHomeDirectory(pfile,240);CHKERRQ(ierr);
      ierr = PetscStrcat(pfile,"/.petschistory");CHKERRQ(ierr);
      ierr = PetscFixFilename(pfile,fname);CHKERRQ(ierr);
    }

    *fd = fopen(fname,"a");
    /* test the FILE* returned by fopen(), not the address of the caller's variable */
    if (!*fd) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_FILE_OPEN,"Cannot open file: %s",fname);

    ierr = PetscFPrintf(PETSC_COMM_SELF,*fd,"---------------------------------------------------------\n");CHKERRQ(ierr);
    ierr = PetscFPrintf(PETSC_COMM_SELF,*fd,"%s %s\n",version,date);CHKERRQ(ierr);
    ierr = PetscGetProgramName(pname,PETSC_MAX_PATH_LEN);CHKERRQ(ierr);
    ierr = PetscFPrintf(PETSC_COMM_SELF,*fd,"%s on a %s, %d proc. with options:\n",pname,arch,size);CHKERRQ(ierr);
    ierr = PetscFPrintf(PETSC_COMM_SELF,*fd,"---------------------------------------------------------\n");CHKERRQ(ierr);

    err = fflush(*fd);
    if (err) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SYS,"fflush() failed on file");
  }
  PetscFunctionReturn(0);
}

/*
   PetscCloseHistoryFile - On rank 0 of PETSC_COMM_WORLD, writes a closing banner with the
   current date to the history file, then flushes and closes it. All other ranks do nothing.

   Input/Output Parameter:
.  fd - the history file; on rank 0 it is set to NULL once the file has been closed

   Errors:
   PETSC_ERR_SYS if fflush() or fclose() fails.
*/
PETSC_INTERN PetscErrorCode PetscCloseHistoryFile(FILE **fd)
{
  PetscErrorCode ierr;
  PetscMPIInt    rank;
  char           date[64];
  int            err;

  PetscFunctionBegin;
  ierr = MPI_Comm_rank(PETSC_COMM_WORLD,&rank);CHKERRQ(ierr);
  if (!rank) {
    ierr = PetscGetDate(date,64);CHKERRQ(ierr);
    ierr = PetscFPrintf(PETSC_COMM_SELF,*fd,"---------------------------------------------------------\n");CHKERRQ(ierr);
    ierr = PetscFPrintf(PETSC_COMM_SELF,*fd,"Finished at %s\n",date);CHKERRQ(ierr);
    ierr = PetscFPrintf(PETSC_COMM_SELF,*fd,"---------------------------------------------------------\n");CHKERRQ(ierr);
    err  = fflush(*fd);
    if (err) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SYS,"fflush() failed on file");
    err = fclose(*fd);
    if (err) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SYS,"fclose() failed on file");
    *fd = NULL; /* the handle is no longer valid; do not leave it dangling in the caller */
  }
  PetscFunctionReturn(0);
}

/* ------------------------------------------------------------------------------*/

/*
This is ugly and probably belongs somewhere else, but I want to
  be able to put a true MPI abort error handler with command line args.

    This is so MPI errors in the debugger will leave all the stack
  frames. The default MPI_Abort() cleans up and exits thus providing no useful information
  in the debugger hence we call abort() instead of MPI_Abort().
*/

/*
   Petsc_MPI_AbortOnError - MPI error handler that prints the MPI error code with
   PetscErrorPrintf and then calls abort(), so it never returns.

   Input Parameters:
+  comm - the communicator the error occurred on (not used)
-  flag - pointer to the MPI error code
*/
void Petsc_MPI_AbortOnError(MPI_Comm *comm,PetscMPIInt *flag,...)
{
  PetscFunctionBegin;
  (*PetscErrorPrintf)("MPI error %d\n",*flag);
  abort();
}

/*
   Petsc_MPI_DebuggerOnError - MPI error handler that prints the MPI error code with
   PetscErrorPrintf and then tries to attach the debugger. If PetscAttachDebugger()
   reports an error, MPI_Abort() is called on the communicator.

   Input Parameters:
+  comm - the communicator the error occurred on
-  flag - pointer to the MPI error code
*/
void Petsc_MPI_DebuggerOnError(MPI_Comm *comm,PetscMPIInt *flag,...)
{
  PetscErrorCode ierr;

  PetscFunctionBegin;
  (*PetscErrorPrintf)("MPI error %d\n",*flag);
  ierr = PetscAttachDebugger();
  if (ierr) MPI_Abort(*comm,*flag); /* hopeless so get out */
  /* this handler can return normally, so balance the PetscFunctionBegin above */
  PetscFunctionReturnVoid();
}

/*@C
   PetscEnd - Calls PetscFinalize() and then ends the program. This is useful if one
   wishes a clean exit somewhere deep in the program.

   Collective on PETSC_COMM_WORLD

   Options Database Keys are the same as for PetscFinalize()

   Level: advanced

   Note:
   See PetscInitialize() for more general runtime options.

.seealso: PetscInitialize(), PetscOptionsView(), PetscMallocDump(), PetscMPIDump(), PetscFinalize()
@*/
PetscErrorCode  PetscEnd(void)
{
  PetscFunctionBegin;
  PetscFinalize();
  exit(0);
  return 0; /* never reached, exit() does not return */
}

PetscBool PetscOptionsPublish = PETSC_FALSE;
PETSC_INTERN PetscErrorCode PetscSetUseTrMalloc_Private(void);
PETSC_INTERN PetscErrorCode PetscSetUseHBWMalloc_Private(void);
PETSC_INTERN PetscBool      petscsetmallocvisited;
static       char           emacsmachinename[256];

PetscErrorCode (*PetscExternalVersionFunction)(MPI_Comm) = 0;
PetscErrorCode (*PetscExternalHelpFunction)(MPI_Comm)    = 0;

/*@C
   PetscSetHelpVersionFunctions - Sets functions that print help and version information
   before the PETSc help and version information is printed. Must call BEFORE PetscInitialize().
   This routine enables a "higher-level" package that uses PETSc to print its messages first.
232e5c89e4eSSatish Balay 233e5c89e4eSSatish Balay Input Parameter: 2340298fd71SBarry Smith + help - the help function (may be NULL) 2350298fd71SBarry Smith - version - the version function (may be NULL) 236e5c89e4eSSatish Balay 237e5c89e4eSSatish Balay Level: developer 238e5c89e4eSSatish Balay 239e5c89e4eSSatish Balay @*/ 2407087cfbeSBarry Smith PetscErrorCode PetscSetHelpVersionFunctions(PetscErrorCode (*help)(MPI_Comm),PetscErrorCode (*version)(MPI_Comm)) 241e5c89e4eSSatish Balay { 242e5c89e4eSSatish Balay PetscFunctionBegin; 243e5c89e4eSSatish Balay PetscExternalHelpFunction = help; 244e5c89e4eSSatish Balay PetscExternalVersionFunction = version; 245e5c89e4eSSatish Balay PetscFunctionReturn(0); 246e5c89e4eSSatish Balay } 247e5c89e4eSSatish Balay 24805df10baSBarry Smith #if defined(PETSC_USE_LOG) 24995c0884eSLisandro Dalcin PETSC_INTERN PetscBool PetscObjectsLog; 25005df10baSBarry Smith #endif 25105df10baSBarry Smith 25295c0884eSLisandro Dalcin PETSC_INTERN PetscErrorCode PetscOptionsCheckInitial_Private(void) 253e5c89e4eSSatish Balay { 254e5c89e4eSSatish Balay char string[64],mname[PETSC_MAX_PATH_LEN],*f; 255e5c89e4eSSatish Balay MPI_Comm comm = PETSC_COMM_WORLD; 25667584ceeSBarry Smith PetscBool flg1 = PETSC_FALSE,flg2 = PETSC_FALSE,flg3 = PETSC_FALSE,flag; 257e5c89e4eSSatish Balay PetscErrorCode ierr; 25867584ceeSBarry Smith PetscReal si; 25928559dc8SJed Brown PetscInt intensity; 260e5c89e4eSSatish Balay int i; 261e5c89e4eSSatish Balay PetscMPIInt rank; 2627ca660e7SBarry Smith char version[256],helpoptions[256]; 26367584ceeSBarry Smith #if !defined(PETSC_HAVE_THREADSAFETY) 26467584ceeSBarry Smith PetscReal logthreshold; 2652479a3a6SBarry Smith #endif 2662479a3a6SBarry Smith #if defined(PETSC_USE_LOG) 2672479a3a6SBarry Smith PetscViewerFormat format; 26867584ceeSBarry Smith PetscBool flg4 = PETSC_FALSE; 26967584ceeSBarry Smith #endif 270012f15ecSRichard Tran Mills #if defined(PETSC_HAVE_CUDA) 271d991300cSSatish Balay int device; 272d991300cSSatish Balay 
PetscInt deviceOpt = 0; 273012f15ecSRichard Tran Mills PetscBool cuda_view_flag = PETSC_FALSE; 274012f15ecSRichard Tran Mills #endif 275e5c89e4eSSatish Balay PetscFunctionBegin; 27642218b76SBarry Smith ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr); 277e5c89e4eSSatish Balay 27867584ceeSBarry Smith #if !defined(PETSC_HAVE_THREADSAFETY) 279e5c89e4eSSatish Balay /* 280e5c89e4eSSatish Balay Setup the memory management; support for tracing malloc() usage 281e5c89e4eSSatish Balay */ 282c5929fdfSBarry Smith ierr = PetscOptionsHasName(NULL,NULL,"-malloc_log",&flg3);CHKERRQ(ierr); 283574034a9SJed Brown logthreshold = 0.0; 284c5929fdfSBarry Smith ierr = PetscOptionsGetReal(NULL,NULL,"-malloc_log_threshold",&logthreshold,&flg1);CHKERRQ(ierr); 285574034a9SJed Brown if (flg1) flg3 = PETSC_TRUE; 2868bf1f09cSShri Abhyankar #if defined(PETSC_USE_DEBUG) 287c5929fdfSBarry Smith ierr = PetscOptionsGetBool(NULL,NULL,"-malloc",&flg1,&flg2);CHKERRQ(ierr); 288e5c89e4eSSatish Balay if ((!flg2 || flg1) && !petscsetmallocvisited) { 289dc92acbaSJed Brown if (flg2 || !(PETSC_RUNNING_ON_VALGRIND)) { 290555d055bSBarry Smith /* turn off default -malloc if valgrind is being used */ 291e5c89e4eSSatish Balay ierr = PetscSetUseTrMalloc_Private();CHKERRQ(ierr); 292555d055bSBarry Smith } 293e5c89e4eSSatish Balay } 294e5c89e4eSSatish Balay #else 295c5929fdfSBarry Smith ierr = PetscOptionsGetBool(NULL,NULL,"-malloc_dump",&flg1,NULL);CHKERRQ(ierr); 296c5929fdfSBarry Smith ierr = PetscOptionsGetBool(NULL,NULL,"-malloc",&flg2,NULL);CHKERRQ(ierr); 297e5c89e4eSSatish Balay if (flg1 || flg2 || flg3) {ierr = PetscSetUseTrMalloc_Private();CHKERRQ(ierr);} 298e5c89e4eSSatish Balay #endif 299e5c89e4eSSatish Balay if (flg3) { 300574034a9SJed Brown ierr = PetscMallocSetDumpLogThreshold((PetscLogDouble)logthreshold);CHKERRQ(ierr); 301e5c89e4eSSatish Balay } 302ba282f50SJed Brown ierr = PetscOptionsGetBool(NULL,NULL,"-malloc_coalesce",&flg1,&flg2);CHKERRQ(ierr); 303ba282f50SJed Brown if (flg2) {ierr = 
PetscMallocSetCoalesce(flg1);CHKERRQ(ierr);} 30490d69ab7SBarry Smith flg1 = PETSC_FALSE; 305c5929fdfSBarry Smith ierr = PetscOptionsGetBool(NULL,NULL,"-malloc_debug",&flg1,NULL);CHKERRQ(ierr); 306e5c89e4eSSatish Balay if (flg1) { 307e5c89e4eSSatish Balay ierr = PetscSetUseTrMalloc_Private();CHKERRQ(ierr); 308e5c89e4eSSatish Balay ierr = PetscMallocDebug(PETSC_TRUE);CHKERRQ(ierr); 309e5c89e4eSSatish Balay } 310dc92acbaSJed Brown flg1 = PETSC_FALSE; 311c5929fdfSBarry Smith ierr = PetscOptionsGetBool(NULL,NULL,"-malloc_test",&flg1,NULL);CHKERRQ(ierr); 3128bf1f09cSShri Abhyankar #if defined(PETSC_USE_DEBUG) 313dc92acbaSJed Brown if (flg1 && !PETSC_RUNNING_ON_VALGRIND) { 314dc92acbaSJed Brown ierr = PetscSetUseTrMalloc_Private();CHKERRQ(ierr); 315dc92acbaSJed Brown ierr = PetscMallocSetDumpLog();CHKERRQ(ierr); 316dc92acbaSJed Brown ierr = PetscMallocDebug(PETSC_TRUE);CHKERRQ(ierr); 317dc92acbaSJed Brown } 318dc92acbaSJed Brown #endif 3192f21b5c6SHong Zhang flg1 = PETSC_FALSE; 3202f21b5c6SHong Zhang ierr = PetscOptionsGetBool(NULL,NULL,"-malloc_hbw",&flg1,NULL);CHKERRQ(ierr); 321cf6f3811SHong Zhang /* ignore this option if malloc is already set */ 322cf6f3811SHong Zhang if (flg1 && !petscsetmallocvisited) {ierr = PetscSetUseHBWMalloc_Private();CHKERRQ(ierr);} 323e5c89e4eSSatish Balay 32490d69ab7SBarry Smith flg1 = PETSC_FALSE; 325c5929fdfSBarry Smith ierr = PetscOptionsGetBool(NULL,NULL,"-malloc_info",&flg1,NULL);CHKERRQ(ierr); 3267783f70dSSatish Balay if (!flg1) { 32790d69ab7SBarry Smith flg1 = PETSC_FALSE; 328c5929fdfSBarry Smith ierr = PetscOptionsGetBool(NULL,NULL,"-memory_view",&flg1,NULL);CHKERRQ(ierr); 3297783f70dSSatish Balay } 330e5c89e4eSSatish Balay if (flg1) { 331e5c89e4eSSatish Balay ierr = PetscMemorySetGetMaximumUsage();CHKERRQ(ierr); 332e5c89e4eSSatish Balay } 33367584ceeSBarry Smith #endif 334e5c89e4eSSatish Balay 335b4427426SBarry Smith #if defined(PETSC_USE_LOG) 336c5929fdfSBarry Smith ierr = 
PetscOptionsHasName(NULL,NULL,"-objects_dump",&PetscObjectsLog);CHKERRQ(ierr); 337b4427426SBarry Smith #endif 33805df10baSBarry Smith 339e5c89e4eSSatish Balay /* 340e5c89e4eSSatish Balay Set the display variable for graphics 341e5c89e4eSSatish Balay */ 342e5c89e4eSSatish Balay ierr = PetscSetDisplay();CHKERRQ(ierr); 343e5c89e4eSSatish Balay 34451dcc849SKerry Stevens /* 345e5c89e4eSSatish Balay Print the PETSc version information 346e5c89e4eSSatish Balay */ 347c5929fdfSBarry Smith ierr = PetscOptionsHasName(NULL,NULL,"-v",&flg1);CHKERRQ(ierr); 348c5929fdfSBarry Smith ierr = PetscOptionsHasName(NULL,NULL,"-version",&flg2);CHKERRQ(ierr); 3492d747510SLisandro Dalcin ierr = PetscOptionsHasHelp(NULL,&flg3);CHKERRQ(ierr); 350e5c89e4eSSatish Balay if (flg1 || flg2 || flg3) { 351e5c89e4eSSatish Balay 352e5c89e4eSSatish Balay /* 353e5c89e4eSSatish Balay Print "higher-level" package version message 354e5c89e4eSSatish Balay */ 355e5c89e4eSSatish Balay if (PetscExternalVersionFunction) { 356e5c89e4eSSatish Balay ierr = (*PetscExternalVersionFunction)(comm);CHKERRQ(ierr); 357e5c89e4eSSatish Balay } 358e5c89e4eSSatish Balay 359a523d312SBarry Smith ierr = PetscGetVersion(version,256);CHKERRQ(ierr); 3607ca660e7SBarry Smith ierr = (*PetscHelpPrintf)(comm,"--------------------------------------------------------------------------\n");CHKERRQ(ierr); 361e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm,"%s\n",version);CHKERRQ(ierr); 362e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm,"%s",PETSC_AUTHOR_INFO);CHKERRQ(ierr); 363e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm,"See docs/changes/index.html for recent updates.\n");CHKERRQ(ierr); 36484e42920SBarry Smith ierr = (*PetscHelpPrintf)(comm,"See docs/faq.html for problems.\n");CHKERRQ(ierr); 365e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm,"See docs/manualpages/index.html for help. 
\n");CHKERRQ(ierr); 366e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm,"Libraries linked from %s\n",PETSC_LIB_DIR);CHKERRQ(ierr); 3677ca660e7SBarry Smith ierr = (*PetscHelpPrintf)(comm,"--------------------------------------------------------------------------\n");CHKERRQ(ierr); 3687ca660e7SBarry Smith } 3697ca660e7SBarry Smith 37094941ca7SBarry Smith /* 37194941ca7SBarry Smith Print "higher-level" package help message 37294941ca7SBarry Smith */ 37394941ca7SBarry Smith if (flg3) { 37494941ca7SBarry Smith if (PetscExternalHelpFunction) { 37594941ca7SBarry Smith ierr = (*PetscExternalHelpFunction)(comm);CHKERRQ(ierr); 37694941ca7SBarry Smith } 37794941ca7SBarry Smith } 37894941ca7SBarry Smith 3797ca660e7SBarry Smith ierr = PetscOptionsGetString(NULL,NULL,"-help",helpoptions,sizeof(helpoptions),&flg1);CHKERRQ(ierr); 3807ca660e7SBarry Smith if (flg1) { 3817ca660e7SBarry Smith ierr = PetscStrcmp(helpoptions,"intro",&flg2);CHKERRQ(ierr); 3827ca660e7SBarry Smith if (flg2) { 383bdb346e9SBarry Smith ierr = PetscOptionsDestroyDefault();CHKERRQ(ierr); 384008a6e76SBarry Smith ierr = PetscFreeMPIResources();CHKERRQ(ierr); 3857ca660e7SBarry Smith ierr = MPI_Finalize();CHKERRQ(ierr); 3867ca660e7SBarry Smith exit(0); 3877ca660e7SBarry Smith } 388e5c89e4eSSatish Balay } 389e5c89e4eSSatish Balay 390e5c89e4eSSatish Balay /* 391e5c89e4eSSatish Balay Setup the error handling 392e5c89e4eSSatish Balay */ 39390d69ab7SBarry Smith flg1 = PETSC_FALSE; 394c5929fdfSBarry Smith ierr = PetscOptionsGetBool(NULL,NULL,"-on_error_abort",&flg1,NULL);CHKERRQ(ierr); 395b59baad1SJed Brown if (flg1) { 39642218b76SBarry Smith ierr = MPI_Comm_set_errhandler(comm,MPI_ERRORS_ARE_FATAL);CHKERRQ(ierr); 397b59baad1SJed Brown ierr = PetscPushErrorHandler(PetscAbortErrorHandler,0);CHKERRQ(ierr); 398b59baad1SJed Brown } 39990d69ab7SBarry Smith flg1 = PETSC_FALSE; 400c5929fdfSBarry Smith ierr = PetscOptionsGetBool(NULL,NULL,"-on_error_mpiabort",&flg1,NULL);CHKERRQ(ierr); 401cb9801acSJed Brown if (flg1) { ierr 
= PetscPushErrorHandler(PetscMPIAbortErrorHandler,0);CHKERRQ(ierr);} 40290d69ab7SBarry Smith flg1 = PETSC_FALSE; 403c5929fdfSBarry Smith ierr = PetscOptionsGetBool(NULL,NULL,"-mpi_return_on_error",&flg1,NULL);CHKERRQ(ierr); 404e5c89e4eSSatish Balay if (flg1) { 405d54338ecSKarl Rupp ierr = MPI_Comm_set_errhandler(comm,MPI_ERRORS_RETURN);CHKERRQ(ierr); 406e5c89e4eSSatish Balay } 40790d69ab7SBarry Smith flg1 = PETSC_FALSE; 408c5929fdfSBarry Smith ierr = PetscOptionsGetBool(NULL,NULL,"-no_signal_handler",&flg1,NULL);CHKERRQ(ierr); 4098d359177SBarry Smith if (!flg1) {ierr = PetscPushSignalHandler(PetscSignalHandlerDefault,(void*)0);CHKERRQ(ierr);} 41096cc47afSJed Brown flg1 = PETSC_FALSE; 411c5929fdfSBarry Smith ierr = PetscOptionsGetBool(NULL,NULL,"-fp_trap",&flg1,NULL);CHKERRQ(ierr); 41296cc47afSJed Brown if (flg1) {ierr = PetscSetFPTrap(PETSC_FP_TRAP_ON);CHKERRQ(ierr);} 413c5929fdfSBarry Smith ierr = PetscOptionsGetInt(NULL,NULL,"-check_pointer_intensity",&intensity,&flag);CHKERRQ(ierr); 41428559dc8SJed Brown if (flag) {ierr = PetscCheckPointerSetIntensity(intensity);CHKERRQ(ierr);} 415e5c89e4eSSatish Balay 416e5c89e4eSSatish Balay /* 417e5c89e4eSSatish Balay Setup debugger information 418e5c89e4eSSatish Balay */ 419e5c89e4eSSatish Balay ierr = PetscSetDefaultDebugger();CHKERRQ(ierr); 420c5929fdfSBarry Smith ierr = PetscOptionsGetString(NULL,NULL,"-on_error_attach_debugger",string,64,&flg1);CHKERRQ(ierr); 421e5c89e4eSSatish Balay if (flg1) { 422e5c89e4eSSatish Balay MPI_Errhandler err_handler; 423e5c89e4eSSatish Balay 424e5c89e4eSSatish Balay ierr = PetscSetDebuggerFromString(string);CHKERRQ(ierr); 42533c7d699SBarry Smith ierr = MPI_Comm_create_errhandler(Petsc_MPI_DebuggerOnError,&err_handler);CHKERRQ(ierr); 426d54338ecSKarl Rupp ierr = MPI_Comm_set_errhandler(comm,err_handler);CHKERRQ(ierr); 427e5c89e4eSSatish Balay ierr = PetscPushErrorHandler(PetscAttachDebuggerErrorHandler,0);CHKERRQ(ierr); 428e5c89e4eSSatish Balay } 429c5929fdfSBarry Smith ierr = 
PetscOptionsGetString(NULL,NULL,"-debug_terminal",string,64,&flg1);CHKERRQ(ierr); 4305e96ac45SJed Brown if (flg1) { ierr = PetscSetDebugTerminal(string);CHKERRQ(ierr); } 431c5929fdfSBarry Smith ierr = PetscOptionsGetString(NULL,NULL,"-start_in_debugger",string,64,&flg1);CHKERRQ(ierr); 432c5929fdfSBarry Smith ierr = PetscOptionsGetString(NULL,NULL,"-stop_for_debugger",string,64,&flg2);CHKERRQ(ierr); 433e5c89e4eSSatish Balay if (flg1 || flg2) { 434e5c89e4eSSatish Balay PetscMPIInt size; 435e5c89e4eSSatish Balay PetscInt lsize,*nodes; 436e5c89e4eSSatish Balay MPI_Errhandler err_handler; 437e5c89e4eSSatish Balay /* 438e5c89e4eSSatish Balay we have to make sure that all processors have opened 439e5c89e4eSSatish Balay connections to all other processors, otherwise once the 440e5c89e4eSSatish Balay debugger has stated it is likely to receive a SIGUSR1 441e5c89e4eSSatish Balay and kill the program. 442e5c89e4eSSatish Balay */ 44342218b76SBarry Smith ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 444e5c89e4eSSatish Balay if (size > 2) { 445533163c2SBarry Smith PetscMPIInt dummy = 0; 446e5c89e4eSSatish Balay MPI_Status status; 447e5c89e4eSSatish Balay for (i=0; i<size; i++) { 448e5c89e4eSSatish Balay if (rank != i) { 44942218b76SBarry Smith ierr = MPI_Send(&dummy,1,MPI_INT,i,109,comm);CHKERRQ(ierr); 450e5c89e4eSSatish Balay } 451e5c89e4eSSatish Balay } 452e5c89e4eSSatish Balay for (i=0; i<size; i++) { 453e5c89e4eSSatish Balay if (rank != i) { 45442218b76SBarry Smith ierr = MPI_Recv(&dummy,1,MPI_INT,i,109,comm,&status);CHKERRQ(ierr); 455e5c89e4eSSatish Balay } 456e5c89e4eSSatish Balay } 457e5c89e4eSSatish Balay } 458e5c89e4eSSatish Balay /* check if this processor node should be in debugger */ 459785e854fSJed Brown ierr = PetscMalloc1(size,&nodes);CHKERRQ(ierr); 460e5c89e4eSSatish Balay lsize = size; 461c5929fdfSBarry Smith ierr = PetscOptionsGetIntArray(NULL,NULL,"-debugger_nodes",nodes,&lsize,&flag);CHKERRQ(ierr); 462e5c89e4eSSatish Balay if (flag) { 463e5c89e4eSSatish 
Balay for (i=0; i<lsize; i++) { 464e5c89e4eSSatish Balay if (nodes[i] == rank) { flag = PETSC_FALSE; break; } 465e5c89e4eSSatish Balay } 466e5c89e4eSSatish Balay } 467e5c89e4eSSatish Balay if (!flag) { 468e5c89e4eSSatish Balay ierr = PetscSetDebuggerFromString(string);CHKERRQ(ierr); 469e5c89e4eSSatish Balay ierr = PetscPushErrorHandler(PetscAbortErrorHandler,0);CHKERRQ(ierr); 470e5c89e4eSSatish Balay if (flg1) { 471e5c89e4eSSatish Balay ierr = PetscAttachDebugger();CHKERRQ(ierr); 472e5c89e4eSSatish Balay } else { 473e5c89e4eSSatish Balay ierr = PetscStopForDebugger();CHKERRQ(ierr); 474e5c89e4eSSatish Balay } 47533c7d699SBarry Smith ierr = MPI_Comm_create_errhandler(Petsc_MPI_AbortOnError,&err_handler);CHKERRQ(ierr); 476d54338ecSKarl Rupp ierr = MPI_Comm_set_errhandler(comm,err_handler);CHKERRQ(ierr); 477e5c89e4eSSatish Balay } 478e5c89e4eSSatish Balay ierr = PetscFree(nodes);CHKERRQ(ierr); 479e5c89e4eSSatish Balay } 480e5c89e4eSSatish Balay 481c5929fdfSBarry Smith ierr = PetscOptionsGetString(NULL,NULL,"-on_error_emacs",emacsmachinename,128,&flg1);CHKERRQ(ierr); 482cb9801acSJed Brown if (flg1 && !rank) {ierr = PetscPushErrorHandler(PetscEmacsClientErrorHandler,emacsmachinename);CHKERRQ(ierr);} 483e5c89e4eSSatish Balay 484e5c89e4eSSatish Balay /* 485e5c89e4eSSatish Balay Setup profiling and logging 486e5c89e4eSSatish Balay */ 4876cf91177SBarry Smith #if defined(PETSC_USE_INFO) 4888bb29257SSatish Balay { 489e5c89e4eSSatish Balay char logname[PETSC_MAX_PATH_LEN]; logname[0] = 0; 490c5929fdfSBarry Smith ierr = PetscOptionsGetString(NULL,NULL,"-info",logname,250,&flg1);CHKERRQ(ierr); 4918bb29257SSatish Balay if (flg1 && logname[0]) { 492fcc2139eSBarry Smith ierr = PetscInfoAllow(PETSC_TRUE,logname);CHKERRQ(ierr); 4938bb29257SSatish Balay } else if (flg1) { 4940298fd71SBarry Smith ierr = PetscInfoAllow(PETSC_TRUE,NULL);CHKERRQ(ierr); 495e5c89e4eSSatish Balay } 496e5c89e4eSSatish Balay } 497865f6aa8SSatish Balay #endif 498865f6aa8SSatish Balay #if defined(PETSC_USE_LOG) 
499865f6aa8SSatish Balay mname[0] = 0; 500c5929fdfSBarry Smith ierr = PetscOptionsGetString(NULL,NULL,"-history",mname,PETSC_MAX_PATH_LEN,&flg1);CHKERRQ(ierr); 501865f6aa8SSatish Balay if (flg1) { 502865f6aa8SSatish Balay if (mname[0]) { 503f3dea69dSBarry Smith ierr = PetscOpenHistoryFile(mname,&petsc_history);CHKERRQ(ierr); 504865f6aa8SSatish Balay } else { 505706d7a88SBarry Smith ierr = PetscOpenHistoryFile(NULL,&petsc_history);CHKERRQ(ierr); 506865f6aa8SSatish Balay } 507865f6aa8SSatish Balay } 508217044c2SLisandro Dalcin 509217044c2SLisandro Dalcin ierr = PetscOptionsGetBool(NULL,NULL,"-log_sync",&PetscLogSyncOn,NULL);CHKERRQ(ierr); 510217044c2SLisandro Dalcin 511e5c89e4eSSatish Balay #if defined(PETSC_HAVE_MPE) 51290d69ab7SBarry Smith flg1 = PETSC_FALSE; 513c5929fdfSBarry Smith ierr = PetscOptionsHasName(NULL,NULL,"-log_mpe",&flg1);CHKERRQ(ierr); 514495fc317SBarry Smith if (flg1) {ierr = PetscLogMPEBegin();CHKERRQ(ierr);} 515e5c89e4eSSatish Balay #endif 51690d69ab7SBarry Smith flg1 = PETSC_FALSE; 51790d69ab7SBarry Smith flg3 = PETSC_FALSE; 518c5929fdfSBarry Smith ierr = PetscOptionsGetBool(NULL,NULL,"-log_all",&flg1,NULL);CHKERRQ(ierr); 519c5929fdfSBarry Smith ierr = PetscOptionsHasName(NULL,NULL,"-log_summary",&flg3);CHKERRQ(ierr); 520e5c89e4eSSatish Balay if (flg1) { ierr = PetscLogAllBegin();CHKERRQ(ierr); } 521bb1d7374SBarry Smith else if (flg3) { ierr = PetscLogDefaultBegin();CHKERRQ(ierr);} 522e5c89e4eSSatish Balay 523c5929fdfSBarry Smith ierr = PetscOptionsGetString(NULL,NULL,"-log_trace",mname,250,&flg1);CHKERRQ(ierr); 524e5c89e4eSSatish Balay if (flg1) { 525e5c89e4eSSatish Balay char name[PETSC_MAX_PATH_LEN],fname[PETSC_MAX_PATH_LEN]; 526e5c89e4eSSatish Balay FILE *file; 527e5c89e4eSSatish Balay if (mname[0]) { 5282e924ca5SSatish Balay PetscSNPrintf(name,PETSC_MAX_PATH_LEN,"%s.%d",mname,rank); 529e5c89e4eSSatish Balay ierr = PetscFixFilename(name,fname);CHKERRQ(ierr); 530e5c89e4eSSatish Balay file = fopen(fname,"w"); 531f3dea69dSBarry Smith if (!file) 
SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_FILE_OPEN,"Unable to open trace file: %s",fname); 532a297a907SKarl Rupp } else file = PETSC_STDOUT; 533e5c89e4eSSatish Balay ierr = PetscLogTraceBegin(file);CHKERRQ(ierr); 534e5c89e4eSSatish Balay } 535bb1d7374SBarry Smith 53616413a6aSBarry Smith ierr = PetscOptionsGetViewer(comm,NULL,NULL,"-log_view",NULL,&format,&flg4);CHKERRQ(ierr); 537bb1d7374SBarry Smith if (flg4) { 538bb1d7374SBarry Smith if (format == PETSC_VIEWER_ASCII_XML) { 539bb1d7374SBarry Smith ierr = PetscLogNestedBegin();CHKERRQ(ierr); 540bb1d7374SBarry Smith } else { 541bb1d7374SBarry Smith ierr = PetscLogDefaultBegin();CHKERRQ(ierr); 542bb1d7374SBarry Smith } 543e3ed9ee7SBarry Smith PetscLogMemory = PETSC_FALSE; 544e3ed9ee7SBarry Smith ierr = PetscOptionsGetBool(NULL,NULL,"-log_view_memory",&PetscLogMemory,NULL);CHKERRQ(ierr); 545e3ed9ee7SBarry Smith if (PetscLogMemory) { 546e3ed9ee7SBarry Smith ierr = PetscSetUseTrMalloc_Private();CHKERRQ(ierr); 547e3ed9ee7SBarry Smith } 548eccbb886SLisandro Dalcin } 549eccbb886SLisandro Dalcin if (flg4 && format == PETSC_VIEWER_ASCII_XML) { 550eccbb886SLisandro Dalcin PetscReal threshold = PetscRealConstant(0.01); 551eccbb886SLisandro Dalcin ierr = PetscOptionsGetReal(NULL,NULL,"-log_threshold",&threshold,&flg1);CHKERRQ(ierr); 552eccbb886SLisandro Dalcin if (flg1) {ierr = PetscLogSetThreshold((PetscLogDouble)threshold,NULL);CHKERRQ(ierr);} 553bb1d7374SBarry Smith } 554e5c89e4eSSatish Balay #endif 555e5c89e4eSSatish Balay 556c5929fdfSBarry Smith ierr = PetscOptionsGetBool(NULL,NULL,"-saws_options",&PetscOptionsPublish,NULL);CHKERRQ(ierr); 557e5c89e4eSSatish Balay 5584b0a73b2SBarry Smith #if defined(PETSC_HAVE_CUDA) 559*fdc842d1SBarry Smith /* 560*fdc842d1SBarry Smith If collecting logging information, by default, wait for GPU to complete its operations 561*fdc842d1SBarry Smith before returning to the CPU in order to get accurate timings of each event 562*fdc842d1SBarry Smith */ 563*fdc842d1SBarry Smith ierr = 
PetscOptionsHasName(NULL,NULL,"-log_summary",&PetscCUDASynchronize);CHKERRQ(ierr); 564*fdc842d1SBarry Smith if (!PetscCUDASynchronize) { 565*fdc842d1SBarry Smith ierr = PetscOptionsHasName(NULL,NULL,"-log_view",&PetscCUDASynchronize);CHKERRQ(ierr); 566*fdc842d1SBarry Smith } 567*fdc842d1SBarry Smith 568012f15ecSRichard Tran Mills ierr = PetscOptionsBegin(comm,NULL,"CUDA options","Sys");CHKERRQ(ierr); 569d991300cSSatish Balay ierr = PetscOptionsInt("-cuda_set_device","Set all MPI ranks to use the specified CUDA device",NULL,deviceOpt,&deviceOpt,&flg1);CHKERRQ(ierr); 570d991300cSSatish Balay device = (int)deviceOpt; 571*fdc842d1SBarry Smith ierr = PetscOptionsBool("-cuda_synchronize","Wait for the GPU to complete operations before returning to the CPU",NULL,PetscCUDASynchronize,&PetscCUDASynchronize,NULL);CHKERRQ(ierr); 572012f15ecSRichard Tran Mills ierr = PetscOptionsDeprecated("-cuda_show_devices","-cuda_view","3.12",NULL);CHKERRQ(ierr); 573012f15ecSRichard Tran Mills ierr = PetscOptionsName("-cuda_view","Display CUDA device information and assignments",NULL,&cuda_view_flag);CHKERRQ(ierr); 574012f15ecSRichard Tran Mills ierr = PetscOptionsEnd();CHKERRQ(ierr); 575bffec52eSKarl Rupp if (!PetscCUDAInitialized) { 57616b6f2efSBarry Smith PetscMPIInt size; 57742218b76SBarry Smith ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 578012f15ecSRichard Tran Mills 579bd72cc96SPaul Mullowney if (size>1) { 58016b6f2efSBarry Smith int devCount; 58116b6f2efSBarry Smith PetscMPIInt rank; 5822692e278SPaul Mullowney cudaError_t err = cudaSuccess; 5832692e278SPaul Mullowney 5842692e278SPaul Mullowney /* check to see if we force multiple ranks to hit the same GPU */ 5852692e278SPaul Mullowney if (flg1) { 586d991300cSSatish Balay err = cudaSetDevice(device); 587e09ad801SBarry Smith if (err != cudaSuccess) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SYS,"error in cudaSetDevice %s",cudaGetErrorString(err)); 5882692e278SPaul Mullowney } else { 589e09ad801SBarry Smith /* we're not using the same GPU 
on multiple MPI threads. So try to allocated different GPUs to different processes */ 5902692e278SPaul Mullowney 5912692e278SPaul Mullowney /* First get the device count */ 592e09ad801SBarry Smith err = cudaGetDeviceCount(&devCount); 593e09ad801SBarry Smith if (err != cudaSuccess) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SYS,"error in cudaGetDeviceCount %s",cudaGetErrorString(err)); 5942692e278SPaul Mullowney 5952692e278SPaul Mullowney /* next determine the rank and then set the device via a mod */ 59642218b76SBarry Smith ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr); 597bd72cc96SPaul Mullowney device = rank % devCount; 598d991300cSSatish Balay err = cudaSetDevice(device); 599e09ad801SBarry Smith if (err != cudaSuccess) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SYS,"error in cudaSetDevice %s",cudaGetErrorString(err)); 6002692e278SPaul Mullowney } 6012692e278SPaul Mullowney 6022692e278SPaul Mullowney /* set the device flags so that it can map host memory ... do NOT throw exception on err!=cudaSuccess 6032692e278SPaul Mullowney multiple devices may try to set the flags on the same device. So long as one of them succeeds, things 6042692e278SPaul Mullowney are ok. */ 6052692e278SPaul Mullowney err = cudaSetDeviceFlags(cudaDeviceMapHost); 606e09ad801SBarry Smith if (err != cudaSuccess) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SYS,"error in cudaSetDeviceFlags %s",cudaGetErrorString(err)); 607a297a907SKarl Rupp } else { 6082692e278SPaul Mullowney cudaError_t err = cudaSuccess; 6092692e278SPaul Mullowney 610f297a14cSJed Brown /* the code below works for serial GPU simulations */ 6114b0a73b2SBarry Smith if (flg1) { 612d991300cSSatish Balay err = cudaSetDevice(device); 613e09ad801SBarry Smith if (err != cudaSuccess) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SYS,"error in cudaSetDevice %s",cudaGetErrorString(err)); 6144b0a73b2SBarry Smith } 6152692e278SPaul Mullowney 6162692e278SPaul Mullowney /* set the device flags so that it can map host memory ... here, we error check. 
*/ 6172692e278SPaul Mullowney err = cudaSetDeviceFlags(cudaDeviceMapHost); 618e09ad801SBarry Smith if (err != cudaSuccess) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SYS,"error in cudaSetDeviceFlags %s",cudaGetErrorString(err)); 6194b0a73b2SBarry Smith } 620bffec52eSKarl Rupp 621*fdc842d1SBarry Smith ierr = PetscCUBLASInitializeHandle();CHKERRQ(ierr); 622bffec52eSKarl Rupp PetscCUDAInitialized = PETSC_TRUE; 623bd72cc96SPaul Mullowney } 624012f15ecSRichard Tran Mills if (cuda_view_flag) { 6257be52123SRichard Tran Mills struct cudaDeviceProp prop; 626d991300cSSatish Balay int devCount,device; 6277be52123SRichard Tran Mills cudaError_t err = cudaSuccess; 6287be52123SRichard Tran Mills 6297be52123SRichard Tran Mills err = cudaGetDeviceCount(&devCount); 6307be52123SRichard Tran Mills if (err != cudaSuccess) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SYS,"error in cudaGetDeviceCount %s",cudaGetErrorString(err)); 6317be52123SRichard Tran Mills for (device = 0; device < devCount; ++device) { 632d991300cSSatish Balay err = cudaGetDeviceProperties(&prop,device); 6337be52123SRichard Tran Mills if (err != cudaSuccess) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SYS,"error in cudaGetDeviceProperties %s",cudaGetErrorString(err)); 634fef7099cSRichard Tran Mills ierr = PetscPrintf(comm, "CUDA device %d: %s\n", device, prop.name);CHKERRQ(ierr); 6357be52123SRichard Tran Mills } 6367be52123SRichard Tran Mills err = cudaGetDevice(&device); 6377be52123SRichard Tran Mills if (err != cudaSuccess) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SYS,"error in cudaGetDevice %s",cudaGetErrorString(err)); 6387be52123SRichard Tran Mills ierr = PetscSynchronizedPrintf(PETSC_COMM_WORLD,"[%d] Using CUDA device %d.\n",rank,device);CHKERRQ(ierr); 6397be52123SRichard Tran Mills ierr = PetscSynchronizedFlush(PETSC_COMM_WORLD,PETSC_STDOUT);CHKERRQ(ierr); 6407be52123SRichard Tran Mills } 6417be52123SRichard Tran Mills 6424b0a73b2SBarry Smith #endif 6434b0a73b2SBarry Smith 6444b0a73b2SBarry Smith 645e5c89e4eSSatish Balay /* 
646e5c89e4eSSatish Balay Print basic help message 647e5c89e4eSSatish Balay */ 6482d747510SLisandro Dalcin ierr = PetscOptionsHasHelp(NULL,&flg1);CHKERRQ(ierr); 649e5c89e4eSSatish Balay if (flg1) { 650e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm,"Options for all PETSc programs:\n");CHKERRQ(ierr); 651301d30feSBarry Smith ierr = (*PetscHelpPrintf)(comm," -help: prints help method for each option\n");CHKERRQ(ierr); 652301d30feSBarry Smith ierr = (*PetscHelpPrintf)(comm," -on_error_abort: cause an abort when an error is detected. Useful \n ");CHKERRQ(ierr); 653301d30feSBarry Smith ierr = (*PetscHelpPrintf)(comm," only when run in the debugger\n");CHKERRQ(ierr); 654e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," -on_error_attach_debugger [gdb,dbx,xxgdb,ups,noxterm]\n");CHKERRQ(ierr); 655e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," start the debugger in new xterm\n");CHKERRQ(ierr); 656e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," unless noxterm is given\n");CHKERRQ(ierr); 657e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," -start_in_debugger [gdb,dbx,xxgdb,ups,noxterm]\n");CHKERRQ(ierr); 658e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," start all processes in the debugger\n");CHKERRQ(ierr); 659e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," -on_error_emacs <machinename>\n");CHKERRQ(ierr); 660e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," emacs jumps to error file\n");CHKERRQ(ierr); 661e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," -debugger_nodes [n1,n2,..] 
Nodes to start in debugger\n");CHKERRQ(ierr); 662e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," -debugger_pause [m] : delay (in seconds) to attach debugger\n");CHKERRQ(ierr); 663e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," -stop_for_debugger : prints message on how to attach debugger manually\n");CHKERRQ(ierr); 664e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," waits the delay for you to attach\n");CHKERRQ(ierr); 6651cda70a7SBarry Smith ierr = (*PetscHelpPrintf)(comm," -display display: Location where X window graphics and debuggers are displayed\n");CHKERRQ(ierr); 666e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," -no_signal_handler: do not trap error signals\n");CHKERRQ(ierr); 667e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," -mpi_return_on_error: MPI returns error code, rather than abort on internal error\n");CHKERRQ(ierr); 668e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," -fp_trap: stop on floating point exceptions\n");CHKERRQ(ierr); 669e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," note on IBM RS6000 this slows run greatly\n");CHKERRQ(ierr); 670e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," -malloc_dump <optional filename>: dump list of unfreed memory at conclusion\n");CHKERRQ(ierr); 671e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," -malloc: use our error checking malloc\n");CHKERRQ(ierr); 672e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," -malloc no: don't use error checking malloc\n");CHKERRQ(ierr); 6734161f2a3SBarry Smith ierr = (*PetscHelpPrintf)(comm," -malloc_info: prints total memory usage\n");CHKERRQ(ierr); 6744161f2a3SBarry Smith ierr = (*PetscHelpPrintf)(comm," -malloc_log: keeps log of all memory allocations\n");CHKERRQ(ierr); 675e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," -malloc_debug: enables extended checking for memory corruption\n");CHKERRQ(ierr); 67626a7e8d4SBarry Smith ierr = (*PetscHelpPrintf)(comm," -options_view: dump list of options 
inputted\n");CHKERRQ(ierr); 677e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," -options_left: dump list of unused options\n");CHKERRQ(ierr); 678e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," -options_left no: don't dump list of unused options\n");CHKERRQ(ierr); 679e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," -tmp tmpdir: alternative /tmp directory\n");CHKERRQ(ierr); 680e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," -shared_tmp: tmp directory is shared by all processors\n");CHKERRQ(ierr); 681a8c7a070SBarry Smith ierr = (*PetscHelpPrintf)(comm," -not_shared_tmp: each processor has separate tmp directory\n");CHKERRQ(ierr); 6820841954dSBarry Smith ierr = (*PetscHelpPrintf)(comm," -memory_view: print memory usage at end of run\n");CHKERRQ(ierr); 683e5c89e4eSSatish Balay #if defined(PETSC_USE_LOG) 684e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," -get_total_flops: total flops over all processors\n");CHKERRQ(ierr); 685185ae32fSMatthew G. Knepley ierr = (*PetscHelpPrintf)(comm," -log_view [:filename:[format]]: logging objects and events\n");CHKERRQ(ierr); 686e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," -log_trace [filename]: prints trace of all PETSc calls\n");CHKERRQ(ierr); 687e5c89e4eSSatish Balay #if defined(PETSC_HAVE_MPE) 688495fc317SBarry Smith ierr = (*PetscHelpPrintf)(comm," -log_mpe: Also create logfile viewable through Jumpshot\n");CHKERRQ(ierr); 689e5c89e4eSSatish Balay #endif 6906cf91177SBarry Smith ierr = (*PetscHelpPrintf)(comm," -info <optional filename>: print informative messages about the calculations\n");CHKERRQ(ierr); 691e5c89e4eSSatish Balay #endif 692e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," -v: prints PETSc version number and release date\n");CHKERRQ(ierr); 693e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," -options_file <file>: reads options from file\n");CHKERRQ(ierr); 694e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm," -petsc_sleep n: sleeps n seconds before running 
program\n");CHKERRQ(ierr); 695e5c89e4eSSatish Balay ierr = (*PetscHelpPrintf)(comm,"-----------------------------------------------\n");CHKERRQ(ierr); 696e5c89e4eSSatish Balay } 697e5c89e4eSSatish Balay 69874ba8654SBarry Smith #if defined(PETSC_HAVE_POPEN) 69974ba8654SBarry Smith { 70074ba8654SBarry Smith char machine[128]; 701c5929fdfSBarry Smith ierr = PetscOptionsGetString(NULL,NULL,"-popen_machine",machine,128,&flg1);CHKERRQ(ierr); 70274ba8654SBarry Smith if (flg1) { 70374ba8654SBarry Smith ierr = PetscPOpenSetMachine(machine);CHKERRQ(ierr); 70474ba8654SBarry Smith } 70574ba8654SBarry Smith } 70674ba8654SBarry Smith #endif 70774ba8654SBarry Smith 708c5929fdfSBarry Smith ierr = PetscOptionsGetReal(NULL,NULL,"-petsc_sleep",&si,&flg1);CHKERRQ(ierr); 709e5c89e4eSSatish Balay if (flg1) { 710e5c89e4eSSatish Balay ierr = PetscSleep(si);CHKERRQ(ierr); 711e5c89e4eSSatish Balay } 712e5c89e4eSSatish Balay 713c5929fdfSBarry Smith ierr = PetscOptionsGetString(NULL,NULL,"-info_exclude",mname,PETSC_MAX_PATH_LEN,&flg1);CHKERRQ(ierr); 7142ea1be5dSBarry Smith if (flg1) { 715e5c89e4eSSatish Balay ierr = PetscStrstr(mname,"null",&f);CHKERRQ(ierr); 716e5c89e4eSSatish Balay if (f) { 717ecd8bba6SJed Brown ierr = PetscInfoDeactivateClass(0);CHKERRQ(ierr); 718e5c89e4eSSatish Balay } 7192ea1be5dSBarry Smith } 720827f890bSBarry Smith 721*fdc842d1SBarry Smith #if defined(PETSC_HAVE_VIENNACL) 722c5929fdfSBarry Smith ierr = PetscOptionsHasName(NULL,NULL,"-log_summary",&flg3);CHKERRQ(ierr); 723f14045dbSBarry Smith if (!flg3) { 724c5929fdfSBarry Smith ierr = PetscOptionsHasName(NULL,NULL,"-log_view",&flg3);CHKERRQ(ierr); 725f14045dbSBarry Smith } 726c5929fdfSBarry Smith ierr = PetscOptionsGetBool(NULL,NULL,"-viennacl_synchronize",&flg3,NULL);CHKERRQ(ierr); 727f14045dbSBarry Smith PetscViennaCLSynchronize = flg3; 728*fdc842d1SBarry Smith ierr = PetscViennaCLInit();CHKERRQ(ierr); 7294cf1874eSKarl Rupp #endif 73082f73ecaSAlejandro Lamas Daviña 731*fdc842d1SBarry Smith /* 732*fdc842d1SBarry Smith 
Creates the logging data structures; this is enabled even if logging is not turned on 733*fdc842d1SBarry Smith This is the last thing we do before returning to the user code to prevent having the 734*fdc842d1SBarry Smith logging numbers contaminated by any startup time associated with MPI and the GPUs 735*fdc842d1SBarry Smith */ 736*fdc842d1SBarry Smith #if defined(PETSC_USE_LOG) 737*fdc842d1SBarry Smith ierr = PetscLogInitialize();CHKERRQ(ierr); 738f0a7718cSKarl Rupp #endif 739f0a7718cSKarl Rupp 740e5c89e4eSSatish Balay PetscFunctionReturn(0); 741e5c89e4eSSatish Balay } 742