xref: /petsc/src/sys/error/errtrace.c (revision aaa8cc7d2a5c3913edcbb923e20f154fe9c4aa65)
10039db0dSBarry Smith #define PETSC_DESIRE_FEATURE_TEST_MACROS /* for fileno() */
2c6db04a5SJed Brown #include <petscsys.h>                    /*I "petscsys.h" I*/
3f67a399dSBarry Smith #include <petsc/private/petscimpl.h>
4c6db04a5SJed Brown #include <petscconfiginfo.h>
5114011d0SBarry Smith #if defined(PETSC_HAVE_UNISTD_H)
6114011d0SBarry Smith   #include <unistd.h>
7114011d0SBarry Smith #endif
8e5c89e4eSSatish Balay 
9e5c89e4eSSatish Balay /*@C
10*aaa8cc7dSPierre Jolivet    PetscIgnoreErrorHandler - Deprecated, use `PetscReturnErrorHandler()`. Ignores the error, allows program to continue as if error did not occur
11e5c89e4eSSatish Balay 
12e5c89e4eSSatish Balay    Not Collective
13e5c89e4eSSatish Balay 
14e5c89e4eSSatish Balay    Input Parameters:
15e32f2f54SBarry Smith +  comm - communicator over which error occurred
16e32f2f54SBarry Smith .  line - the line number of the error (indicated by __LINE__)
17e5c89e4eSSatish Balay .  file - the file in which the error was detected (indicated by __FILE__)
18e5c89e4eSSatish Balay .  mess - an error text string, usually just printed to the screen
19e5c89e4eSSatish Balay .  n - the generic error number
20e5c89e4eSSatish Balay .  p - specific error number
21e5c89e4eSSatish Balay -  ctx - error handler context
22e5c89e4eSSatish Balay 
23e5c89e4eSSatish Balay    Level: developer
24e5c89e4eSSatish Balay 
25811af0c4SBarry Smith    Note:
26811af0c4SBarry Smith    Users do not directly call this routine
27e5c89e4eSSatish Balay 
28db781477SPatrick Sanan .seealso: `PetscReturnErrorHandler()`
29e5c89e4eSSatish Balay  @*/
30d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscIgnoreErrorHandler(MPI_Comm comm, int line, const char *fun, const char *file, PetscErrorCode n, PetscErrorType p, const char *mess, void *ctx)
31d71ae5a4SJacob Faibussowitsch {
3211cc89d2SBarry Smith   return n;
33e5c89e4eSSatish Balay }
34e5c89e4eSSatish Balay 
35107894f0SSatish Balay /* ---------------------------------------------------------------------------------------*/
36107894f0SSatish Balay 
375abee1b0SJed Brown static char      arch[128], hostname[128], username[128], pname[PETSC_MAX_PATH_LEN], date[128];
38ace3abfcSBarry Smith static PetscBool PetscErrorPrintfInitializeCalled = PETSC_FALSE;
393f6e4ae9SSatish Balay static char      version[256];
40107894f0SSatish Balay 
41107894f0SSatish Balay /*
42107894f0SSatish Balay    Initializes arch, hostname, username, date so that system calls do NOT need
43107894f0SSatish Balay    to be made during the error handler.
44107894f0SSatish Balay */
45d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscErrorPrintfInitialize(void)
46d71ae5a4SJacob Faibussowitsch {
47ace3abfcSBarry Smith   PetscBool use_stdout = PETSC_FALSE, use_none = PETSC_FALSE;
48107894f0SSatish Balay 
49107894f0SSatish Balay   PetscFunctionBegin;
509566063dSJacob Faibussowitsch   PetscCall(PetscGetArchType(arch, sizeof(arch)));
519566063dSJacob Faibussowitsch   PetscCall(PetscGetHostName(hostname, sizeof(hostname)));
529566063dSJacob Faibussowitsch   PetscCall(PetscGetUserName(username, sizeof(username)));
539566063dSJacob Faibussowitsch   PetscCall(PetscGetProgramName(pname, sizeof(pname)));
549566063dSJacob Faibussowitsch   PetscCall(PetscGetDate(date, sizeof(date)));
559566063dSJacob Faibussowitsch   PetscCall(PetscGetVersion(version, sizeof(version)));
56e8fb0fc0SBarry Smith 
579566063dSJacob Faibussowitsch   PetscCall(PetscOptionsGetBool(NULL, NULL, "-error_output_stdout", &use_stdout, NULL));
58a297a907SKarl Rupp   if (use_stdout) PETSC_STDERR = PETSC_STDOUT;
599566063dSJacob Faibussowitsch   PetscCall(PetscOptionsGetBool(NULL, NULL, "-error_output_none", &use_none, NULL));
60a297a907SKarl Rupp   if (use_none) PetscErrorPrintf = PetscErrorPrintfNone;
61107894f0SSatish Balay   PetscErrorPrintfInitializeCalled = PETSC_TRUE;
623ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
63107894f0SSatish Balay }
64107894f0SSatish Balay 
65d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscErrorPrintfNone(const char format[], ...)
66d71ae5a4SJacob Faibussowitsch {
673ba16761SJacob Faibussowitsch   return PETSC_SUCCESS;
68e8fb0fc0SBarry Smith }
69e8fb0fc0SBarry Smith 
70d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscErrorPrintfDefault(const char format[], ...)
71d71ae5a4SJacob Faibussowitsch {
72e8fb0fc0SBarry Smith   va_list          Argp;
73ace3abfcSBarry Smith   static PetscBool PetscErrorPrintfCalled = PETSC_FALSE;
743ba16761SJacob Faibussowitsch   PetscErrorCode   ierr;
75e8fb0fc0SBarry Smith 
76e8fb0fc0SBarry Smith   /*
77e8fb0fc0SBarry Smith       This function does not call PetscFunctionBegin and PetscFunctionReturn() because
78e8fb0fc0SBarry Smith     it may be called by PetscStackView().
79e8fb0fc0SBarry Smith 
80e8fb0fc0SBarry Smith       This function does not do error checking because it is called by the error handlers.
81e8fb0fc0SBarry Smith   */
82e8fb0fc0SBarry Smith 
83e8fb0fc0SBarry Smith   if (!PetscErrorPrintfCalled) {
84e8fb0fc0SBarry Smith     PetscErrorPrintfCalled = PETSC_TRUE;
85e8fb0fc0SBarry Smith 
86e8fb0fc0SBarry Smith     /*
87e8fb0fc0SBarry Smith         On the SGI machines and Cray T3E, if errors are generated  "simultaneously" by
88e8fb0fc0SBarry Smith       different processors, the messages are printed all jumbled up; to try to
89e8fb0fc0SBarry Smith       prevent this we have each processor wait based on their rank
90e8fb0fc0SBarry Smith     */
91e8fb0fc0SBarry Smith #if defined(PETSC_CAN_SLEEP_AFTER_ERROR)
92e8fb0fc0SBarry Smith     {
933ba16761SJacob Faibussowitsch       PetscMPIInt rank = PetscGlobalRank > 8 ? 8 : PetscGlobalRank;
943ba16761SJacob Faibussowitsch       ierr             = PetscSleep((PetscReal)rank);
953ba16761SJacob Faibussowitsch       (void)ierr;
96e8fb0fc0SBarry Smith     }
97e8fb0fc0SBarry Smith #endif
98e8fb0fc0SBarry Smith   }
99e8fb0fc0SBarry Smith 
1003ba16761SJacob Faibussowitsch   ierr = PetscFPrintf(PETSC_COMM_SELF, PETSC_STDERR, "[%d]PETSC ERROR: ", PetscGlobalRank);
101e8fb0fc0SBarry Smith   va_start(Argp, format);
1023ba16761SJacob Faibussowitsch   ierr = (*PetscVFPrintf)(PETSC_STDERR, format, Argp);
1033ba16761SJacob Faibussowitsch   (void)ierr;
104e8fb0fc0SBarry Smith   va_end(Argp);
1053ba16761SJacob Faibussowitsch   return PETSC_SUCCESS;
106e8fb0fc0SBarry Smith }
107e8fb0fc0SBarry Smith 
/*
   PetscErrorPrintfHilight - Writes the escape sequence "\033[1;31m" to PETSC_STDERR when the
   default error printer is active and PETSC_STDERR is a terminal. Does nothing unless both
   PETSC_HAVE_UNISTD_H and PETSC_USE_ISATTY are defined.

   On some systems when the stderr is nested through several levels of shell script
   before being passed to a file the isatty() falsely returns true resulting in
   the screen highlight variables being passed through the test harness. Therefore
   simply do not highlight when the PETSC_STDERR is PETSC_STDOUT.
*/
static void PetscErrorPrintfHilight(void)
{
#if defined(PETSC_HAVE_UNISTD_H) && defined(PETSC_USE_ISATTY)
  if (PetscErrorPrintf != PetscErrorPrintfDefault) return; /* a custom or silent printer is installed */
  if (PETSC_STDERR == PETSC_STDOUT) return;                /* see the note above about nested shells */
  if (!isatty(fileno(PETSC_STDERR))) return;               /* not a terminal */
  fprintf(PETSC_STDERR, "\033[1;31m");
#endif
}
122114011d0SBarry Smith 
/*
   PetscErrorPrintfNormal - Writes the escape sequences "\033[0;39m\033[0;49m" to PETSC_STDERR
   under the same conditions PetscErrorPrintfHilight() uses: default error printer active,
   PETSC_STDERR distinct from PETSC_STDOUT, and PETSC_STDERR a terminal. Does nothing unless
   both PETSC_HAVE_UNISTD_H and PETSC_USE_ISATTY are defined.
*/
static void PetscErrorPrintfNormal(void)
{
#if defined(PETSC_HAVE_UNISTD_H) && defined(PETSC_USE_ISATTY)
  if (PetscErrorPrintf != PetscErrorPrintfDefault) return; /* a custom or silent printer is installed */
  if (PETSC_STDERR == PETSC_STDOUT) return;                /* never emit escapes when errors go to stdout */
  if (!isatty(fileno(PETSC_STDERR))) return;               /* not a terminal */
  fprintf(PETSC_STDERR, "\033[0;39m\033[0;49m");
#endif
}
131114011d0SBarry Smith 
13295c0884eSLisandro Dalcin PETSC_EXTERN PetscErrorCode PetscOptionsViewError(void);
133114011d0SBarry Smith 
134e5c89e4eSSatish Balay /*@C
135e5c89e4eSSatish Balay 
136e5c89e4eSSatish Balay    PetscTraceBackErrorHandler - Default error handler routine that generates
137e5c89e4eSSatish Balay    a traceback on error detection.
138e5c89e4eSSatish Balay 
139e5c89e4eSSatish Balay    Not Collective
140e5c89e4eSSatish Balay 
141e5c89e4eSSatish Balay    Input Parameters:
142e32f2f54SBarry Smith +  comm - communicator over which error occurred
143e32f2f54SBarry Smith .  line - the line number of the error (indicated by __LINE__)
144e5c89e4eSSatish Balay .  file - the file in which the error was detected (indicated by __FILE__)
145e5c89e4eSSatish Balay .  mess - an error text string, usually just printed to the screen
146e5c89e4eSSatish Balay .  n - the generic error number
147811af0c4SBarry Smith .  p - `PETSC_ERROR_INITIAL` if this is the first call the error handler, otherwise `PETSC_ERROR_REPEAT`
148e5c89e4eSSatish Balay -  ctx - error handler context
149e5c89e4eSSatish Balay 
150811af0c4SBarry Smith   Options Database Keys:
15145b666d6SBarry Smith +  -error_output_stdout - output the error messages to stdout instead of the default stderr
15245b666d6SBarry Smith -  -error_output_none - do not output the error messages
153e5c89e4eSSatish Balay 
154e5c89e4eSSatish Balay    Notes:
155811af0c4SBarry Smith    Users do not directly call this routine
156e5c89e4eSSatish Balay 
157811af0c4SBarry Smith    Use `PetscPushErrorHandler()` to set the desired error handler.
158e5c89e4eSSatish Balay 
15945b666d6SBarry Smith    Level: developer
160e5c89e4eSSatish Balay 
161db781477SPatrick Sanan .seealso: `PetscError()`, `PetscPushErrorHandler()`, `PetscPopErrorHandler()`, `PetscAttachDebuggerErrorHandler()`,
162db781477SPatrick Sanan           `PetscAbortErrorHandler()`, `PetscMPIAbortErrorHandler()`, `PetscReturnErrorHandler()`, `PetscEmacsClientErrorHandler()`
163e5c89e4eSSatish Balay  @*/
164d71ae5a4SJacob Faibussowitsch PetscErrorCode PetscTraceBackErrorHandler(MPI_Comm comm, int line, const char *fun, const char *file, PetscErrorCode n, PetscErrorType p, const char *mess, void *ctx)
165d71ae5a4SJacob Faibussowitsch {
1663ba16761SJacob Faibussowitsch   PetscErrorCode ierr;
167e5c89e4eSSatish Balay   PetscLogDouble mem, rss;
168574034a9SJed Brown   PetscBool      flg1 = PETSC_FALSE, flg2 = PETSC_FALSE, flg3 = PETSC_FALSE;
169997adca8SBarry Smith   PetscMPIInt    rank = 0;
170e5c89e4eSSatish Balay 
171a297a907SKarl Rupp   if (comm != PETSC_COMM_SELF) MPI_Comm_rank(comm, &rank);
172a297a907SKarl Rupp 
173660278c0SBarry Smith   if (rank == 0 && (!PetscCIEnabledPortableErrorOutput || PetscGlobalRank == 0)) {
174114011d0SBarry Smith     static int cnt = 1;
175114011d0SBarry Smith 
17657a177adSBarry Smith     if (cnt == 1) {
177114011d0SBarry Smith       PetscErrorPrintfHilight();
1783ba16761SJacob Faibussowitsch       ierr = (*PetscErrorPrintf)("--------------------- Error Message --------------------------------------------------------------\n");
1795f3a2c8dSBarry Smith       PetscErrorPrintfNormal();
180e5c89e4eSSatish Balay       if (n == PETSC_ERR_MEM) {
1813ba16761SJacob Faibussowitsch         ierr = (*PetscErrorPrintf)("Out of memory. This could be due to allocating\n");
1823ba16761SJacob Faibussowitsch         ierr = (*PetscErrorPrintf)("too large an object or bleeding by not properly\n");
1833ba16761SJacob Faibussowitsch         ierr = (*PetscErrorPrintf)("destroying unneeded objects.\n");
1843ba16761SJacob Faibussowitsch         ierr = PetscMallocGetCurrentUsage(&mem);
1853ba16761SJacob Faibussowitsch         ierr = PetscMemoryGetCurrentUsage(&rss);
1863ba16761SJacob Faibussowitsch         ierr = PetscOptionsGetBool(NULL, NULL, "-malloc_dump", &flg1, NULL);
1873ba16761SJacob Faibussowitsch         ierr = PetscOptionsGetBool(NULL, NULL, "-malloc_view", &flg2, NULL);
1883ba16761SJacob Faibussowitsch         ierr = PetscOptionsHasName(NULL, NULL, "-malloc_view_threshold", &flg3);
1893ba16761SJacob Faibussowitsch         if (flg2 || flg3) ierr = PetscMallocView(stdout);
190a297a907SKarl Rupp         else {
1913ba16761SJacob Faibussowitsch           ierr = (*PetscErrorPrintf)("Memory allocated %.0f Memory used by process %.0f\n", mem, rss);
1923ba16761SJacob Faibussowitsch           if (flg1) ierr = PetscMallocDump(stdout);
1933ba16761SJacob Faibussowitsch           else ierr = (*PetscErrorPrintf)("Try running with -malloc_dump or -malloc_view for info.\n");
194e5c89e4eSSatish Balay         }
195e5c89e4eSSatish Balay       } else {
196e5c89e4eSSatish Balay         const char *text;
1973ba16761SJacob Faibussowitsch         ierr = PetscErrorMessage(n, &text, NULL);
1983ba16761SJacob Faibussowitsch         if (text) ierr = (*PetscErrorPrintf)("%s\n", text);
199e5c89e4eSSatish Balay       }
2003ba16761SJacob Faibussowitsch       if (mess) ierr = (*PetscErrorPrintf)("%s\n", mess);
2013ba16761SJacob Faibussowitsch       ierr = PetscOptionsLeftError();
2023ba16761SJacob Faibussowitsch       ierr = (*PetscErrorPrintf)("See https://petsc.org/release/faq/ for trouble shooting.\n");
203660278c0SBarry Smith       if (!PetscCIEnabledPortableErrorOutput) {
2043ba16761SJacob Faibussowitsch         ierr = (*PetscErrorPrintf)("%s\n", version);
2053ba16761SJacob Faibussowitsch         if (PetscErrorPrintfInitializeCalled) ierr = (*PetscErrorPrintf)("%s on a %s named %s by %s %s\n", pname, arch, hostname, username, date);
2063ba16761SJacob Faibussowitsch         ierr = (*PetscErrorPrintf)("Configure options %s\n", petscconfigureoptions);
207107894f0SSatish Balay       }
208660278c0SBarry Smith     }
209997adca8SBarry Smith     /* print line of stack trace */
2103ba16761SJacob Faibussowitsch     if (fun) ierr = (*PetscErrorPrintf)("#%d %s() at %s:%d\n", cnt++, fun, PetscCIFilename(file), PetscCILinenumber(line));
2113ba16761SJacob Faibussowitsch     else if (file) ierr = (*PetscErrorPrintf)("#%d %s:%d\n", cnt++, PetscCIFilename(file), PetscCILinenumber(line));
21249c86fc7SBarry Smith     if (fun) {
213bbcf679cSJacob Faibussowitsch       PetscBool ismain = PETSC_FALSE;
214bbcf679cSJacob Faibussowitsch 
2153ba16761SJacob Faibussowitsch       ierr = PetscStrncmp(fun, "main", 4, &ismain);
216fbfcfee5SBarry Smith       if (ismain) {
2173ba16761SJacob Faibussowitsch         if ((n <= PETSC_ERR_MIN_VALUE) || (n >= PETSC_ERR_MAX_VALUE)) ierr = (*PetscErrorPrintf)("Reached the main program with an out-of-range error code %d. This should never happen\n", n);
2183ba16761SJacob Faibussowitsch         ierr = PetscOptionsViewError();
219114011d0SBarry Smith         PetscErrorPrintfHilight();
2203ba16761SJacob Faibussowitsch         ierr = (*PetscErrorPrintf)("----------------End of Error Message -------send entire error message to petsc-maint@mcs.anl.gov----------\n");
221114011d0SBarry Smith         PetscErrorPrintfNormal();
222114011d0SBarry Smith       }
22349c86fc7SBarry Smith     }
224997adca8SBarry Smith   } else {
225a5b23f4aSJose E. Roman     /* do not print error messages since process 0 will print them, sleep before aborting so will not accidentally kill process 0*/
2263ba16761SJacob Faibussowitsch     ierr = PetscSleep(10.0);
227c16385d5SBarry Smith     exit(0);
228997adca8SBarry Smith   }
2293ba16761SJacob Faibussowitsch   (void)ierr;
230362febeeSStefano Zampini   return n;
231e5c89e4eSSatish Balay }
232