xref: /petsc/src/sys/error/errtrace.c (revision 811af0c4b09a35de4306c442f88bd09fdc09897d)
10039db0dSBarry Smith #define PETSC_DESIRE_FEATURE_TEST_MACROS /* for fileno() */
2c6db04a5SJed Brown #include <petscsys.h>                    /*I "petscsys.h" I*/
3f67a399dSBarry Smith #include <petsc/private/petscimpl.h>
4c6db04a5SJed Brown #include <petscconfiginfo.h>
5114011d0SBarry Smith #if defined(PETSC_HAVE_UNISTD_H)
6114011d0SBarry Smith #include <unistd.h>
7114011d0SBarry Smith #endif
8e5c89e4eSSatish Balay 
9e5c89e4eSSatish Balay /*@C
10*811af0c4SBarry Smith    PetscIgnoreErrorHandler - Deprecated, use `PetscReturnErrorHandler()`. Ignores the error, allows program to continue as if error did not occure
11e5c89e4eSSatish Balay 
12e5c89e4eSSatish Balay    Not Collective
13e5c89e4eSSatish Balay 
14e5c89e4eSSatish Balay    Input Parameters:
15e32f2f54SBarry Smith +  comm - communicator over which error occurred
16e32f2f54SBarry Smith .  line - the line number of the error (indicated by __LINE__)
17e5c89e4eSSatish Balay .  file - the file in which the error was detected (indicated by __FILE__)
18e5c89e4eSSatish Balay .  mess - an error text string, usually just printed to the screen
19e5c89e4eSSatish Balay .  n - the generic error number
20e5c89e4eSSatish Balay .  p - specific error number
21e5c89e4eSSatish Balay -  ctx - error handler context
22e5c89e4eSSatish Balay 
23e5c89e4eSSatish Balay    Level: developer
24e5c89e4eSSatish Balay 
25*811af0c4SBarry Smith    Note:
26*811af0c4SBarry Smith    Users do not directly call this routine
27e5c89e4eSSatish Balay 
28db781477SPatrick Sanan .seealso: `PetscReturnErrorHandler()`
29e5c89e4eSSatish Balay  @*/
309371c9d4SSatish Balay PetscErrorCode PetscIgnoreErrorHandler(MPI_Comm comm, int line, const char *fun, const char *file, PetscErrorCode n, PetscErrorType p, const char *mess, void *ctx) {
3111cc89d2SBarry Smith   return n;
32e5c89e4eSSatish Balay }
33e5c89e4eSSatish Balay 
34107894f0SSatish Balay /* ---------------------------------------------------------------------------------------*/
35107894f0SSatish Balay 
365abee1b0SJed Brown static char      arch[128], hostname[128], username[128], pname[PETSC_MAX_PATH_LEN], date[128];
37ace3abfcSBarry Smith static PetscBool PetscErrorPrintfInitializeCalled = PETSC_FALSE;
383f6e4ae9SSatish Balay static char      version[256];
39107894f0SSatish Balay 
40107894f0SSatish Balay /*
41107894f0SSatish Balay    Initializes arch, hostname, username, date so that system calls do NOT need
42107894f0SSatish Balay    to be made during the error handler.
43107894f0SSatish Balay */
449371c9d4SSatish Balay PetscErrorCode PetscErrorPrintfInitialize(void) {
45ace3abfcSBarry Smith   PetscBool use_stdout = PETSC_FALSE, use_none = PETSC_FALSE;
46107894f0SSatish Balay 
47107894f0SSatish Balay   PetscFunctionBegin;
489566063dSJacob Faibussowitsch   PetscCall(PetscGetArchType(arch, sizeof(arch)));
499566063dSJacob Faibussowitsch   PetscCall(PetscGetHostName(hostname, sizeof(hostname)));
509566063dSJacob Faibussowitsch   PetscCall(PetscGetUserName(username, sizeof(username)));
519566063dSJacob Faibussowitsch   PetscCall(PetscGetProgramName(pname, sizeof(pname)));
529566063dSJacob Faibussowitsch   PetscCall(PetscGetDate(date, sizeof(date)));
539566063dSJacob Faibussowitsch   PetscCall(PetscGetVersion(version, sizeof(version)));
54e8fb0fc0SBarry Smith 
559566063dSJacob Faibussowitsch   PetscCall(PetscOptionsGetBool(NULL, NULL, "-error_output_stdout", &use_stdout, NULL));
56a297a907SKarl Rupp   if (use_stdout) PETSC_STDERR = PETSC_STDOUT;
579566063dSJacob Faibussowitsch   PetscCall(PetscOptionsGetBool(NULL, NULL, "-error_output_none", &use_none, NULL));
58a297a907SKarl Rupp   if (use_none) PetscErrorPrintf = PetscErrorPrintfNone;
59107894f0SSatish Balay   PetscErrorPrintfInitializeCalled = PETSC_TRUE;
60107894f0SSatish Balay   PetscFunctionReturn(0);
61107894f0SSatish Balay }
62107894f0SSatish Balay 
639371c9d4SSatish Balay PetscErrorCode PetscErrorPrintfNone(const char format[], ...) {
64e8fb0fc0SBarry Smith   return 0;
65e8fb0fc0SBarry Smith }
66e8fb0fc0SBarry Smith 
679371c9d4SSatish Balay PetscErrorCode PetscErrorPrintfDefault(const char format[], ...) {
68e8fb0fc0SBarry Smith   va_list          Argp;
69ace3abfcSBarry Smith   static PetscBool PetscErrorPrintfCalled = PETSC_FALSE;
70e8fb0fc0SBarry Smith 
71e8fb0fc0SBarry Smith   /*
72e8fb0fc0SBarry Smith       This function does not call PetscFunctionBegin and PetscFunctionReturn() because
73e8fb0fc0SBarry Smith     it may be called by PetscStackView().
74e8fb0fc0SBarry Smith 
75e8fb0fc0SBarry Smith       This function does not do error checking because it is called by the error handlers.
76e8fb0fc0SBarry Smith   */
77e8fb0fc0SBarry Smith 
78e8fb0fc0SBarry Smith   if (!PetscErrorPrintfCalled) {
79e8fb0fc0SBarry Smith     PetscErrorPrintfCalled = PETSC_TRUE;
80e8fb0fc0SBarry Smith 
81e8fb0fc0SBarry Smith     /*
82e8fb0fc0SBarry Smith         On the SGI machines and Cray T3E, if errors are generated  "simultaneously" by
83e8fb0fc0SBarry Smith       different processors, the messages are printed all jumbled up; to try to
84e8fb0fc0SBarry Smith       prevent this we have each processor wait based on their rank
85e8fb0fc0SBarry Smith     */
86e8fb0fc0SBarry Smith #if defined(PETSC_CAN_SLEEP_AFTER_ERROR)
87e8fb0fc0SBarry Smith     {
88e8fb0fc0SBarry Smith       PetscMPIInt rank;
89a297a907SKarl Rupp       if (PetscGlobalRank > 8) rank = 8;
90a297a907SKarl Rupp       else rank = PetscGlobalRank;
91a6d0e24fSJed Brown       PetscSleep((PetscReal)rank);
92e8fb0fc0SBarry Smith     }
93e8fb0fc0SBarry Smith #endif
94e8fb0fc0SBarry Smith   }
95e8fb0fc0SBarry Smith 
961179db26SBarry Smith   PetscFPrintf(PETSC_COMM_SELF, PETSC_STDERR, "[%d]PETSC ERROR: ", PetscGlobalRank);
97e8fb0fc0SBarry Smith   va_start(Argp, format);
981179db26SBarry Smith   (*PetscVFPrintf)(PETSC_STDERR, format, Argp);
99e8fb0fc0SBarry Smith   va_end(Argp);
100e8fb0fc0SBarry Smith   return 0;
101e8fb0fc0SBarry Smith }
102e8fb0fc0SBarry Smith 
/*
   Emits the terminal escape sequence that starts highlighting of error output.

   On some systems when the stderr is nested through several levels of shell script
   before being passed to a file the isatty() falsely returns true resulting in
   the screen highlight variables being passed through the test harness. Therefore
   simply do not highlight when the PETSC_STDERR is PETSC_STDOUT.
*/
static void PetscErrorPrintfHilight(void) {
#if defined(PETSC_HAVE_UNISTD_H) && defined(PETSC_USE_ISATTY)
  /* Only decorate output produced by the default printer */
  if (PetscErrorPrintf != PetscErrorPrintfDefault) return;
  /* See the comment above: never highlight when errors are redirected to stdout */
  if (PETSC_STDERR == PETSC_STDOUT) return;
  /* Escape sequences are only written to a terminal */
  if (!isatty(fileno(PETSC_STDERR))) return;
  fprintf(PETSC_STDERR, "\033[1;31m");
#endif
}
116114011d0SBarry Smith 
/*
   Emits the terminal escape sequences that end highlighting of error output.
   Written under the same conditions as in PetscErrorPrintfHilight(): default
   printer, PETSC_STDERR distinct from PETSC_STDOUT, and output going to a terminal.
*/
static void PetscErrorPrintfNormal(void) {
#if defined(PETSC_HAVE_UNISTD_H) && defined(PETSC_USE_ISATTY)
  if (PetscErrorPrintf != PetscErrorPrintfDefault) return;
  if (PETSC_STDERR == PETSC_STDOUT) return;
  if (!isatty(fileno(PETSC_STDERR))) return;
  fprintf(PETSC_STDERR, "\033[0;39m\033[0;49m");
#endif
}
124114011d0SBarry Smith 
12595c0884eSLisandro Dalcin PETSC_EXTERN PetscErrorCode PetscOptionsViewError(void);
126114011d0SBarry Smith 
127e5c89e4eSSatish Balay /*@C
128e5c89e4eSSatish Balay 
129e5c89e4eSSatish Balay    PetscTraceBackErrorHandler - Default error handler routine that generates
130e5c89e4eSSatish Balay    a traceback on error detection.
131e5c89e4eSSatish Balay 
132e5c89e4eSSatish Balay    Not Collective
133e5c89e4eSSatish Balay 
134e5c89e4eSSatish Balay    Input Parameters:
135e32f2f54SBarry Smith +  comm - communicator over which error occurred
136e32f2f54SBarry Smith .  line - the line number of the error (indicated by __LINE__)
137e5c89e4eSSatish Balay .  file - the file in which the error was detected (indicated by __FILE__)
138e5c89e4eSSatish Balay .  mess - an error text string, usually just printed to the screen
139e5c89e4eSSatish Balay .  n - the generic error number
140*811af0c4SBarry Smith .  p - `PETSC_ERROR_INITIAL` if this is the first call the error handler, otherwise `PETSC_ERROR_REPEAT`
141e5c89e4eSSatish Balay -  ctx - error handler context
142e5c89e4eSSatish Balay 
143*811af0c4SBarry Smith   Options Database Keys:
14445b666d6SBarry Smith +  -error_output_stdout - output the error messages to stdout instead of the default stderr
14545b666d6SBarry Smith -  -error_output_none - do not output the error messages
146e5c89e4eSSatish Balay 
147e5c89e4eSSatish Balay    Notes:
148*811af0c4SBarry Smith    Users do not directly call this routine
149e5c89e4eSSatish Balay 
150*811af0c4SBarry Smith    Use `PetscPushErrorHandler()` to set the desired error handler.
151e5c89e4eSSatish Balay 
15245b666d6SBarry Smith    Level: developer
153e5c89e4eSSatish Balay 
154db781477SPatrick Sanan .seealso: `PetscError()`, `PetscPushErrorHandler()`, `PetscPopErrorHandler()`, `PetscAttachDebuggerErrorHandler()`,
155db781477SPatrick Sanan           `PetscAbortErrorHandler()`, `PetscMPIAbortErrorHandler()`, `PetscReturnErrorHandler()`, `PetscEmacsClientErrorHandler()`
156e5c89e4eSSatish Balay  @*/
1579371c9d4SSatish Balay PetscErrorCode PetscTraceBackErrorHandler(MPI_Comm comm, int line, const char *fun, const char *file, PetscErrorCode n, PetscErrorType p, const char *mess, void *ctx) {
158e5c89e4eSSatish Balay   PetscLogDouble mem, rss;
159574034a9SJed Brown   PetscBool      flg1 = PETSC_FALSE, flg2 = PETSC_FALSE, flg3 = PETSC_FALSE;
160997adca8SBarry Smith   PetscMPIInt    rank = 0;
161e5c89e4eSSatish Balay 
162a297a907SKarl Rupp   if (comm != PETSC_COMM_SELF) MPI_Comm_rank(comm, &rank);
163a297a907SKarl Rupp 
164660278c0SBarry Smith   if (rank == 0 && (!PetscCIEnabledPortableErrorOutput || PetscGlobalRank == 0)) {
165fbfcfee5SBarry Smith     PetscBool  ismain;
166114011d0SBarry Smith     static int cnt = 1;
167114011d0SBarry Smith 
16857a177adSBarry Smith     if (cnt == 1) {
169114011d0SBarry Smith       PetscErrorPrintfHilight();
170114011d0SBarry Smith       (*PetscErrorPrintf)("--------------------- Error Message --------------------------------------------------------------\n");
1715f3a2c8dSBarry Smith       PetscErrorPrintfNormal();
172e5c89e4eSSatish Balay       if (n == PETSC_ERR_MEM) {
173e5c89e4eSSatish Balay         (*PetscErrorPrintf)("Out of memory. This could be due to allocating\n");
174e5c89e4eSSatish Balay         (*PetscErrorPrintf)("too large an object or bleeding by not properly\n");
175e5c89e4eSSatish Balay         (*PetscErrorPrintf)("destroying unneeded objects.\n");
176e5c89e4eSSatish Balay         PetscMallocGetCurrentUsage(&mem);
177e5c89e4eSSatish Balay         PetscMemoryGetCurrentUsage(&rss);
178c5929fdfSBarry Smith         PetscOptionsGetBool(NULL, NULL, "-malloc_dump", &flg1, NULL);
17992f119d6SBarry Smith         PetscOptionsGetBool(NULL, NULL, "-malloc_view", &flg2, NULL);
18092f119d6SBarry Smith         PetscOptionsHasName(NULL, NULL, "-malloc_view_threshold", &flg3);
18192f119d6SBarry Smith         if (flg2 || flg3) PetscMallocView(stdout);
182a297a907SKarl Rupp         else {
183b85f3346SJed Brown           (*PetscErrorPrintf)("Memory allocated %.0f Memory used by process %.0f\n", mem, rss);
184a297a907SKarl Rupp           if (flg1) PetscMallocDump(stdout);
18592f119d6SBarry Smith           else (*PetscErrorPrintf)("Try running with -malloc_dump or -malloc_view for info.\n");
186e5c89e4eSSatish Balay         }
187e5c89e4eSSatish Balay       } else {
188e5c89e4eSSatish Balay         const char *text;
1890298fd71SBarry Smith         PetscErrorMessage(n, &text, NULL);
190114011d0SBarry Smith         if (text) (*PetscErrorPrintf)("%s\n", text);
191e5c89e4eSSatish Balay       }
192114011d0SBarry Smith       if (mess) (*PetscErrorPrintf)("%s\n", mess);
193f4bc716fSBarry Smith       PetscOptionsLeftError();
194a17b96a8SKyle Gerard Felker       (*PetscErrorPrintf)("See https://petsc.org/release/faq/ for trouble shooting.\n");
195660278c0SBarry Smith       if (!PetscCIEnabledPortableErrorOutput) {
196107894f0SSatish Balay         (*PetscErrorPrintf)("%s\n", version);
197a297a907SKarl Rupp         if (PetscErrorPrintfInitializeCalled) (*PetscErrorPrintf)("%s on a %s named %s by %s %s\n", pname, arch, hostname, username, date);
198107894f0SSatish Balay         (*PetscErrorPrintf)("Configure options %s\n", petscconfigureoptions);
199107894f0SSatish Balay       }
200660278c0SBarry Smith     }
201997adca8SBarry Smith     /* print line of stack trace */
202660278c0SBarry Smith     if (fun) (*PetscErrorPrintf)("#%d %s() at %s:%d\n", cnt++, fun, PetscCIFilename(file), PetscCILinenumber(line));
203660278c0SBarry Smith     else if (file) (*PetscErrorPrintf)("#%d %s:%d\n", cnt++, PetscCIFilename(file), PetscCILinenumber(line));
20449c86fc7SBarry Smith     if (fun) {
205114011d0SBarry Smith       PetscStrncmp(fun, "main", 4, &ismain);
206fbfcfee5SBarry Smith       if (ismain) {
207ad540459SPierre Jolivet         if ((n <= PETSC_ERR_MIN_VALUE) || (n >= PETSC_ERR_MAX_VALUE)) (*PetscErrorPrintf)("Reached the main program with an out-of-range error code %d. This should never happen\n", n);
208e11779c2SBarry Smith         PetscOptionsViewError();
209114011d0SBarry Smith         PetscErrorPrintfHilight();
210f15a11d2SBarry Smith         (*PetscErrorPrintf)("----------------End of Error Message -------send entire error message to petsc-maint@mcs.anl.gov----------\n");
211114011d0SBarry Smith         PetscErrorPrintfNormal();
212114011d0SBarry Smith       }
21349c86fc7SBarry Smith     }
214997adca8SBarry Smith   } else {
215a5b23f4aSJose E. Roman     /* do not print error messages since process 0 will print them, sleep before aborting so will not accidentally kill process 0*/
216997adca8SBarry Smith     PetscSleep(10.0);
217c16385d5SBarry Smith     exit(0);
218997adca8SBarry Smith   }
219362febeeSStefano Zampini   return n;
220e5c89e4eSSatish Balay }
221