This source file includes the following definitions.
- orte_err2str
- orte_job_state_to_str
- orte_app_ctx_state_to_str
- orte_proc_state_to_str
- orte_node_state_to_str
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25 #include "orte_config.h"
26 #include "orte/constants.h"
27
28 #include <stdio.h>
29 #ifdef HAVE_SYS_SIGNAL_H
30 #include <sys/signal.h>
31 #else
32 #include <signal.h>
33 #endif
34
35 #include "orte/mca/plm/plm_types.h"
36 #include "orte/util/error_strings.h"
37 #include "orte/runtime/orte_globals.h"
38
39 int orte_err2str(int errnum, const char **errmsg)
40 {
41 const char *retval;
42 switch (errnum) {
43 case ORTE_SUCCESS:
44 retval = "Success";
45 break;
46 case ORTE_ERR_RECV_LESS_THAN_POSTED:
47 retval = "Receive was less than posted size";
48 break;
49 case ORTE_ERR_RECV_MORE_THAN_POSTED:
50 retval = "Receive was greater than posted size";
51 break;
52 case ORTE_ERR_NO_MATCH_YET:
53 retval = "No match for receive posted";
54 break;
55 case ORTE_ERR_REQUEST:
56 retval = "Request error";
57 break;
58 case ORTE_ERR_NO_CONNECTION_ALLOWED:
59 retval = "No connection allowed";
60 break;
61 case ORTE_ERR_CONNECTION_REFUSED:
62 retval = "Connection refused";
63 break;
64 case ORTE_ERR_TYPE_MISMATCH:
65 retval = "Type mismatch";
66 break;
67 case ORTE_ERR_COMPARE_FAILURE:
68 retval = "Data comparison failure";
69 break;
70 case ORTE_ERR_COPY_FAILURE:
71 retval = "Data copy failure";
72 break;
73 case ORTE_ERR_PROC_STATE_MISSING:
74 retval = "The process state information is missing on the registry";
75 break;
76 case ORTE_ERR_PROC_EXIT_STATUS_MISSING:
77 retval = "The process exit status is missing on the registry";
78 break;
79 case ORTE_ERR_INDETERMINATE_STATE_INFO:
80 retval = "Request for state returned multiple responses";
81 break;
82 case ORTE_ERR_NODE_FULLY_USED:
83 retval = "All the slots on a given node have been used";
84 break;
85 case ORTE_ERR_INVALID_NUM_PROCS:
86 retval = "Multiple applications were specified, but at least one failed to specify the number of processes to run";
87 break;
88 case ORTE_ERR_SILENT:
89 if (orte_report_silent_errors) {
90 retval = "Silent error";
91 } else {
92 retval = "";
93 }
94 break;
95 case ORTE_ERR_ADDRESSEE_UNKNOWN:
96 retval = "A message is attempting to be sent to a process whose contact information is unknown";
97 break;
98 case ORTE_ERR_SYS_LIMITS_PIPES:
99 retval = "The system limit on number of pipes a process can open was reached";
100 break;
101 case ORTE_ERR_PIPE_SETUP_FAILURE:
102 retval = "A pipe could not be setup between a daemon and one of its local processes";
103 break;
104 case ORTE_ERR_SYS_LIMITS_CHILDREN:
105 retval = "The system limit on number of children a process can have was reached";
106 break;
107 case ORTE_ERR_FAILED_GET_TERM_ATTRS:
108 retval = "The I/O forwarding system was unable to get the attributes of your terminal";
109 break;
110 case ORTE_ERR_WDIR_NOT_FOUND:
111 retval = "The specified working directory could not be found";
112 break;
113 case ORTE_ERR_EXE_NOT_FOUND:
114 retval = "The specified executable could not be found";
115 break;
116 case ORTE_ERR_PIPE_READ_FAILURE:
117 retval = "A pipe could not be read";
118 break;
119 case ORTE_ERR_EXE_NOT_ACCESSIBLE:
120 retval = "The specified executable could not be executed";
121 break;
122 case ORTE_ERR_FAILED_TO_START:
123 retval = "The specified application failed to start";
124 break;
125 case ORTE_ERR_FILE_NOT_EXECUTABLE:
126 retval = "A system-required executable either could not be found or was not executable by this user";
127 break;
128 case ORTE_ERR_HNP_COULD_NOT_START:
129 retval = "Unable to start a daemon on the local node";
130 break;
131 case ORTE_ERR_SYS_LIMITS_SOCKETS:
132 retval = "The system limit on number of network connections a process can open was reached";
133 break;
134 case ORTE_ERR_SOCKET_NOT_AVAILABLE:
135 retval = "Unable to open a TCP socket for out-of-band communications";
136 break;
137 case ORTE_ERR_SYSTEM_WILL_BOOTSTRAP:
138 retval = "System will determine resources during bootstrap of daemons";
139 break;
140 case ORTE_ERR_RESTART_LIMIT_EXCEEDED:
141 retval = "Limit on number of process restarts was exceeded";
142 break;
143 case ORTE_ERR_INVALID_NODE_RANK:
144 retval = "Invalid node rank";
145 break;
146 case ORTE_ERR_INVALID_LOCAL_RANK:
147 retval = "Invalid local rank";
148 break;
149 case ORTE_ERR_UNRECOVERABLE:
150 retval = "Unrecoverable error";
151 break;
152 case ORTE_ERR_MEM_LIMIT_EXCEEDED:
153 retval = "Memory limit exceeded";
154 break;
155 case ORTE_ERR_HEARTBEAT_LOST:
156 retval = "Heartbeat lost";
157 break;
158 case ORTE_ERR_PROC_STALLED:
159 retval = "Proc appears to be stalled";
160 break;
161 case ORTE_ERR_NO_APP_SPECIFIED:
162 retval = "No application specified";
163 break;
164 case ORTE_ERR_NO_EXE_SPECIFIED:
165 retval = "No executable specified";
166 break;
167 case ORTE_ERR_COMM_DISABLED:
168 retval = "Communications have been disabled";
169 break;
170 case ORTE_ERR_FAILED_TO_MAP:
171 retval = "Unable to map job";
172 break;
173 case ORTE_ERR_TAKE_NEXT_OPTION:
174 if (orte_report_silent_errors) {
175 retval = "Next option";
176 } else {
177 retval = "";
178 }
179 break;
180 case ORTE_ERR_SENSOR_LIMIT_EXCEEDED:
181 retval = "Sensor limit exceeded";
182 break;
183 case ORTE_ERR_PROC_ENTRY_NOT_FOUND:
184 retval = "Proc entry not found";
185 break;
186 case ORTE_ERR_DATA_VALUE_NOT_FOUND:
187 retval = "Data not found";
188 break;
189 case ORTE_ERR_ALLOCATION_PENDING:
190 retval = "Allocation pending";
191 break;
192 case ORTE_ERR_NO_PATH_TO_TARGET:
193 retval = "No OOB path to target";
194 break;
195 case ORTE_ERR_OP_IN_PROGRESS:
196 retval = "Operation in progress";
197 break;
198 case ORTE_ERR_OPEN_CONDUIT_FAIL:
199 retval = "Open messaging conduit failed";
200 break;
201 case ORTE_ERR_OUT_OF_ORDER_MSG:
202 retval = "Out of order message";
203 break;
204 case ORTE_ERR_FORCE_SELECT:
205 retval = "Force select";
206 break;
207 case ORTE_ERR_JOB_CANCELLED:
208 retval = "Job cancelled";
209 break;
210 case ORTE_ERR_CONDUIT_SEND_FAIL:
211 retval = " Transport Conduit returned send error";
212 break;
213 case ORTE_ERR_DEBUGGER_RELEASE:
214 retval = "Debugger release";
215 break;
216 case ORTE_ERR_PARTIAL_SUCCESS:
217 retval = "Partial success";
218 break;
219 default:
220 retval = "Unknown error";
221 }
222
223 *errmsg = retval;
224 return ORTE_SUCCESS;
225 }
226
227 const char *orte_job_state_to_str(orte_job_state_t state)
228 {
229 switch(state) {
230 case ORTE_JOB_STATE_UNDEF:
231 return "UNDEFINED";
232 case ORTE_JOB_STATE_INIT:
233 return "PENDING INIT";
234 case ORTE_JOB_STATE_INIT_COMPLETE:
235 return "INIT_COMPLETE";
236 case ORTE_JOB_STATE_ALLOCATE:
237 return "PENDING ALLOCATION";
238 case ORTE_JOB_STATE_ALLOCATION_COMPLETE:
239 return "ALLOCATION COMPLETE";
240 case ORTE_JOB_STATE_MAP:
241 return "PENDING MAPPING";
242 case ORTE_JOB_STATE_MAP_COMPLETE:
243 return "MAP COMPLETE";
244 case ORTE_JOB_STATE_SYSTEM_PREP:
245 return "PENDING FINAL SYSTEM PREP";
246 case ORTE_JOB_STATE_LAUNCH_DAEMONS:
247 return "PENDING DAEMON LAUNCH";
248 case ORTE_JOB_STATE_DAEMONS_LAUNCHED:
249 return "DAEMONS LAUNCHED";
250 case ORTE_JOB_STATE_DAEMONS_REPORTED:
251 return "ALL DAEMONS REPORTED";
252 case ORTE_JOB_STATE_VM_READY:
253 return "VM READY";
254 case ORTE_JOB_STATE_LAUNCH_APPS:
255 return "PENDING APP LAUNCH";
256 case ORTE_JOB_STATE_SEND_LAUNCH_MSG:
257 return "SENDING LAUNCH MSG";
258 case ORTE_JOB_STATE_RUNNING:
259 return "RUNNING";
260 case ORTE_JOB_STATE_SUSPENDED:
261 return "SUSPENDED";
262 case ORTE_JOB_STATE_REGISTERED:
263 return "SYNC REGISTERED";
264 case ORTE_JOB_STATE_READY_FOR_DEBUGGERS:
265 return "READY FOR DEBUGGERS";
266 case ORTE_JOB_STATE_LOCAL_LAUNCH_COMPLETE:
267 return "LOCAL LAUNCH COMPLETE";
268 case ORTE_JOB_STATE_UNTERMINATED:
269 return "UNTERMINATED";
270 case ORTE_JOB_STATE_TERMINATED:
271 return "NORMALLY TERMINATED";
272 case ORTE_JOB_STATE_NOTIFY_COMPLETED:
273 return "NOTIFY COMPLETED";
274 case ORTE_JOB_STATE_NOTIFIED:
275 return "NOTIFIED";
276 case ORTE_JOB_STATE_ALL_JOBS_COMPLETE:
277 return "ALL JOBS COMPLETE";
278 case ORTE_JOB_STATE_ERROR:
279 return "ARTIFICIAL BOUNDARY - ERROR";
280 case ORTE_JOB_STATE_KILLED_BY_CMD:
281 return "KILLED BY INTERNAL COMMAND";
282 case ORTE_JOB_STATE_ABORTED:
283 return "ABORTED";
284 case ORTE_JOB_STATE_FAILED_TO_START:
285 return "FAILED TO START";
286 case ORTE_JOB_STATE_ABORTED_BY_SIG:
287 return "ABORTED BY SIGNAL";
288 case ORTE_JOB_STATE_ABORTED_WO_SYNC:
289 return "TERMINATED WITHOUT SYNC";
290 case ORTE_JOB_STATE_COMM_FAILED:
291 return "COMMUNICATION FAILURE";
292 case ORTE_JOB_STATE_SENSOR_BOUND_EXCEEDED:
293 return "SENSOR BOUND EXCEEDED";
294 case ORTE_JOB_STATE_CALLED_ABORT:
295 return "PROC CALLED ABORT";
296 case ORTE_JOB_STATE_HEARTBEAT_FAILED:
297 return "HEARTBEAT FAILED";
298 case ORTE_JOB_STATE_NEVER_LAUNCHED:
299 return "NEVER LAUNCHED";
300 case ORTE_JOB_STATE_ABORT_ORDERED:
301 return "ABORT IN PROGRESS";
302 case ORTE_JOB_STATE_NON_ZERO_TERM:
303 return "AT LEAST ONE PROCESS EXITED WITH NON-ZERO STATUS";
304 case ORTE_JOB_STATE_FAILED_TO_LAUNCH:
305 return "FAILED TO LAUNCH";
306 case ORTE_JOB_STATE_FORCED_EXIT:
307 return "FORCED EXIT";
308 case ORTE_JOB_STATE_DAEMONS_TERMINATED:
309 return "DAEMONS TERMINATED";
310 case ORTE_JOB_STATE_SILENT_ABORT:
311 return "ERROR REPORTED ELSEWHERE";
312 case ORTE_JOB_STATE_REPORT_PROGRESS:
313 return "REPORT PROGRESS";
314 case ORTE_JOB_STATE_ALLOC_FAILED:
315 return "ALLOCATION FAILED";
316 case ORTE_JOB_STATE_MAP_FAILED:
317 return "MAP FAILED";
318 case ORTE_JOB_STATE_CANNOT_LAUNCH:
319 return "CANNOT LAUNCH";
320 case ORTE_JOB_STATE_FT_CHECKPOINT:
321 return "FAULT TOLERANCE CHECKPOINT";
322 case ORTE_JOB_STATE_FT_CONTINUE:
323 return "FAULT TOLERANCE CONTINUE";
324 case ORTE_JOB_STATE_FT_RESTART:
325 return "FAULT TOLERANCE RESTART";
326 case ORTE_JOB_STATE_ANY:
327 return "ANY";
328 case ORTE_JOB_STATE_DEBUGGER_DETACH:
329 return "DEBUGGER DETACH";
330 default:
331 return "UNKNOWN STATE!";
332 }
333 }
334
335 const char *orte_app_ctx_state_to_str(orte_app_state_t state)
336 {
337 switch(state) {
338 case ORTE_APP_STATE_UNDEF:
339 return "UNDEFINED";
340 case ORTE_APP_STATE_INIT:
341 return "PENDING INIT";
342 case ORTE_APP_STATE_ALL_MAPPED:
343 return "ALL MAPPED";
344 case ORTE_APP_STATE_RUNNING:
345 return "RUNNING";
346 case ORTE_APP_STATE_COMPLETED:
347 return "COMPLETED";
348 default:
349 return "UNKNOWN STATE!";
350 }
351 }
352
353 const char *orte_proc_state_to_str(orte_proc_state_t state)
354 {
355 switch(state) {
356 case ORTE_PROC_STATE_UNDEF:
357 return "UNDEFINED";
358 case ORTE_PROC_STATE_INIT:
359 return "INITIALIZED";
360 case ORTE_PROC_STATE_RESTART:
361 return "RESTARTING";
362 case ORTE_PROC_STATE_TERMINATE:
363 return "MARKED FOR TERMINATION";
364 case ORTE_PROC_STATE_RUNNING:
365 return "RUNNING";
366 case ORTE_PROC_STATE_REGISTERED:
367 return "SYNC REGISTERED";
368 case ORTE_PROC_STATE_IOF_COMPLETE:
369 return "IOF COMPLETE";
370 case ORTE_PROC_STATE_WAITPID_FIRED:
371 return "WAITPID FIRED";
372 case ORTE_PROC_STATE_UNTERMINATED:
373 return "UNTERMINATED";
374 case ORTE_PROC_STATE_TERMINATED:
375 return "NORMALLY TERMINATED";
376 case ORTE_PROC_STATE_ERROR:
377 return "ARTIFICIAL BOUNDARY - ERROR";
378 case ORTE_PROC_STATE_KILLED_BY_CMD:
379 return "KILLED BY INTERNAL COMMAND";
380 case ORTE_PROC_STATE_ABORTED:
381 return "ABORTED";
382 case ORTE_PROC_STATE_FAILED_TO_START:
383 return "FAILED TO START";
384 case ORTE_PROC_STATE_ABORTED_BY_SIG:
385 return "ABORTED BY SIGNAL";
386 case ORTE_PROC_STATE_TERM_WO_SYNC:
387 return "TERMINATED WITHOUT SYNC";
388 case ORTE_PROC_STATE_COMM_FAILED:
389 return "COMMUNICATION FAILURE";
390 case ORTE_PROC_STATE_SENSOR_BOUND_EXCEEDED:
391 return "SENSOR BOUND EXCEEDED";
392 case ORTE_PROC_STATE_CALLED_ABORT:
393 return "CALLED ABORT";
394 case ORTE_PROC_STATE_HEARTBEAT_FAILED:
395 return "HEARTBEAT FAILED";
396 case ORTE_PROC_STATE_MIGRATING:
397 return "MIGRATING";
398 case ORTE_PROC_STATE_CANNOT_RESTART:
399 return "CANNOT BE RESTARTED";
400 case ORTE_PROC_STATE_TERM_NON_ZERO:
401 return "EXITED WITH NON-ZERO STATUS";
402 case ORTE_PROC_STATE_FAILED_TO_LAUNCH:
403 return "FAILED TO LAUNCH";
404 case ORTE_PROC_STATE_UNABLE_TO_SEND_MSG:
405 return "UNABLE TO SEND MSG";
406 case ORTE_PROC_STATE_LIFELINE_LOST:
407 return "LIFELINE LOST";
408 case ORTE_PROC_STATE_NO_PATH_TO_TARGET:
409 return "NO PATH TO TARGET";
410 case ORTE_PROC_STATE_FAILED_TO_CONNECT:
411 return "FAILED TO CONNECT";
412 case ORTE_PROC_STATE_PEER_UNKNOWN:
413 return "PEER UNKNOWN";
414 case ORTE_PROC_STATE_ANY:
415 return "ANY";
416 default:
417 return "UNKNOWN STATE!";
418 }
419 }
420
421 const char *orte_node_state_to_str(orte_node_state_t state)
422 {
423 switch(state) {
424 case ORTE_NODE_STATE_UNDEF:
425 return "UNDEF";
426 case ORTE_NODE_STATE_UNKNOWN:
427 return "UNKNOWN";
428 case ORTE_NODE_STATE_DOWN:
429 return "DOWN";
430 case ORTE_NODE_STATE_UP:
431 return "UP";
432 case ORTE_NODE_STATE_REBOOT:
433 return "REBOOT";
434 case ORTE_NODE_STATE_DO_NOT_USE:
435 return "DO_NOT_USE";
436 case ORTE_NODE_STATE_NOT_INCLUDED:
437 return "NOT_INCLUDED";
438 case ORTE_NODE_STATE_ADDED:
439 return "ADDED";
440 default:
441 return "UNKNOWN STATE!";
442 }
443 }