root/orte/util/error_strings.c

/* [<][>][^][v][top][bottom][index][help] */

DEFINITIONS

This source file includes the following definitions.
  1. orte_err2str
  2. orte_job_state_to_str
  3. orte_app_ctx_state_to_str
  4. orte_proc_state_to_str
  5. orte_node_state_to_str

   1 /*
   2  * Copyright (c) 2004-2005 The Trustees of Indiana University and Indiana
   3  *                         University Research and Technology
   4  *                         Corporation.  All rights reserved.
   5  * Copyright (c) 2004-2005 The University of Tennessee and The University
   6  *                         of Tennessee Research Foundation.  All rights
   7  *                         reserved.
   8  * Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
   9  *                         University of Stuttgart.  All rights reserved.
  10  * Copyright (c) 2004-2005 The Regents of the University of California.
  11  *                         All rights reserved.
  12  * Copyright (c) 2010-2016 Cisco Systems, Inc.  All rights reserved.
  13  * Copyright (c) 2011-2013 Los Alamos National Security, LLC.
  14  *                         All rights reserved.
  15  * Copyright (c) 2014-2018 Intel, Inc. All rights reserved.
  16  * $COPYRIGHT$
  17  *
  18  * Additional copyrights may follow
  19  *
  20  * $HEADER$
  21  */
  22 
  23 /** @file **/
  24 
  25 #include "orte_config.h"
  26 #include "orte/constants.h"
  27 
  28 #include <stdio.h>
  29 #ifdef HAVE_SYS_SIGNAL_H
  30 #include <sys/signal.h>
  31 #else
  32 #include <signal.h>
  33 #endif
  34 
  35 #include "orte/mca/plm/plm_types.h"
  36 #include "orte/util/error_strings.h"
  37 #include "orte/runtime/orte_globals.h"
  38 
  39 int orte_err2str(int errnum, const char **errmsg)
  40 {
  41     const char *retval;
  42     switch (errnum) {
  43     case ORTE_SUCCESS:
  44         retval = "Success";
  45         break;
  46     case ORTE_ERR_RECV_LESS_THAN_POSTED:
  47         retval = "Receive was less than posted size";
  48         break;
  49     case ORTE_ERR_RECV_MORE_THAN_POSTED:
  50         retval = "Receive was greater than posted size";
  51         break;
  52     case ORTE_ERR_NO_MATCH_YET:
  53         retval = "No match for receive posted";
  54         break;
  55     case ORTE_ERR_REQUEST:
  56         retval = "Request error";
  57         break;
  58     case ORTE_ERR_NO_CONNECTION_ALLOWED:
  59         retval = "No connection allowed";
  60         break;
  61     case ORTE_ERR_CONNECTION_REFUSED:
  62         retval = "Connection refused";
  63         break;
  64     case ORTE_ERR_TYPE_MISMATCH:
  65         retval = "Type mismatch";
  66         break;
  67     case ORTE_ERR_COMPARE_FAILURE:
  68         retval = "Data comparison failure";
  69         break;
  70     case ORTE_ERR_COPY_FAILURE:
  71         retval = "Data copy failure";
  72         break;
  73     case ORTE_ERR_PROC_STATE_MISSING:
  74         retval = "The process state information is missing on the registry";
  75         break;
  76     case ORTE_ERR_PROC_EXIT_STATUS_MISSING:
  77         retval = "The process exit status is missing on the registry";
  78         break;
  79     case ORTE_ERR_INDETERMINATE_STATE_INFO:
  80         retval = "Request for state returned multiple responses";
  81         break;
  82     case ORTE_ERR_NODE_FULLY_USED:
  83         retval = "All the slots on a given node have been used";
  84         break;
  85     case ORTE_ERR_INVALID_NUM_PROCS:
  86         retval = "Multiple applications were specified, but at least one failed to specify the number of processes to run";
  87         break;
  88     case ORTE_ERR_SILENT:
  89         if (orte_report_silent_errors) {
  90             retval = "Silent error";
  91         } else {
  92             retval = "";
  93         }
  94         break;
  95     case ORTE_ERR_ADDRESSEE_UNKNOWN:
  96         retval = "A message is attempting to be sent to a process whose contact information is unknown";
  97         break;
  98     case ORTE_ERR_SYS_LIMITS_PIPES:
  99         retval = "The system limit on number of pipes a process can open was reached";
 100         break;
 101     case ORTE_ERR_PIPE_SETUP_FAILURE:
 102         retval = "A pipe could not be setup between a daemon and one of its local processes";
 103         break;
 104     case ORTE_ERR_SYS_LIMITS_CHILDREN:
 105         retval = "The system limit on number of children a process can have was reached";
 106         break;
 107     case ORTE_ERR_FAILED_GET_TERM_ATTRS:
 108         retval = "The I/O forwarding system was unable to get the attributes of your terminal";
 109         break;
 110     case ORTE_ERR_WDIR_NOT_FOUND:
 111         retval = "The specified working directory could not be found";
 112         break;
 113     case ORTE_ERR_EXE_NOT_FOUND:
 114         retval = "The specified executable could not be found";
 115         break;
 116     case ORTE_ERR_PIPE_READ_FAILURE:
 117         retval = "A pipe could not be read";
 118         break;
 119     case ORTE_ERR_EXE_NOT_ACCESSIBLE:
 120         retval = "The specified executable could not be executed";
 121         break;
 122     case ORTE_ERR_FAILED_TO_START:
 123         retval = "The specified application failed to start";
 124         break;
 125     case ORTE_ERR_FILE_NOT_EXECUTABLE:
 126         retval = "A system-required executable either could not be found or was not executable by this user";
 127         break;
 128     case ORTE_ERR_HNP_COULD_NOT_START:
 129         retval = "Unable to start a daemon on the local node";
 130         break;
 131     case ORTE_ERR_SYS_LIMITS_SOCKETS:
 132         retval = "The system limit on number of network connections a process can open was reached";
 133         break;
 134     case ORTE_ERR_SOCKET_NOT_AVAILABLE:
 135         retval = "Unable to open a TCP socket for out-of-band communications";
 136         break;
 137     case ORTE_ERR_SYSTEM_WILL_BOOTSTRAP:
 138         retval = "System will determine resources during bootstrap of daemons";
 139         break;
 140     case ORTE_ERR_RESTART_LIMIT_EXCEEDED:
 141         retval = "Limit on number of process restarts was exceeded";
 142         break;
 143     case ORTE_ERR_INVALID_NODE_RANK:
 144         retval = "Invalid node rank";
 145         break;
 146     case ORTE_ERR_INVALID_LOCAL_RANK:
 147         retval = "Invalid local rank";
 148         break;
 149     case ORTE_ERR_UNRECOVERABLE:
 150         retval = "Unrecoverable error";
 151         break;
 152     case ORTE_ERR_MEM_LIMIT_EXCEEDED:
 153         retval = "Memory limit exceeded";
 154         break;
 155     case ORTE_ERR_HEARTBEAT_LOST:
 156         retval = "Heartbeat lost";
 157         break;
 158     case ORTE_ERR_PROC_STALLED:
 159         retval = "Proc appears to be stalled";
 160         break;
 161     case ORTE_ERR_NO_APP_SPECIFIED:
 162         retval = "No application specified";
 163         break;
 164     case ORTE_ERR_NO_EXE_SPECIFIED:
 165         retval = "No executable specified";
 166         break;
 167     case ORTE_ERR_COMM_DISABLED:
 168         retval = "Communications have been disabled";
 169         break;
 170     case ORTE_ERR_FAILED_TO_MAP:
 171         retval = "Unable to map job";
 172         break;
 173     case ORTE_ERR_TAKE_NEXT_OPTION:
 174         if (orte_report_silent_errors) {
 175             retval = "Next option";
 176         } else {
 177             retval = "";
 178         }
 179         break;
 180     case ORTE_ERR_SENSOR_LIMIT_EXCEEDED:
 181         retval = "Sensor limit exceeded";
 182         break;
 183     case ORTE_ERR_PROC_ENTRY_NOT_FOUND:
 184         retval = "Proc entry not found";
 185         break;
 186     case ORTE_ERR_DATA_VALUE_NOT_FOUND:
 187         retval = "Data not found";
 188         break;
 189     case ORTE_ERR_ALLOCATION_PENDING:
 190         retval = "Allocation pending";
 191         break;
 192     case ORTE_ERR_NO_PATH_TO_TARGET:
 193         retval = "No OOB path to target";
 194         break;
 195     case ORTE_ERR_OP_IN_PROGRESS:
 196         retval = "Operation in progress";
 197         break;
 198     case ORTE_ERR_OPEN_CONDUIT_FAIL:
 199         retval = "Open messaging conduit failed";
 200         break;
 201     case ORTE_ERR_OUT_OF_ORDER_MSG:
 202         retval = "Out of order message";
 203         break;
 204     case ORTE_ERR_FORCE_SELECT:
 205         retval = "Force select";
 206         break;
 207     case ORTE_ERR_JOB_CANCELLED:
 208         retval = "Job cancelled";
 209         break;
 210     case ORTE_ERR_CONDUIT_SEND_FAIL:
 211         retval = " Transport Conduit returned send error";
 212         break;
 213     case ORTE_ERR_DEBUGGER_RELEASE:
 214         retval = "Debugger release";
 215         break;
 216     case ORTE_ERR_PARTIAL_SUCCESS:
 217         retval = "Partial success";
 218         break;
 219     default:
 220         retval = "Unknown error";
 221     }
 222 
 223     *errmsg = retval;
 224     return ORTE_SUCCESS;
 225 }
 226 
 227 const char *orte_job_state_to_str(orte_job_state_t state)
 228 {
 229     switch(state) {
 230     case ORTE_JOB_STATE_UNDEF:
 231         return "UNDEFINED";
 232     case ORTE_JOB_STATE_INIT:
 233         return "PENDING INIT";
 234     case ORTE_JOB_STATE_INIT_COMPLETE:
 235         return "INIT_COMPLETE";
 236     case ORTE_JOB_STATE_ALLOCATE:
 237         return "PENDING ALLOCATION";
 238     case ORTE_JOB_STATE_ALLOCATION_COMPLETE:
 239         return "ALLOCATION COMPLETE";
 240     case ORTE_JOB_STATE_MAP:
 241         return "PENDING MAPPING";
 242     case ORTE_JOB_STATE_MAP_COMPLETE:
 243         return "MAP COMPLETE";
 244     case ORTE_JOB_STATE_SYSTEM_PREP:
 245         return "PENDING FINAL SYSTEM PREP";
 246     case ORTE_JOB_STATE_LAUNCH_DAEMONS:
 247         return "PENDING DAEMON LAUNCH";
 248     case ORTE_JOB_STATE_DAEMONS_LAUNCHED:
 249         return "DAEMONS LAUNCHED";
 250     case ORTE_JOB_STATE_DAEMONS_REPORTED:
 251         return "ALL DAEMONS REPORTED";
 252     case ORTE_JOB_STATE_VM_READY:
 253         return "VM READY";
 254     case ORTE_JOB_STATE_LAUNCH_APPS:
 255         return "PENDING APP LAUNCH";
 256     case ORTE_JOB_STATE_SEND_LAUNCH_MSG:
 257         return "SENDING LAUNCH MSG";
 258     case ORTE_JOB_STATE_RUNNING:
 259         return "RUNNING";
 260     case ORTE_JOB_STATE_SUSPENDED:
 261         return "SUSPENDED";
 262     case ORTE_JOB_STATE_REGISTERED:
 263         return "SYNC REGISTERED";
 264     case ORTE_JOB_STATE_READY_FOR_DEBUGGERS:
 265         return "READY FOR DEBUGGERS";
 266     case ORTE_JOB_STATE_LOCAL_LAUNCH_COMPLETE:
 267         return "LOCAL LAUNCH COMPLETE";
 268     case ORTE_JOB_STATE_UNTERMINATED:
 269         return "UNTERMINATED";
 270     case ORTE_JOB_STATE_TERMINATED:
 271         return "NORMALLY TERMINATED";
 272     case ORTE_JOB_STATE_NOTIFY_COMPLETED:
 273         return "NOTIFY COMPLETED";
 274     case ORTE_JOB_STATE_NOTIFIED:
 275         return "NOTIFIED";
 276     case ORTE_JOB_STATE_ALL_JOBS_COMPLETE:
 277         return "ALL JOBS COMPLETE";
 278     case ORTE_JOB_STATE_ERROR:
 279         return "ARTIFICIAL BOUNDARY - ERROR";
 280     case ORTE_JOB_STATE_KILLED_BY_CMD:
 281         return "KILLED BY INTERNAL COMMAND";
 282     case ORTE_JOB_STATE_ABORTED:
 283         return "ABORTED";
 284     case ORTE_JOB_STATE_FAILED_TO_START:
 285         return "FAILED TO START";
 286     case ORTE_JOB_STATE_ABORTED_BY_SIG:
 287         return "ABORTED BY SIGNAL";
 288     case ORTE_JOB_STATE_ABORTED_WO_SYNC:
 289         return "TERMINATED WITHOUT SYNC";
 290     case ORTE_JOB_STATE_COMM_FAILED:
 291         return "COMMUNICATION FAILURE";
 292     case ORTE_JOB_STATE_SENSOR_BOUND_EXCEEDED:
 293         return "SENSOR BOUND EXCEEDED";
 294     case ORTE_JOB_STATE_CALLED_ABORT:
 295         return "PROC CALLED ABORT";
 296     case ORTE_JOB_STATE_HEARTBEAT_FAILED:
 297         return "HEARTBEAT FAILED";
 298     case ORTE_JOB_STATE_NEVER_LAUNCHED:
 299         return "NEVER LAUNCHED";
 300     case ORTE_JOB_STATE_ABORT_ORDERED:
 301         return "ABORT IN PROGRESS";
 302     case ORTE_JOB_STATE_NON_ZERO_TERM:
 303         return "AT LEAST ONE PROCESS EXITED WITH NON-ZERO STATUS";
 304     case ORTE_JOB_STATE_FAILED_TO_LAUNCH:
 305         return "FAILED TO LAUNCH";
 306     case ORTE_JOB_STATE_FORCED_EXIT:
 307         return "FORCED EXIT";
 308     case ORTE_JOB_STATE_DAEMONS_TERMINATED:
 309         return "DAEMONS TERMINATED";
 310     case ORTE_JOB_STATE_SILENT_ABORT:
 311         return "ERROR REPORTED ELSEWHERE";
 312     case ORTE_JOB_STATE_REPORT_PROGRESS:
 313         return "REPORT PROGRESS";
 314     case ORTE_JOB_STATE_ALLOC_FAILED:
 315         return "ALLOCATION FAILED";
 316     case ORTE_JOB_STATE_MAP_FAILED:
 317         return "MAP FAILED";
 318     case ORTE_JOB_STATE_CANNOT_LAUNCH:
 319         return "CANNOT LAUNCH";
 320     case ORTE_JOB_STATE_FT_CHECKPOINT:
 321         return "FAULT TOLERANCE CHECKPOINT";
 322     case ORTE_JOB_STATE_FT_CONTINUE:
 323         return "FAULT TOLERANCE CONTINUE";
 324     case ORTE_JOB_STATE_FT_RESTART:
 325         return "FAULT TOLERANCE RESTART";
 326     case ORTE_JOB_STATE_ANY:
 327         return "ANY";
 328     case ORTE_JOB_STATE_DEBUGGER_DETACH:
 329         return "DEBUGGER DETACH";
 330     default:
 331         return "UNKNOWN STATE!";
 332     }
 333 }
 334 
 335 const char *orte_app_ctx_state_to_str(orte_app_state_t state)
 336 {
 337     switch(state) {
 338     case ORTE_APP_STATE_UNDEF:
 339         return "UNDEFINED";
 340     case ORTE_APP_STATE_INIT:
 341         return "PENDING INIT";
 342     case ORTE_APP_STATE_ALL_MAPPED:
 343         return "ALL MAPPED";
 344     case ORTE_APP_STATE_RUNNING:
 345         return "RUNNING";
 346     case ORTE_APP_STATE_COMPLETED:
 347         return "COMPLETED";
 348     default:
 349         return "UNKNOWN STATE!";
 350     }
 351 }
 352 
 353 const char *orte_proc_state_to_str(orte_proc_state_t state)
 354 {
 355     switch(state) {
 356     case ORTE_PROC_STATE_UNDEF:
 357         return "UNDEFINED";
 358     case ORTE_PROC_STATE_INIT:
 359         return "INITIALIZED";
 360     case ORTE_PROC_STATE_RESTART:
 361         return "RESTARTING";
 362     case ORTE_PROC_STATE_TERMINATE:
 363         return "MARKED FOR TERMINATION";
 364     case ORTE_PROC_STATE_RUNNING:
 365         return "RUNNING";
 366     case ORTE_PROC_STATE_REGISTERED:
 367         return "SYNC REGISTERED";
 368     case ORTE_PROC_STATE_IOF_COMPLETE:
 369         return "IOF COMPLETE";
 370     case ORTE_PROC_STATE_WAITPID_FIRED:
 371         return "WAITPID FIRED";
 372     case ORTE_PROC_STATE_UNTERMINATED:
 373         return "UNTERMINATED";
 374     case ORTE_PROC_STATE_TERMINATED:
 375         return "NORMALLY TERMINATED";
 376     case ORTE_PROC_STATE_ERROR:
 377         return "ARTIFICIAL BOUNDARY - ERROR";
 378     case ORTE_PROC_STATE_KILLED_BY_CMD:
 379         return "KILLED BY INTERNAL COMMAND";
 380     case ORTE_PROC_STATE_ABORTED:
 381         return "ABORTED";
 382     case ORTE_PROC_STATE_FAILED_TO_START:
 383         return "FAILED TO START";
 384     case ORTE_PROC_STATE_ABORTED_BY_SIG:
 385         return "ABORTED BY SIGNAL";
 386     case ORTE_PROC_STATE_TERM_WO_SYNC:
 387         return "TERMINATED WITHOUT SYNC";
 388     case ORTE_PROC_STATE_COMM_FAILED:
 389         return "COMMUNICATION FAILURE";
 390     case ORTE_PROC_STATE_SENSOR_BOUND_EXCEEDED:
 391         return "SENSOR BOUND EXCEEDED";
 392     case ORTE_PROC_STATE_CALLED_ABORT:
 393         return "CALLED ABORT";
 394     case ORTE_PROC_STATE_HEARTBEAT_FAILED:
 395         return "HEARTBEAT FAILED";
 396     case ORTE_PROC_STATE_MIGRATING:
 397         return "MIGRATING";
 398     case ORTE_PROC_STATE_CANNOT_RESTART:
 399         return "CANNOT BE RESTARTED";
 400     case ORTE_PROC_STATE_TERM_NON_ZERO:
 401         return "EXITED WITH NON-ZERO STATUS";
 402     case ORTE_PROC_STATE_FAILED_TO_LAUNCH:
 403         return "FAILED TO LAUNCH";
 404     case ORTE_PROC_STATE_UNABLE_TO_SEND_MSG:
 405         return "UNABLE TO SEND MSG";
 406     case ORTE_PROC_STATE_LIFELINE_LOST:
 407         return "LIFELINE LOST";
 408     case ORTE_PROC_STATE_NO_PATH_TO_TARGET:
 409         return "NO PATH TO TARGET";
 410     case ORTE_PROC_STATE_FAILED_TO_CONNECT:
 411         return "FAILED TO CONNECT";
 412     case ORTE_PROC_STATE_PEER_UNKNOWN:
 413         return "PEER UNKNOWN";
 414     case ORTE_PROC_STATE_ANY:
 415         return "ANY";
 416     default:
 417         return "UNKNOWN STATE!";
 418     }
 419 }
 420 
 421 const char *orte_node_state_to_str(orte_node_state_t state)
 422 {
 423     switch(state) {
 424     case ORTE_NODE_STATE_UNDEF:
 425         return "UNDEF";
 426     case ORTE_NODE_STATE_UNKNOWN:
 427         return "UNKNOWN";
 428     case ORTE_NODE_STATE_DOWN:
 429         return "DOWN";
 430     case ORTE_NODE_STATE_UP:
 431         return "UP";
 432     case ORTE_NODE_STATE_REBOOT:
 433         return "REBOOT";
 434     case ORTE_NODE_STATE_DO_NOT_USE:
 435         return "DO_NOT_USE";
 436     case ORTE_NODE_STATE_NOT_INCLUDED:
 437         return "NOT_INCLUDED";
 438     case ORTE_NODE_STATE_ADDED:
 439         return "ADDED";
 440    default:
 441         return "UNKNOWN STATE!";
 442     }
 443 }

/* [<][>][^][v][top][bottom][index][help] */