22 #ifndef ORTE_MCA_ERRMGR_BASE_H
23 #define ORTE_MCA_ERRMGR_BASE_H
28 #include "orte_config.h"
29 #include "orte/constants.h"
34 #include "orte/mca/snapc/base/base.h"
/*
 * Exported prototypes for the errmgr base "select" and "close" entry points.
 * Both take no arguments and return an int (presumably an ORTE status code
 * from orte/constants.h -- confirm against the implementations).
 */
44 ORTE_DECLSPEC
int orte_errmgr_base_select(
void);
45 ORTE_DECLSPEC
int orte_errmgr_base_close(
void);
/*
 * Migration state values.
 *
 * Each value is expressed as an offset from ORTE_SNAPC_CKPT_MAX, which is not
 * defined in this file (presumably it comes from the snapc base header
 * included above -- confirm). The states run consecutively from +1 to +8, and
 * ORTE_ERRMGR_MIGRATE_MAX (+9) is one greater than the last state.
 */
64 #define ORTE_ERRMGR_MIGRATE_STATE_ERROR (ORTE_SNAPC_CKPT_MAX + 1)
65 #define ORTE_ERRMGR_MIGRATE_STATE_ERR_INPROGRESS (ORTE_SNAPC_CKPT_MAX + 2)
66 #define ORTE_ERRMGR_MIGRATE_STATE_NONE (ORTE_SNAPC_CKPT_MAX + 3)
67 #define ORTE_ERRMGR_MIGRATE_STATE_REQUEST (ORTE_SNAPC_CKPT_MAX + 4)
68 #define ORTE_ERRMGR_MIGRATE_STATE_RUNNING (ORTE_SNAPC_CKPT_MAX + 5)
69 #define ORTE_ERRMGR_MIGRATE_STATE_RUN_CKPT (ORTE_SNAPC_CKPT_MAX + 6)
70 #define ORTE_ERRMGR_MIGRATE_STATE_STARTUP (ORTE_SNAPC_CKPT_MAX + 7)
71 #define ORTE_ERRMGR_MIGRATE_STATE_FINISH (ORTE_SNAPC_CKPT_MAX + 8)
72 #define ORTE_ERRMGR_MIGRATE_MAX (ORTE_SNAPC_CKPT_MAX + 9)
/*
 * Command flag type for the migrate tool interface: an 8-bit unsigned value.
 *
 * ORTE_ERRMGR_MIGRATE_TOOL_CMD aliases OPAL_UINT8 (presumably the data-type
 * tag used when packing/unpacking the flag -- confirm against its users).
 * The two command values defined here are INIT (1) and UPDATE (2).
 */
77 typedef uint8_t orte_errmgr_tool_cmd_flag_t;
78 #define ORTE_ERRMGR_MIGRATE_TOOL_CMD OPAL_UINT8
79 #define ORTE_ERRMGR_MIGRATE_TOOL_INIT_CMD 1
80 #define ORTE_ERRMGR_MIGRATE_TOOL_UPDATE_CMD 2
/*
 * Exported prototypes for the tool-side init and finalize entry points.
 * Both take no arguments and return an int (presumably an ORTE status code
 * -- confirm against the implementations).
 */
83 ORTE_DECLSPEC
int orte_errmgr_base_tool_init(
void);
84 ORTE_DECLSPEC
int orte_errmgr_base_tool_finalize(
void);
/*
 * Migration state helpers.
 *
 * orte_errmgr_base_migrate_state_notify: takes an int state and returns
 * nothing. The state is presumably one of the ORTE_ERRMGR_MIGRATE_STATE_*
 * values -- confirm.
 */
86 ORTE_DECLSPEC
void orte_errmgr_base_migrate_state_notify(
int state);
/*
 * orte_errmgr_base_migrate_state_str: takes a char ** and an int state and
 * returns an int. NOTE(review): state_str looks like an output parameter
 * receiving a string for the given state; who owns/frees that string is not
 * visible from this header -- confirm against the implementation.
 */
87 ORTE_DECLSPEC
int orte_errmgr_base_migrate_state_str(
char ** state_str,
int state);
/*
 * orte_errmgr_base_migrate_update: takes an int status and returns an int.
 */
89 ORTE_DECLSPEC
int orte_errmgr_base_migrate_update(
int status);
/*
 * orte_errmgr_base_update_app_context_for_cr_recovery: returns an int and
 * takes an orte_job_t pointer as its first parameter.
 *
 * NOTE(review): the parameter list is cut off here -- it ends on a trailing
 * comma with no closing ");" before the next declaration. The remaining
 * parameters must be restored from the original header; they are not
 * reconstructed here.
 */
94 ORTE_DECLSPEC
int orte_errmgr_base_update_app_context_for_cr_recovery(
orte_job_t *jobdata,
/*
 * orte_errmgr_base_restart_job: exported prototype returning an int.
 *
 * Parameters, as declared:
 *   jobid          job identifier (orte_jobid_t)
 *   global_handle  char * (presumably names the global checkpoint to restart
 *                  from -- confirm against the implementation)
 *   seq_num        int (presumably the checkpoint sequence number -- confirm)
 */
98 ORTE_DECLSPEC
int orte_errmgr_base_restart_job(
orte_jobid_t jobid,
char * global_handle,
int seq_num);
/*
 * orte_errmgr_base_proc_state_notify: exported prototype returning nothing.
 * Takes a process state by value and a pointer to a process name.
 */
102 ORTE_DECLSPEC
void orte_errmgr_base_proc_state_notify(orte_proc_state_t state,
orte_process_name_t *proc);
106 #if OPAL_ENABLE_FT_MPI
/*
 * Listener setup and shutdown prototypes. These follow the
 * "#if OPAL_ENABLE_FT_MPI" directive, so they are only declared when that
 * macro is non-zero. Both take no arguments and return an int (presumably an
 * ORTE status code -- confirm against the implementations).
 */
107 ORTE_DECLSPEC
int orte_errmgr_base_setup_listener(
void);
108 ORTE_DECLSPEC
int orte_errmgr_base_shutdown_listener(
void);
/*
 * Application notification callback type: a pointer to a function that
 * receives a process name and a process state (both by value) and returns
 * an int.
 */
114 typedef int (*orte_errmgr_base_app_notify_callback_fn_t) (
orte_process_name_t, orte_proc_state_t);
/*
 * Declaration of the global callback pointer of the type above; it is
 * declared extern here, so the definition lives in another translation unit.
 */
115 ORTE_DECLSPEC
extern orte_errmgr_base_app_notify_callback_fn_t orte_errmgr_base_app_callback;
/*
 * orte_errmgr_base_app_reg_notify_callback: exported prototype returning an
 * int.
 *
 * Parameters, as declared:
 *   new_func   callback of type orte_errmgr_base_app_notify_callback_fn_t
 *   prev_func  pointer to a callback of the same type. NOTE(review): this
 *              looks like an output slot for the previously registered
 *              callback; whether NULL is accepted is not visible from this
 *              header -- confirm against the implementation.
 */
117 ORTE_DECLSPEC
int orte_errmgr_base_app_reg_notify_callback
118 (orte_errmgr_base_app_notify_callback_fn_t new_func,
119 orte_errmgr_base_app_notify_callback_fn_t *prev_func);
BEGIN_C_DECLS ORTE_DECLSPEC int orte_errmgr_base_open(void)
Function for finding and opening either all MCA components, or the one that was specifically requested via an MCA parameter.
Definition: errmgr_base_open.c:95
ORTE_DECLSPEC orte_errmgr_fault_callback_t * orte_errmgr_base_set_fault_callback(orte_errmgr_fault_callback_t *cbfunc)
Interfaces for orte-migrate tool.
Definition: errmgr_base_fns.c:739
uint32_t orte_jobid_t
Set the allowed range for ids in each space.
Definition: types.h:76
ORTE_DECLSPEC orte_errmgr_base_component_t orte_errmgr_base_selected_component
Internal module reference.
Definition: errmgr_base_open.c:56
ORTE_DECLSPEC opal_list_t orte_errmgr_base_components_available
Output and component variables.
Definition: errmgr_base_open.c:52
The opal_list_t interface is used to provide a generic doubly-linked list container for Open MPI.
Top-level interface for all MCA components.
Definition: orte_globals.h:386
The Open RTE Error and Recovery Manager (ErrMgr)
Definition: orte_globals.h:316
Definition: opal_list.h:147