19 #ifndef MCA_ERRMGR_hnp_EXPORT_H
20 #define MCA_ERRMGR_hnp_EXPORT_H
22 #include "orte_config.h"
/*
 * State flags and tuning knobs for the HNP error manager.
 *
 * NOTE(review): the enclosing declaration is not visible in this listing.
 * These look like members of a component struct rather than file-scope
 * variables -- confirm against the full header before treating them as
 * globals defined in a header.
 */
/* Flag; by its name, set while termination is under way -- confirm. */
35 bool term_in_progress;
/* Flag; by its name, set while a "crmig" operation is running -- confirm. */
39 bool crmig_in_progress;
/* Flag; by its name, set while an "autor" operation is running -- confirm. */
40 bool autor_in_progress;
/* Presumably toggles timing output for the crmig path -- confirm. */
44 bool crmig_timing_enabled;
/* Presumably toggles timing output for the autor path -- confirm. */
48 bool autor_timing_enabled;
/* Integer delay used by the autor path; units are not shown here. */
49 int autor_recovery_delay;
/* Presumably tells the autor path to avoid the previous node -- confirm. */
50 bool autor_skip_oldnode;
/*
 * Update per-process information for a job (purpose inferred from the name;
 * the definition is not part of this header listing).
 *
 * Visible parameters:
 *   jdata     - pointer to the job object
 *   state     - process state value
 *   exit_code - process exit code
 *
 * Returns nothing.
 *
 * NOTE(review): the embedded listing numbers jump 58 -> 60 -> 62, so one or
 * more parameters may have been dropped from this listing. Check the full
 * header before relying on this signature.
 */
58 void orte_errmgr_hnp_update_proc(
orte_job_t *jdata,
60 orte_proc_state_t state,
62 orte_exit_code_t exit_code);
/*
 * "global" entry points of the HNP error manager.
 * All of them return int; presumably an ORTE status code -- confirm.
 */

/* Module initialization hook; takes no arguments. */
67 int orte_errmgr_hnp_global_module_init(
void);
/* Module finalization hook; takes no arguments. */
68 int orte_errmgr_hnp_global_module_finalize(
void);
/*
 * State-update hook taking a job id, a job state, a process state and an
 * exit code.
 * NOTE(review): listing numbers jump 71 -> 73 -> 75, so parameters may be
 * missing between the ones shown.
 */
70 int orte_errmgr_hnp_global_update_state(
orte_jobid_t job,
71 orte_job_state_t jobstate,
73 orte_proc_state_t state,
75 orte_exit_code_t exit_code);
/*
 * Predicted-fault hook; first parameter is a list of processes.
 * NOTE(review): the parameter list is cut off in this listing (no closing
 * parenthesis before the next declaration).
 */
76 int orte_errmgr_hnp_global_predicted_fault(
opal_list_t *proc_list,
/*
 * Map-target suggestion hook; first parameter is the process concerned.
 * NOTE(review): the parameter list is cut off in this listing.
 */
79 int orte_errmgr_hnp_global_suggest_map_targets(
orte_proc_t *proc,
/*
 * Event hook taking an integer state ("ft" presumably stands for fault
 * tolerance -- confirm).
 */
82 int orte_errmgr_hnp_global_ft_event(
int state);
/*
 * "base" variant of the global entry points.
 * All of them return int; presumably an ORTE status code -- confirm.
 */

/* Initialization hook; takes no arguments. */
88 int orte_errmgr_hnp_base_global_init(
void);
/* Finalization hook; takes no arguments. */
89 int orte_errmgr_hnp_base_global_finalize(
void);
/*
 * State-update hook taking a job id, a job state, a process state and an
 * exit code.
 * NOTE(review): listing numbers jump 91 -> 93 -> 95, so parameters may be
 * missing between the ones shown.
 */
90 int orte_errmgr_hnp_base_global_update_state(
orte_jobid_t job,
91 orte_job_state_t jobstate,
93 orte_proc_state_t state,
95 orte_exit_code_t exit_code);
/*
 * Event hook taking an integer state ("ft" presumably stands for fault
 * tolerance -- confirm).
 */
96 int orte_errmgr_hnp_base_global_ft_event(
int state);
/*
 * "crmig" variant of the global entry points. The declarations mirror the
 * plain orte_errmgr_hnp_global_* set.
 * All of them return int; presumably an ORTE status code -- confirm.
 */

/* Module initialization hook; takes no arguments. */
100 int orte_errmgr_hnp_crmig_global_module_init(
void);
/* Module finalization hook; takes no arguments. */
101 int orte_errmgr_hnp_crmig_global_module_finalize(
void);
/*
 * State-update hook taking a job id, a job state, a process state and an
 * exit code.
 * NOTE(review): listing numbers jump 104 -> 106 -> 108, so parameters may
 * be missing between the ones shown.
 */
103 int orte_errmgr_hnp_crmig_global_update_state(
orte_jobid_t job,
104 orte_job_state_t jobstate,
106 orte_proc_state_t state,
108 orte_exit_code_t exit_code);
/*
 * Predicted-fault hook; first parameter is a list of processes.
 * NOTE(review): the parameter list is cut off in this listing (no closing
 * parenthesis before the next declaration).
 */
109 int orte_errmgr_hnp_crmig_global_predicted_fault(
opal_list_t *proc_list,
/*
 * Map-target suggestion hook; first parameter is the process concerned.
 * NOTE(review): the parameter list is cut off in this listing.
 */
112 int orte_errmgr_hnp_crmig_global_suggest_map_targets(
orte_proc_t *proc,
/*
 * Event hook taking an integer state ("ft" presumably stands for fault
 * tolerance -- confirm).
 */
115 int orte_errmgr_hnp_crmig_global_ft_event(
int state);
/*
 * "autor" variant of the global entry points. No predicted_fault
 * declaration is visible for this variant in this listing.
 * All of them return int; presumably an ORTE status code -- confirm.
 */

/* Module initialization hook; takes no arguments. */
118 int orte_errmgr_hnp_autor_global_module_init(
void);
/* Module finalization hook; takes no arguments. */
119 int orte_errmgr_hnp_autor_global_module_finalize(
void);
/*
 * State-update hook taking a job id, a job state, a process state and an
 * exit code.
 * NOTE(review): listing numbers jump 122 -> 124 -> 126, so parameters may
 * be missing between the ones shown.
 */
121 int orte_errmgr_hnp_autor_global_update_state(
orte_jobid_t job,
122 orte_job_state_t jobstate,
124 orte_proc_state_t state,
126 orte_exit_code_t exit_code);
/*
 * Map-target suggestion hook; first parameter is the process concerned.
 * NOTE(review): the parameter list is cut off in this listing (no closing
 * parenthesis before the next declaration).
 */
127 int orte_errmgr_hnp_autor_global_suggest_map_targets(
orte_proc_t *proc,
/*
 * Event hook taking an integer state ("ft" presumably stands for fault
 * tolerance -- confirm).
 */
130 int orte_errmgr_hnp_autor_global_ft_event(
int state);
Common type for all MCA modules.
Definition: mca.h:100
dynamic pointer array
Definition: opal_pointer_array.h:45
Definition: errmgr_hnp.h:31
uint32_t orte_jobid_t
Set the allowed range for ids in each space.
Definition: types.h:76
Definition: orte_globals.h:386
The Open RTE Error and Recovery Manager (ErrMgr)
Definition: orte_globals.h:316
Definition: opal_list.h:147
bool ignore_current_update
Base Errmgr component.
Definition: errmgr_hnp.h:34
Structure for holding a buffer to be used with the RML or OOB subsystems.
Definition: dss_types.h:159
Definition: orte_globals.h:254