44 int processes_per_node,
45 int64_t node_sum_useful,
46 int64_t node_sum_mpi,
47 int64_t max_useful_time);
void perf_metrics__infer_mpi_model(perf_metrics_mpi_t *metrics, int processes_per_node, int64_t node_sum_useful, int64_t node_sum_mpi, int64_t max_useful_time)
Definition: perf_metrics.c:70
void perf_metrics__base_to_pop_metrics(const char *monitor_name, const pop_base_metrics_t *base_metrics, dlb_pop_metrics_t *pop_metrics)
Definition: perf_metrics.c:670
void perf_metrics__reduce_monitor_into_base_metrics(pop_base_metrics_t *base_metrics, const dlb_monitor_t *monitor, bool all_to_all)
Definition: perf_metrics.c:583
void perf_metrics__local_monitor_into_base_metrics(pop_base_metrics_t *base_metrics, const dlb_monitor_t *monitor)
Definition: perf_metrics.c:634
Definition: dlb_talp.h:35
Definition: dlb_talp.h:91
Definition: perf_metrics.h:34
float communication_efficiency
Definition: perf_metrics.h:36
float load_balance
Definition: perf_metrics.h:37
float lb_out
Definition: perf_metrics.h:39
float lb_in
Definition: perf_metrics.h:38
float parallel_efficiency
Definition: perf_metrics.h:35
Definition: perf_metrics.h:58
int64_t gpu_inactive_time
Definition: perf_metrics.h:92
int64_t elapsed_time
Definition: perf_metrics.h:75
int64_t num_omp_parallels
Definition: perf_metrics.h:71
double min_mpi_normd_proc
Definition: perf_metrics.h:85
double min_mpi_normd_node
Definition: perf_metrics.h:88
int64_t num_omp_tasks
Definition: perf_metrics.h:72
double instructions
Definition: perf_metrics.h:67
int64_t num_measurements
Definition: perf_metrics.h:69
int64_t num_gpu_runtime_calls
Definition: perf_metrics.h:73
int64_t num_mpi_calls
Definition: perf_metrics.h:70
int64_t gpu_useful_time
Definition: perf_metrics.h:90
int64_t gpu_communication_time
Definition: perf_metrics.h:91
int64_t omp_serialization_time
Definition: perf_metrics.h:80
int num_gpus
Definition: perf_metrics.h:64
int64_t useful_time
Definition: perf_metrics.h:76
int64_t gpu_runtime_time
Definition: perf_metrics.h:81
int64_t mpi_time
Definition: perf_metrics.h:77
int64_t omp_load_imbalance_time
Definition: perf_metrics.h:78
int64_t max_gpu_useful_time
Definition: perf_metrics.h:94
float avg_cpus
Definition: perf_metrics.h:63
double cycles
Definition: perf_metrics.h:66
int64_t omp_scheduling_time
Definition: perf_metrics.h:79
int num_nodes
Definition: perf_metrics.h:62
int num_mpi_ranks
Definition: perf_metrics.h:61
int num_cpus
Definition: perf_metrics.h:60
int64_t max_gpu_active_time
Definition: perf_metrics.h:95