19 #ifndef __PERFMODEL_H__
20 #define __PERFMODEL_H__
24 #include <common/config.h>
43 #define _STARPU_PERFMODEL_VERSION 45
47 struct starpu_perfmodel_per_arch** per_arch;
48 int** per_arch_is_set;
50 starpu_pthread_rwlock_t model_rwlock;
60 struct starpu_data_descr;
62 struct starpu_perfmodel_arch;
64 extern unsigned _starpu_calibration_minimum;
66 char *_starpu_get_perf_model_dir_codelet();
67 char *_starpu_get_perf_model_dir_bus();
68 char *_starpu_get_perf_model_dir_debug();
70 double _starpu_history_based_job_expected_perf(
struct starpu_perfmodel *model,
struct starpu_perfmodel_arch* arch,
struct _starpu_job *j,
unsigned nimpl);
71 void _starpu_load_history_based_model(
struct starpu_perfmodel *model,
unsigned scan_history);
72 void _starpu_init_and_load_perfmodel(
struct starpu_perfmodel *model);
73 void _starpu_initialize_registered_performance_models(
void);
74 void _starpu_deinitialize_registered_performance_models(
void);
75 void _starpu_deinitialize_performance_model(
struct starpu_perfmodel *model);
77 double _starpu_regression_based_job_expected_perf(
struct starpu_perfmodel *model,
78 struct starpu_perfmodel_arch* arch,
struct _starpu_job *j,
unsigned nimpl);
79 double _starpu_non_linear_regression_based_job_expected_perf(
struct starpu_perfmodel *model,
80 struct starpu_perfmodel_arch* arch,
struct _starpu_job *j,
unsigned nimpl);
81 double _starpu_multiple_regression_based_job_expected_perf(
struct starpu_perfmodel *model,
struct starpu_perfmodel_arch* arch,
83 void _starpu_update_perfmodel_history(
struct _starpu_job *j,
struct starpu_perfmodel *model,
struct starpu_perfmodel_arch * arch,
84 unsigned cpuid,
double measured,
unsigned nimpl);
85 int _starpu_perfmodel_create_comb_if_needed(
struct starpu_perfmodel_arch* arch);
87 void _starpu_create_sampling_directory_if_needed(
void);
89 void _starpu_load_bus_performance_files(
void);
91 void _starpu_set_calibrate_flag(
unsigned val);
92 unsigned _starpu_get_calibrate_flag(
void);
94 #if defined(STARPU_USE_CUDA)
95 unsigned *_starpu_get_cuda_affinity_vector(
unsigned gpuid);
97 #if defined(STARPU_USE_OPENCL)
98 unsigned *_starpu_get_opencl_affinity_vector(
unsigned gpuid);
101 void _starpu_save_bandwidth_and_latency_disk(
double bandwidth_write,
double bandwidth_read,
102 double latency_write,
double latency_read,
unsigned node,
const char *name);
104 void _starpu_write_double(FILE *f,
const char *format,
double val);
105 int _starpu_read_double(FILE *f,
char *format,
double *val);
106 void _starpu_simgrid_get_platform_path(
int version,
char *path,
size_t maxlen);
108 void _starpu_perfmodel_realloc(
struct starpu_perfmodel *model,
int nb);
110 void _starpu_free_arch_combs(
void);
112 #if defined(STARPU_HAVE_HWLOC)
113 hwloc_topology_t _starpu_perfmodel_get_hwtopology();
int ncombs_set
Definition: perfmodel.h:56
int ncombs
Definition: perfmodel.h:54
Definition: perfmodel.h:46