#ifndef __PERFMODEL_H__
#define __PERFMODEL_H__
#include <common/config.h>
/* Performance-model version constant (value 45).
 * NOTE(review): presumably identifies the stored model format and is bumped
 * when that format changes -- confirm against the code that reads it. */
#define _STARPU_PERFMODEL_VERSION 45
/* NOTE(review): the three declarations below look like members of a struct
 * whose opening line and closing brace are not part of this excerpt, and the
 * leading numbers look like source-listing line numbers rather than code.
 * Confirm against the original header before treating these as file-scope
 * declarations. */
47 struct starpu_perfmodel_per_arch** per_arch;
48 int** per_arch_is_set;
50 starpu_pthread_rwlock_t model_rwlock;
/* Forward declarations: only pointers to these types are used by the
 * prototypes in this header, so the full definitions are not needed here. */
struct starpu_data_descr;
struct starpu_perfmodel_arch;
/* Declared here, defined in another translation unit.
 * NOTE(review): presumably the minimum number of measurements needed before a
 * model is considered calibrated -- inferred from the name, confirm. */
extern unsigned _starpu_calibration_minimum;
/* Returns a string for the codelet performance-model directory (purpose
 * inferred from the name; ownership of the returned buffer is not visible
 * here -- confirm before freeing or modifying it).
 * Spelled (void) so this is a real prototype: before C23 an empty () leaves
 * the argument list unchecked. */
char *_starpu_get_perf_model_dir_codelet(void);
/* Returns a string for the bus performance-model directory (purpose inferred
 * from the name; ownership of the returned buffer is not visible here --
 * confirm before freeing or modifying it).
 * Spelled (void) so this is a real prototype: before C23 an empty () leaves
 * the argument list unchecked. */
char *_starpu_get_perf_model_dir_bus(void);
/* Returns a string for the debug performance-model directory (purpose
 * inferred from the name; ownership of the returned buffer is not visible
 * here -- confirm before freeing or modifying it).
 * Spelled (void) so this is a real prototype: before C23 an empty () leaves
 * the argument list unchecked. */
char *_starpu_get_perf_model_dir_debug(void);
/* Expected-performance query for job j, given a model, an architecture and an
 * implementation index nimpl.
 * NOTE(review): the name suggests a history-based estimate; the meaning and
 * units of the returned double are set by the definition, which is not
 * visible here. */
double _starpu_history_based_job_expected_perf(struct starpu_perfmodel *model,
	struct starpu_perfmodel_arch *arch,
	struct _starpu_job *j,
	unsigned nimpl);
/* Loads a history-based model into `model` (purpose inferred from the name).
 * NOTE(review): scan_history looks like a boolean flag selecting whether the
 * recorded history is also read -- confirm against the definition. */
void _starpu_load_history_based_model(struct starpu_perfmodel *model,
	unsigned scan_history);
/* Initializes `model` and loads its data (purpose inferred from the name;
 * the definition is not visible in this header). */
void _starpu_init_and_load_perfmodel(struct starpu_perfmodel *model);
/* Global set-up hook for the registered performance models; takes no
 * arguments and returns nothing. Counterpart of
 * _starpu_deinitialize_registered_performance_models(). */
void _starpu_initialize_registered_performance_models(void);
/* Global tear-down hook for the registered performance models; takes no
 * arguments and returns nothing. Counterpart of
 * _starpu_initialize_registered_performance_models(). */
void _starpu_deinitialize_registered_performance_models(void);
/* Tears down a single performance model (purpose inferred from the name).
 * NOTE(review): whether `model` itself is freed is not visible here. */
void _starpu_deinitialize_performance_model(struct starpu_perfmodel *model);
/* Expected-performance query for job j, given a model, an architecture and an
 * implementation index nimpl.
 * NOTE(review): the name suggests a regression-based estimate; the meaning
 * and units of the returned double are set by the definition, which is not
 * visible here. */
double _starpu_regression_based_job_expected_perf(struct starpu_perfmodel *model,
	struct starpu_perfmodel_arch *arch,
	struct _starpu_job *j,
	unsigned nimpl);
/* Expected-performance query for job j, given a model, an architecture and an
 * implementation index nimpl.
 * NOTE(review): the name suggests a non-linear-regression estimate; the
 * meaning and units of the returned double are set by the definition, which
 * is not visible here. */
double _starpu_non_linear_regression_based_job_expected_perf(struct starpu_perfmodel *model,
	struct starpu_perfmodel_arch *arch,
	struct _starpu_job *j,
	unsigned nimpl);
/* Expected-performance query for job j, given a model, an architecture and an
 * implementation index nimpl.
 * NOTE(review): the excerpt this was recovered from ended after `arch`,
 * leaving the parameter list open. The trailing `j` and `nimpl` parameters
 * are restored to match the sibling *_regression_based_job_expected_perf
 * prototypes -- confirm against the function's definition. */
double _starpu_multiple_regression_based_job_expected_perf(struct starpu_perfmodel *model,
	struct starpu_perfmodel_arch *arch,
	struct _starpu_job *j,
	unsigned nimpl);
/* Records a measurement for job j in `model`, for the given architecture,
 * CPU id and implementation index (purpose inferred from the name and
 * parameters).
 * NOTE(review): the unit of `measured` is not visible in this header. */
void _starpu_update_perfmodel_history(struct _starpu_job *j,
	struct starpu_perfmodel *model,
	struct starpu_perfmodel_arch *arch,
	unsigned cpuid,
	double measured,
	unsigned nimpl);
/* Takes an architecture description and returns an int.
 * NOTE(review): presumably the identifier of the (possibly newly created)
 * architecture combination -- inferred from the name, confirm. */
int _starpu_perfmodel_create_comb_if_needed(struct starpu_perfmodel_arch *arch);
/* Ensures the sampling directory exists (purpose inferred from the name);
 * takes no arguments and reports nothing back to the caller. */
void _starpu_create_sampling_directory_if_needed(void);
/* Loads the bus performance files (purpose inferred from the name); takes no
 * arguments and reports nothing back to the caller. */
void _starpu_load_bus_performance_files(void);
/* Setter for the calibrate flag; counterpart of _starpu_get_calibrate_flag().
 * NOTE(review): the accepted values of `val` are not visible in this header. */
void _starpu_set_calibrate_flag(unsigned val);
/* Getter for the calibrate flag; counterpart of _starpu_set_calibrate_flag(). */
unsigned _starpu_get_calibrate_flag(void);
#if defined(STARPU_USE_CUDA)
/* Only declared in CUDA-enabled builds. Returns a pointer to unsigned values
 * for the GPU identified by gpuid.
 * NOTE(review): length and ownership of the returned array are not visible
 * here. The closing #endif was missing from the excerpt and is restored so
 * the conditional does not swallow the declarations that follow. */
unsigned *_starpu_get_cuda_affinity_vector(unsigned gpuid);
#endif /* STARPU_USE_CUDA */
#if defined(STARPU_USE_OPENCL)
/* Only declared in OpenCL-enabled builds. Returns a pointer to unsigned
 * values for the GPU identified by gpuid.
 * NOTE(review): length and ownership of the returned array are not visible
 * here. The closing #endif was missing from the excerpt and is restored so
 * the conditional does not swallow the declarations that follow. */
unsigned *_starpu_get_opencl_affinity_vector(unsigned gpuid);
#endif /* STARPU_USE_OPENCL */
/* Stores read/write bandwidth and latency figures for a disk, identified by
 * `node` and `name` (purpose inferred from the name and parameters).
 * NOTE(review): the units of the four measurements are not visible in this
 * header. */
void _starpu_save_bandwidth_and_latency_disk(double bandwidth_write,
	double bandwidth_read,
	double latency_write,
	double latency_read,
	unsigned node,
	const char *name);
/* Writes `val` to stream `f` according to `format` (purpose inferred from the
 * name). Counterpart of _starpu_read_double().
 * NOTE(review): the handling of special values such as NaN is defined by the
 * implementation, not visible here. */
void _starpu_write_double(FILE *f, const char *format, double val);
/* Reads a double from stream `f` according to `format` into *val (purpose
 * inferred from the name). Counterpart of _starpu_write_double().
 * NOTE(review): the meaning of the int result is not visible here --
 * presumably a scanf-style conversion count, confirm.
 * `format` is deliberately left non-const: the definition lives elsewhere and
 * must keep matching this prototype. */
int _starpu_read_double(FILE *f, char *format, double *val);
/* Fills the caller-supplied buffer `path` (capacity `maxlen`) with the
 * SimGrid platform path for the given `version` (purpose inferred from the
 * name and parameters).
 * NOTE(review): behavior when the path does not fit in maxlen bytes is not
 * visible here. */
void _starpu_simgrid_get_platform_path(int version, char *path, size_t maxlen);
/* Resizes storage held by `model` (purpose inferred from the name).
 * NOTE(review): what `nb` counts (presumably a number of entries) is not
 * visible in this header -- confirm against the definition. */
void _starpu_perfmodel_realloc(struct starpu_perfmodel *model, int nb);
/* Releases the architecture combinations (purpose inferred from the name);
 * takes no arguments and returns nothing. */
void _starpu_free_arch_combs(void);
#if defined(STARPU_HAVE_HWLOC)
/* Only declared when hwloc support is compiled in. Returns an hwloc topology
 * handle.
 * NOTE(review): ownership and lifetime of the handle are not visible here.
 * Spelled (void) so this is a real prototype: before C23 an empty () leaves
 * the argument list unchecked. The closing #endif was missing from the
 * excerpt and is restored. */
hwloc_topology_t _starpu_perfmodel_get_hwtopology(void);
#endif /* STARPU_HAVE_HWLOC */
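/*
 * Cross-reference notes carried over from the generated source listing
 * (not part of the header's code):
 *   int ncombs_set  -- Definition perfmodel.h:56
 *   int ncombs      -- Definition perfmodel.h:54
 *   (unnamed entry) -- Definition perfmodel.h:46
 */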