1 /* Copyright (c) 2007, 2009, 2010. The SimGrid Team.
2 * All rights reserved. */
4 /* This program is free software; you can redistribute it and/or modify it
5 * under the terms of the license (GNU LGPL) which comes with this package. */
7 #include <math.h> // sqrt
10 #include "xbt/sysdep.h"
12 #include "surf/surf.h"
/* Logging sub-category for this file, followed by three file-level
 * dictionaries. Each one starts out NULL and is created by the functions
 * below with xbt_dict_new_homogeneous():
 *   - allocs:  keyed by the "file:line:size" string built in
 *              smpi_shared_malloc(); created with free as the argument.
 *   - samples: keyed by the string returned by sample_location(); created
 *              with free as the argument.
 *   - calls:   keyed by the "func:input" string built in the
 *              smpi_shared_*_call() functions; created with NULL as the
 *              argument.
 * NOTE(review): the argument to xbt_dict_new_homogeneous() is presumably the
 * destructor applied to stored values - confirm against the xbt dict API.
 */
14 XBT_LOG_NEW_DEFAULT_SUBCATEGORY(smpi_bench, smpi,
15 "Logging specific to SMPI (benchmarking)");
17 xbt_dict_t allocs = NULL; /* Allocated on first use */
18 xbt_dict_t samples = NULL; /* Allocated on first use */
19 xbt_dict_t calls = NULL; /* Allocated on first use */
/* Releases the three file-level dictionaries (allocs, samples, calls) by
 * passing the address of each to xbt_dict_free(). Takes no arguments and
 * returns nothing.
 */
37 void smpi_bench_destroy(void)
39 xbt_dict_free(&allocs);
40 xbt_dict_free(&samples);
41 xbt_dict_free(&calls);
/* Requests a simulated computation of `flops` on the host returned by
 * SIMIX_host_self() and waits for that execution to finish.
 *
 * flops: amount of work handed to SIMIX_req_host_execute().
 *
 * The declarations of `host` and `action` are not part of the visible lines.
 * NOTE(review): the meaning of the trailing `1` passed to
 * SIMIX_req_host_execute() is not shown here (presumably a priority) - confirm.
 */
44 static void smpi_execute_flops(double flops)
48 host = SIMIX_host_self();
50 XBT_DEBUG("Handle real computation time: %f flops", flops);
51 action = SIMIX_req_host_execute("computation", host, flops, 1);
/* Tag the action with the category returned by the tracing layer. */
53 SIMIX_req_set_category (action, TRACE_internal_smpi_get_category());
/* Block until the requested execution completes. */
55 SIMIX_req_host_execution_wait(action);
/* Turns a measured duration into a simulated computation.
 *
 * duration: elapsed time to account for (presumably seconds, since
 *           smpi_sleep() passes its `secs` argument here - confirm).
 *
 * When `duration` is at least the "smpi/cpu_threshold" configuration value,
 * it is multiplied by the "smpi/running_power" configuration value and the
 * product is passed to smpi_execute_flops(). Durations below the threshold
 * trigger no call in the lines visible here.
 */
58 static void smpi_execute(double duration)
60 /* FIXME: a global variable would be less expensive to consult than a call to xbt_cfg_get_double() right on the critical path */
61 if (duration >= xbt_cfg_get_double(_surf_cfg_set, "smpi/cpu_threshold")) {
62 XBT_DEBUG("Sleep for %f to handle real computation time", duration);
63 smpi_execute_flops(duration *
64 xbt_cfg_get_double(_surf_cfg_set,
65 "smpi/running_power"));
/* Starts the timer returned by smpi_process_timer(). Paired with
 * smpi_bench_end(), which stops the same timer and accounts for the
 * elapsed time.
 */
69 void smpi_bench_begin(void)
71 xbt_os_timer_start(smpi_process_timer());
/* Stops the timer returned by smpi_process_timer() and passes its elapsed
 * time to smpi_execute(), which converts it into a simulated computation
 * when it reaches the configured threshold.
 */
74 void smpi_bench_end(void)
76 xbt_os_timer_t timer = smpi_process_timer();
78 xbt_os_timer_stop(timer);
79 smpi_execute(xbt_os_timer_elapsed(timer));
/* Accounts for a sleep by passing `secs`, converted to double, to
 * smpi_execute().
 *
 * secs: requested duration.
 *
 * The return statement is not part of the visible lines.
 * NOTE(review): because smpi_execute() only acts on durations at or above
 * "smpi/cpu_threshold", a shorter sleep appears to advance nothing - confirm
 * this is intended.
 */
82 unsigned int smpi_sleep(unsigned int secs)
84 smpi_execute((double) secs);
/* Fills `tv` from the clock value returned by SIMIX_get_clock().
 *
 * tv: receives the time; tv_sec gets the clock value truncated to time_t.
 * tz: not referenced in the visible lines.
 *
 * Any guard on `tv` and the return statement are not part of the visible
 * lines.
 */
88 int smpi_gettimeofday(struct timeval *tv, struct timezone *tz)
90 double now = SIMIX_get_clock();
93 tv->tv_sec = (time_t) now;
/* NOTE(review): this stores the whole clock value scaled by 1e6, not the
 * sub-second remainder. gettimeofday() conventionally keeps tv_usec in
 * 0..999999, which would be (now - tv->tv_sec) * 1e6 - confirm and fix. */
94 tv->tv_usec = (suseconds_t) (now * 1e6);
/* Builds the dictionary key that identifies a sampling site.
 *
 * global: selects the key format (the branching lines are not visible;
 *         presumably non-zero picks the shorter, process-independent form -
 *         confirm).
 * file, line: source location of the sampling site.
 *
 * Returns a string produced by bprintf(): either "file:line" or
 * "file:line:<smpi_process_index()>".
 * NOTE(review): the result is presumably heap-allocated and owned by the
 * caller - confirm against bprintf().
 */
99 static char *sample_location(int global, const char *file, int line)
102 return bprintf("%s:%d", file, line);
104 return bprintf("%s:%d:%d", file, line, smpi_process_index());
/* First step of the sampling protocol: registers the sampling site.
 *
 * global, file, line: forwarded to sample_location() to build the key.
 * iters:     iteration budget (its assignment is not in the visible lines).
 * threshold: stored in the new record's `threshold` field.
 *
 * Visible behaviour: ends the current benchmark interval, creates the
 * `samples` dictionary, looks the key up, and allocates and stores a new
 * local_data_t record under that key. The conditions guarding these steps,
 * the initialisation of the other record fields (count, sum, iters, started
 * are read elsewhere in this file), the handling of `loc` and the return
 * value are not part of the visible lines.
 */
108 int smpi_sample_1(int global, const char *file, int line, int iters, double threshold)
110 char *loc = sample_location(global, file, line);
113 smpi_bench_end(); /* Take time from previous MPI call into account */
115 samples = xbt_dict_new_homogeneous(free);
117 data = xbt_dict_get_or_null(samples, loc);
119 data = (local_data_t *) xbt_new(local_data_t, 1);
122 data->sum_pow2 = 0.0;
124 data->threshold = threshold;
126 xbt_dict_set(samples, loc, data, NULL);
/* Second step of the sampling protocol: decides whether the sampled code
 * should run for real or be replaced by its recorded mean.
 *
 * global, file, line: forwarded to sample_location() to build the key.
 *
 * Requires that `samples` exists and holds a record for the key; both are
 * enforced with xbt_assert(). Returns the record's `started` field.
 *
 * The branches that update `started` and `count`, and the handling of `loc`,
 * are not part of the visible lines.
 */
133 int smpi_sample_2(int global, const char *file, int line)
135 char *loc = sample_location(global, file, line);
138 xbt_assert(samples, "You did something very inconsistent, didn't you?");
139 data = xbt_dict_get_or_null(samples, loc);
141 xbt_assert(data, "Please, do thing in order");
143 if (!data->started) {
/* Stop measuring when either the iteration budget is used up (only checked
 * when iters > 0), or more than one sample exists and the relative standard
 * error has reached a positive threshold. */
144 if ((data->iters > 0 && data->count >= data->iters)
145 || (data->count > 1 && data->threshold > 0.0 && data->relstderr <= data->threshold)) {
146 XBT_DEBUG("Perform some wait of %f", data->mean);
/* Inject the recorded mean duration instead of running the code. */
147 smpi_execute(data->mean);
157 smpi_process_simulated_start();
158 return data->started;
/* Third step of the sampling protocol: folds the latest measurement into the
 * record's running statistics.
 *
 * global, file, line: forwarded to sample_location() to build the key.
 *
 * Requires that `samples` exists (enforced with xbt_assert()). When a record
 * is found, is marked started and count < iters, the value returned by
 * smpi_process_simulated_elapsed() is taken as the new sample; its square is
 * added to sum_pow2, and mean and relstderr are recomputed with n = count.
 * The update of `sum` and the handling of `loc` are not part of the visible
 * lines.
 *
 * NOTE(review): smpi_sample_2() treats iters <= 0 as "no iteration budget",
 * but the `count < iters` guard here would then skip every update - confirm
 * threshold-only sampling works as intended.
 */
161 void smpi_sample_3(int global, const char *file, int line)
163 char *loc = sample_location(global, file, line);
167 xbt_assert(samples, "You did something very inconsistent, didn't you?");
168 data = xbt_dict_get_or_null(samples, loc);
170 if(data && data->started && data->count < data->iters) {
171 sample = smpi_process_simulated_elapsed();
173 data->sum_pow2 += sample * sample;
174 n = (double)data->count;
175 data->mean = data->sum / n;
/* Relative standard error: sqrt(variance / n) divided by the mean, with
 * variance computed as E[x^2] - mean^2.
 * NOTE(review): no guard against mean == 0 or a slightly negative variance
 * from rounding is visible; either yields inf/NaN - confirm. */
176 data->relstderr = sqrt((data->sum_pow2 / n - data->mean * data->mean) / n) / data->mean;
177 XBT_DEBUG("Average mean after %d steps is %f, relative standard error is %f (sample was %f)", data->count,
178 data->mean, data->relstderr, sample);
/* Public wrapper that forwards `flops` unchanged to the file-local
 * smpi_execute_flops().
 */
183 void smpi_sample_flops(double flops)
185 smpi_execute_flops(flops);
/* Allocates, or looks up, a buffer identified by its call site and size.
 *
 * size:       number of payload bytes requested.
 * file, line: call site; together with `size` they form the dictionary key
 *             "file:line:size".
 *
 * Visible behaviour: creates the `allocs` dictionary, looks the key up, and
 * allocates a zero-filled shared_data_t of sizeof(int) + size bytes that is
 * stored under the key. The guards around these steps, any reference-count
 * update, the handling of `loc` and the returned pointer are not part of the
 * visible lines.
 *
 * NOTE(review): the sizeof(int) header must match the one-int step back done
 * in smpi_shared_free(); presumably the payload follows a leading int field
 * of shared_data_t - confirm against the type definition.
 */
188 void *smpi_shared_malloc(size_t size, const char *file, int line)
190 char *loc = bprintf("%s:%d:%zu", file, line, size);
194 allocs = xbt_dict_new_homogeneous(free);
196 data = xbt_dict_get_or_null(allocs, loc);
198 data = (shared_data_t *) xbt_malloc0(sizeof(int) + size);
200 xbt_dict_set(allocs, loc, data, NULL);
/* Releases a buffer obtained from smpi_shared_malloc().
 *
 * ptr: payload pointer; the record header is recovered by stepping back one
 *      int from it.
 *
 * Visible behaviour: warns when nothing was allocated, finds the dictionary
 * key of the record with xbt_dict_get_key(), warns when the pointer is not
 * known, and removes the entry from `allocs` once the record's count is at
 * or below zero. The conditions guarding the warnings and the statement that
 * changes `count` are not part of the visible lines.
 */
208 void smpi_shared_free(void *ptr)
/* Step back over the leading int to reach the start of the record. */
210 shared_data_t *data = (shared_data_t *) ((int *) ptr - 1);
214 XBT_WARN("Cannot free: nothing was allocated");
217 loc = xbt_dict_get_key(allocs, data);
219 XBT_WARN("Cannot free: %p was not shared-allocated by SMPI", ptr);
223 if (data->count <= 0) {
224 xbt_dict_remove(allocs, loc);
/* Tests whether a result is recorded for the (func, input) pair.
 *
 * func, input: combined into the dictionary key "func:input".
 *
 * Visible behaviour: creates the `calls` dictionary, then probes it with
 * xbt_dict_get(), which throws when the key is absent; an exception of
 * category not_found_error is handled specially. The try/catch framing, the
 * handling of other exception categories, the handling of `loc` and the
 * return value are not part of the visible lines.
 */
228 int smpi_shared_known_call(const char* func, const char* input) {
229 char* loc = bprintf("%s:%s", func, input);
234 calls = xbt_dict_new_homogeneous(NULL);
237 xbt_dict_get(calls, loc); /* Succeed or throw */
241 if(ex.category == not_found_error) {
/* Fetches the value recorded for the (func, input) pair.
 *
 * func, input: combined into the dictionary key "func:input".
 *
 * Visible behaviour: creates the `calls` dictionary and reads the entry with
 * xbt_dict_get(). The guard around the creation, the handling of `loc` and
 * the return statement are not part of the visible lines.
 * NOTE(review): xbt_dict_get() is annotated "Succeed or throw" in
 * smpi_shared_known_call(), so callers presumably need to check that the
 * call is known first - confirm.
 */
252 void* smpi_shared_get_call(const char* func, const char* input) {
253 char* loc = bprintf("%s:%s", func, input);
257 calls = xbt_dict_new_homogeneous(NULL);
259 data = xbt_dict_get(calls, loc);
/* Records `data` as the value for the (func, input) pair.
 *
 * func, input: combined into the dictionary key "func:input".
 * data:        value stored in the `calls` dictionary under that key.
 *
 * Visible behaviour: creates the `calls` dictionary and stores `data` with
 * xbt_dict_set(). The guard around the creation, the handling of `loc` and
 * the return statement are not part of the visible lines.
 * NOTE(review): `calls` is created with a NULL argument, so the dictionary
 * presumably does not free stored values - confirm who owns `data`.
 */
264 void* smpi_shared_set_call(const char* func, const char* input, void* data) {
265 char* loc = bprintf("%s:%s", func, input);
268 calls = xbt_dict_new_homogeneous(NULL);
270 xbt_dict_set(calls, loc, data, NULL);