X-Git-Url: http://info.iut-bm.univ-fcomte.fr/pub/gitweb/simgrid.git/blobdiff_plain/02e37010625e82cedbbfc3d1a5982eaa3b18b176..a4ab179f11ae2afec1467c4ca9256fc5ba6fa85b:/src/smpi/smpi_bench.cpp diff --git a/src/smpi/smpi_bench.cpp b/src/smpi/smpi_bench.cpp index 5e18345c34..3b01c90dce 100644 --- a/src/smpi/smpi_bench.cpp +++ b/src/smpi/smpi_bench.cpp @@ -1,5 +1,4 @@ -/* Copyright (c) 2007, 2009-2015. The SimGrid Team. - * All rights reserved. */ +/* Copyright (c) 2007, 2009-2017. The SimGrid Team. All rights reserved. */ /* This program is free software; you can redistribute it and/or modify it * under the terms of the license (GNU LGPL) which comes with this package. */ @@ -12,6 +11,7 @@ #include "src/internal_config.h" #include "private.h" #include "private.hpp" +#include #include "xbt/dict.h" #include "xbt/sysdep.h" #include "xbt/ex.h" @@ -20,11 +20,11 @@ #include "simgrid/modelchecker.h" #include "src/mc/mc_replay.h" +#include #ifndef WIN32 #include #endif #include -#include #include #include #include // sqrt @@ -32,6 +32,10 @@ #include #include +#if HAVE_PAPI +#include +#endif + #ifndef MAP_ANONYMOUS #define MAP_ANONYMOUS MAP_ANON #endif @@ -71,16 +75,16 @@ XBT_LOG_NEW_DEFAULT_SUBCATEGORY(smpi_bench, smpi, "Logging specific to SMPI (ben #define PTR_STRLEN (2 + 2 * sizeof(void*) + 1) -xbt_dict_t samples = NULL; /* Allocated on first use */ -xbt_dict_t calls = NULL; /* Allocated on first use */ +xbt_dict_t samples = nullptr; /* Allocated on first use */ +xbt_dict_t calls = nullptr; /* Allocated on first use */ double smpi_cpu_threshold; -double smpi_running_power; +double smpi_host_speed; int smpi_loaded_page = -1; -char* smpi_start_data_exe = NULL; +char* smpi_start_data_exe = nullptr; int smpi_size_data_exe = 0; -int smpi_privatize_global_variables; +bool smpi_privatize_global_variables; double smpi_total_benched_time = 0; smpi_privatisation_region_t smpi_privatisation_regions; @@ -93,10 +97,10 @@ namespace { class smpi_source_location { public: smpi_source_location(const char* filename, int line) - : filename(filename), filename_length(strlen(filename)), line(line) {} + : filename(xbt_strdup(filename)), filename_length(strlen(filename)), line(line) {} /** Pointer to a static string containing the file name */ - const char* filename = nullptr; + char* filename = nullptr; int filename_length = 0; int line = 0; @@ -155,24 +159,26 @@ static size_t shm_size(int fd) { if(fstat(fd, &st) < 0) { xbt_die("Could not stat fd %d: %s", fd, strerror(errno)); } - return (size_t)st.st_size; + return static_cast(st.st_size); } #ifndef WIN32 static void* shm_map(int fd, size_t size, shared_data_key_type* data) { - void* mem; char loc[PTR_STRLEN]; shared_metadata_t meta; - if(size > shm_size(fd)) { - if(ftruncate(fd, (off_t)size) < 0) { + if(size > shm_size(fd) && (ftruncate(fd, static_cast(size)) < 0)) { xbt_die("Could not truncate fd %d to %zu: %s", fd, size, strerror(errno)); - } } - mem = mmap(NULL, size, PROT_READ | PROT_WRITE, MAP_SHARED, fd, 0); + void* mem = mmap(nullptr, size, PROT_READ | PROT_WRITE, MAP_SHARED, fd, 0); if(mem == MAP_FAILED) { - xbt_die("Could not map fd %d: %s", fd, strerror(errno)); + xbt_die( + "Failed to map fd %d with size %zu: %s\n" + "If you are running a lot of ranks, you may be exceeding the amount of mappings allowed per process.\n" + "On Linux systems, change this value with sudo sysctl -w vm.max_map_count=newvalue (default value: 65536)\n" + "Please see http://simgrid.gforge.inria.fr/simgrid/latest/doc/html/options.html#options_virt for more info.", + fd, size, strerror(errno)); } snprintf(loc, PTR_STRLEN, "%p", mem); meta.size = size; @@ -183,7 +189,7 @@ static void* shm_map(int fd, size_t size, shared_data_key_type* data) { } #endif -void smpi_bench_destroy(void) +void smpi_bench_destroy() { allocs.clear(); allocs_metadata.clear(); @@ -204,9 +210,8 @@ void smpi_execute_(double *duration) } void smpi_execute_flops(double flops) { - smx_synchro_t action; XBT_DEBUG("Handle real computation time: %f flops", flops); - action = simcall_execution_start("computation", flops, 1, 0, 0); + smx_activity_t action = simcall_execution_start("computation", flops, 1, 0); simcall_set_category (action, TRACE_internal_smpi_get_category()); simcall_execution_wait(action); smpi_switch_data_segment(smpi_process_index()); @@ -216,12 +221,13 @@ void smpi_execute(double duration) { if (duration >= smpi_cpu_threshold) { XBT_DEBUG("Sleep for %g to handle real computation time", duration); - double flops = duration * smpi_running_power; + double flops = duration * smpi_host_speed; int rank = smpi_process_index(); instr_extra_data extra = xbt_new0(s_instr_extra_data_t,1); extra->type=TRACING_COMPUTING; extra->comp_size=flops; TRACE_smpi_computing_in(rank, extra); + smpi_execute_flops(flops); TRACE_smpi_computing_out(rank); @@ -232,9 +238,7 @@ void smpi_execute(double duration) } } -void smpi_switch_data_segment(int dest); - -void smpi_bench_begin(void) +void smpi_bench_begin() { if (smpi_privatize_global_variables) { smpi_switch_data_segment(smpi_process_index()); @@ -243,27 +247,90 @@ void smpi_bench_begin(void) if (MC_is_active() || MC_record_replay_is_active()) return; +#if HAVE_PAPI + if (xbt_cfg_get_string("smpi/papi-events")[0] != '\0') { + int event_set = smpi_process_papi_event_set(); + // PAPI_start sets everything to 0! See man(3) PAPI_start + if (PAPI_LOW_LEVEL_INITED == PAPI_is_initialized()) { + if (PAPI_start(event_set) != PAPI_OK) { + // TODO This needs some proper handling. + XBT_CRITICAL("Could not start PAPI counters.\n"); + xbt_die("Error."); + } + } + } +#endif xbt_os_threadtimer_start(smpi_process_timer()); } -void smpi_bench_end(void) +void smpi_bench_end() { - if (MC_is_active() || MC_record_replay_is_active()) return; + double speedup = 1; xbt_os_timer_t timer = smpi_process_timer(); xbt_os_threadtimer_stop(timer); -// smpi_switch_data_segment(smpi_process_count()); + +#if HAVE_PAPI + /** + * An MPI function has been called and now is the right time to update + * our PAPI counters for this process. + */ + if (xbt_cfg_get_string("smpi/papi-events")[0] != '\0') { + papi_counter_t& counter_data = smpi_process_papi_counters(); + int event_set = smpi_process_papi_event_set(); + std::vector event_values = std::vector(counter_data.size()); + + if (PAPI_stop(event_set, &event_values[0]) != PAPI_OK) { // Error + XBT_CRITICAL("Could not stop PAPI counters.\n"); + xbt_die("Error."); + } else { + for (unsigned int i = 0; i < counter_data.size(); i++) { + counter_data[i].second += event_values[i]; + // XBT_DEBUG("[%i] PAPI: Counter %s: Value is now %lli (got increment by %lli\n", smpi_process_index(), + // counter_data[i].first.c_str(), counter_data[i].second, event_values[i]); + } + } + } +#endif + if (smpi_process_get_sampling()) { XBT_CRITICAL("Cannot do recursive benchmarks."); XBT_CRITICAL("Are you trying to make a call to MPI within a SMPI_SAMPLE_ block?"); xbt_backtrace_display_current(); xbt_die("Aborting."); } + + if (xbt_cfg_get_string("smpi/comp-adjustment-file")[0] != '\0') { // Maybe we need to artificially speed up or slow + // down our computation based on our statistical analysis. + + smpi_trace_call_location_t* loc = smpi_process_get_call_location(); + std::string key = loc->get_composed_key(); + std::unordered_map::const_iterator it = location2speedup.find(key); + if (it != location2speedup.end()) { + speedup = it->second; + } + } + // Simulate the benchmarked computation unless disabled via command-line argument - if (xbt_cfg_get_boolean("smpi/simulate-computation")) - smpi_execute(xbt_os_timer_elapsed(timer)); + if (xbt_cfg_get_boolean("smpi/simulate-computation")) { + smpi_execute(xbt_os_timer_elapsed(timer)/speedup); + } + +#if HAVE_PAPI + if (xbt_cfg_get_string("smpi/papi-events")[0] != '\0' && TRACE_smpi_is_enabled()) { + char container_name[INSTR_DEFAULT_STR_SIZE]; + smpi_container(smpi_process_index(), container_name, INSTR_DEFAULT_STR_SIZE); + container_t container = PJ_container_get(container_name); + papi_counter_t& counter_data = smpi_process_papi_counters(); + + for (auto& pair : counter_data) { + new_pajeSetVariable(surf_get_clock(), container, + PJ_type_get(/* countername */ pair.first.c_str(), container->type), pair.second); + } + } +#endif smpi_total_benched_time += xbt_os_timer_elapsed(timer); } @@ -290,41 +357,64 @@ static unsigned int private_sleep(double secs) unsigned int smpi_sleep(unsigned int secs) { - return private_sleep((double)secs); + return private_sleep(static_cast(secs)); } int smpi_usleep(useconds_t usecs) { - return (int)private_sleep((double)usecs / 1000000.0); + return static_cast(private_sleep(static_cast(usecs) / 1000000.0)); } +#if _POSIX_TIMERS > 0 +int smpi_nanosleep(const struct timespec *tp, struct timespec * t) +{ + return static_cast(private_sleep(static_cast(tp->tv_sec + tp->tv_nsec / 1000000000.0))); +} +#endif + int smpi_gettimeofday(struct timeval *tv, void* tz) { double now; smpi_bench_end(); now = SIMIX_get_clock(); if (tv) { - tv->tv_sec = (time_t)now; + tv->tv_sec = static_cast(now); #ifdef WIN32 - tv->tv_usec = (useconds_t)((now - tv->tv_sec) * 1e6); + tv->tv_usec = static_cast((now - tv->tv_sec) * 1e6); #else - tv->tv_usec = (suseconds_t)((now - tv->tv_sec) * 1e6); + tv->tv_usec = static_cast((now - tv->tv_sec) * 1e6); #endif } smpi_bench_begin(); return 0; } +#if _POSIX_TIMERS > 0 +int smpi_clock_gettime(clockid_t clk_id, struct timespec *tp) +{ + //there is only one time in SMPI, so clk_id is ignored. + double now; + smpi_bench_end(); + now = SIMIX_get_clock(); + if (tp) { + tp->tv_sec = static_cast(now); + tp->tv_nsec = static_cast((now - tp->tv_sec) * 1e9); + } + smpi_bench_begin(); + return 0; +} +#endif + extern double sg_surf_precision; -unsigned long long smpi_rastro_resolution (void) +unsigned long long smpi_rastro_resolution () { smpi_bench_end(); double resolution = (1/sg_surf_precision); smpi_bench_begin(); - return (unsigned long long)resolution; + return static_cast(resolution); } -unsigned long long smpi_rastro_timestamp (void) +unsigned long long smpi_rastro_timestamp () { smpi_bench_end(); double now = SIMIX_get_clock(); @@ -332,7 +422,7 @@ unsigned long long smpi_rastro_timestamp (void) unsigned long long sec = (unsigned long long)now; unsigned long long pre = (now - sec) * smpi_rastro_resolution(); smpi_bench_begin(); - return (unsigned long long)sec * smpi_rastro_resolution() + pre; + return static_cast(sec) * smpi_rastro_resolution() + pre; } /* ****************************** Functions related to the SMPI_SAMPLE_ macros ************************************/ @@ -376,14 +466,14 @@ void smpi_sample_1(int global, const char *file, int line, int iters, double thr smpi_bench_end(); /* Take time from previous, unrelated computation into account */ smpi_process_set_sampling(1); - if (!samples) + if (samples==nullptr) samples = xbt_dict_new_homogeneous(free); data = static_cast(xbt_dict_get_or_null(samples, loc)); - if (!data) { + if (data==nullptr) { xbt_assert(threshold>0 || iters>0, "You should provide either a positive amount of iterations to bench, or a positive maximal stderr (or both)"); - data = (local_data_t *) xbt_new(local_data_t, 1); + data = static_cast( xbt_new(local_data_t, 1)); data->count = 0; data->sum = 0.0; data->sum_pow2 = 0.0; @@ -391,7 +481,7 @@ void smpi_sample_1(int global, const char *file, int line, int iters, double thr data->threshold = threshold; data->benching = 1; // If we have no data, we need at least one data->mean = 0; - xbt_dict_set(samples, loc, data, NULL); + xbt_dict_set(samples, loc, data, nullptr); XBT_DEBUG("XXXXX First time ever on benched nest %s.",loc); } else { if (data->iters != iters || data->threshold != threshold) { @@ -403,7 +493,7 @@ void smpi_sample_1(int global, const char *file, int line, int iters, double thr // if we already have some data, check whether sample_2 should get one more bench or whether it should emulate // the computation instead - data->benching = !sample_enough_benchs(data); + data->benching = (sample_enough_benchs(data) == 0); XBT_DEBUG("XXXX Re-entering the benched nest %s. %s",loc, (data->benching?"more benching needed":"we have enough data, skip computes")); } @@ -462,10 +552,10 @@ void smpi_sample_3(int global, const char *file, int line) sample = xbt_os_timer_elapsed(smpi_process_timer()); data->sum += sample; data->sum_pow2 += sample * sample; - n = (double)data->count; + n = static_cast(data->count); data->mean = data->sum / n; data->relstderr = sqrt((data->sum_pow2 / n - data->mean * data->mean) / n) / data->mean; - if (!sample_enough_benchs(data)) { + if (sample_enough_benchs(data)==0) { data->mean = sample; // Still in benching process; We want sample_2 to simulate the exact time of this loop // occurrence before leaving, not the mean over the history } @@ -481,7 +571,7 @@ void smpi_sample_3(int global, const char *file, int line) void *smpi_shared_malloc(size_t size, const char *file, int line) { void* mem; - if (xbt_cfg_get_boolean("smpi/use-shared-malloc")){ + if (size > 0 && xbt_cfg_get_boolean("smpi/use-shared-malloc")){ int fd; smpi_source_location loc(file, line); auto res = allocs.insert(std::make_pair(loc, shared_data_t())); @@ -493,12 +583,10 @@ void *smpi_shared_malloc(size_t size, const char *file, int line) snprintf(shmname, 31, "/shmalloc%p", &*data); fd = shm_open(shmname, O_RDWR | O_CREAT | O_EXCL, S_IRUSR | S_IWUSR | S_IRGRP | S_IROTH); if (fd < 0) { - switch(errno) { - case EEXIST: - xbt_die("Please cleanup /dev/shm/%s", shmname); - default: - xbt_die("An unhandled error occurred while opening %s. shm_open: %s", shmname, strerror(errno)); - } + if(errno==EEXIST) + xbt_die("Please cleanup /dev/shm/%s", shmname); + else + xbt_die("An unhandled error occurred while opening %s. shm_open: %s", shmname, strerror(errno)); } data->second.fd = fd; data->second.count = 1; @@ -528,7 +616,7 @@ void smpi_shared_free(void *ptr) snprintf(loc, PTR_STRLEN, "%p", ptr); auto meta = allocs_metadata.find(ptr); if (meta == allocs_metadata.end()) { - XBT_WARN("Cannot free: %p was not shared-allocated by SMPI", ptr); + XBT_WARN("Cannot free: %p was not shared-allocated by SMPI - maybe its size was 0?", ptr); return; } shared_data_t* data = &meta->second.data->second; @@ -536,11 +624,12 @@ void smpi_shared_free(void *ptr) XBT_WARN("Unmapping of fd %d failed: %s", data->fd, strerror(errno)); } data->count--; - XBT_DEBUG("Shared free - no removal - of %p, count = %d", ptr, data->count); if (data->count <= 0) { close(data->fd); allocs.erase(allocs.find(meta->second.data->first)); XBT_DEBUG("Shared free - with removal - of %p", ptr); + }else{ + XBT_DEBUG("Shared free - no removal - of %p, count = %d", ptr, data->count); } }else{ XBT_DEBUG("Classic free of %p", ptr); @@ -552,23 +641,24 @@ void smpi_shared_free(void *ptr) int smpi_shared_known_call(const char* func, const char* input) { char* loc = bprintf("%s:%s", func, input); - xbt_ex_t ex; int known = 0; - if (!calls) { - calls = xbt_dict_new_homogeneous(NULL); + if (calls==nullptr) { + calls = xbt_dict_new_homogeneous(nullptr); } - TRY { + try { xbt_dict_get(calls, loc); /* Succeed or throw */ known = 1; - } - TRY_CLEANUP { xbt_free(loc); } - CATCH(ex) { + catch (xbt_ex& ex) { + xbt_free(loc); if (ex.category != not_found_error) - RETHROW; - xbt_ex_free(ex); + throw; + } + catch(...) { + xbt_free(loc); + throw; } return known; } @@ -577,31 +667,30 @@ void* smpi_shared_get_call(const char* func, const char* input) { char* loc = bprintf("%s:%s", func, input); void* data; - if(!calls) { - calls = xbt_dict_new_homogeneous(NULL); + if(calls==nullptr) { + calls = xbt_dict_new_homogeneous(nullptr); } data = xbt_dict_get(calls, loc); - free(loc); + xbt_free(loc); return data; } void* smpi_shared_set_call(const char* func, const char* input, void* data) { char* loc = bprintf("%s:%s", func, input); - if(!calls) { - calls = xbt_dict_new_homogeneous(NULL); + if(calls==0) { + calls = xbt_dict_new_homogeneous(nullptr); } - xbt_dict_set(calls, loc, data, NULL); - free(loc); + xbt_dict_set(calls, loc, data, nullptr); + xbt_free(loc); return data; } -#define TOPAGE(addr) (void *)(((unsigned long)(addr) / xbt_pagesize) * xbt_pagesize) /** Map a given SMPI privatization segment (make a SMPI process active) */ -void smpi_switch_data_segment(int dest){ - if (smpi_loaded_page==dest)//no need to switch either - return; +void smpi_switch_data_segment(int dest) { + if (smpi_loaded_page == dest)//no need to switch, we've already loaded the one we want + return; // So the job: smpi_really_switch_data_segment(dest); @@ -636,13 +725,13 @@ void smpi_really_switch_data_segment(int dest) { int smpi_is_privatisation_file(char* file) { - return strncmp("/dev/shm/my-buffer-", file, 19) == 0; + return strncmp("/dev/shm/my-buffer-", file, std::strlen("/dev/shm/my-buffer-")) == 0; } void smpi_initialize_global_memory_segments(){ #if !HAVE_PRIVATIZATION - smpi_privatize_global_variables=0; + smpi_privatize_global_variables=false; xbt_die("You are trying to use privatization on a system that does not support it. Don't."); return; #else @@ -652,20 +741,24 @@ void smpi_initialize_global_memory_segments(){ XBT_DEBUG ("bss+data segment found : size %d starting at %p", smpi_size_data_exe, smpi_start_data_exe ); if (smpi_size_data_exe == 0){//no need to switch - smpi_privatize_global_variables=0; + smpi_privatize_global_variables=false; return; } smpi_privatisation_regions = - (smpi_privatisation_region_t) malloc(smpi_process_count() * sizeof(struct s_smpi_privatisation_region)); + static_cast( xbt_malloc(smpi_process_count() * sizeof(struct s_smpi_privatisation_region))); for (int i=0; i< smpi_process_count(); i++){ //create SIMIX_process_count() mappings of this size with the same data inside - void *address = NULL; - char path[] = "/dev/shm/my-buffer-XXXXXX"; + int file_descriptor; + void *address = nullptr; + char path[24]; int status; - int file_descriptor= mkstemp (path); + do { + snprintf(path, sizeof(path), "/smpi-buffer-%06x", rand()%0xffffff); + file_descriptor = shm_open(path, O_RDWR|O_CREAT|O_EXCL, S_IRUSR|S_IWUSR); + } while (file_descriptor == -1 && errno == EEXIST); if (file_descriptor < 0) { if (errno==EMFILE) { xbt_die("Impossible to create temporary file for memory mapping: %s\n\ @@ -686,19 +779,19 @@ Ask the Internet about tutorials on how to increase the files limit such as: htt strerror(errno)); } - status = unlink (path); - if (status) - xbt_die("Impossible to unlink temporary file for memory mapping"); - status = ftruncate(file_descriptor, smpi_size_data_exe); if(status) xbt_die("Impossible to set the size of the temporary file for memory mapping"); /* Ask for a free region */ - address = mmap (NULL, smpi_size_data_exe, PROT_READ | PROT_WRITE, MAP_SHARED, file_descriptor, 0); + address = mmap (nullptr, smpi_size_data_exe, PROT_READ | PROT_WRITE, MAP_SHARED, file_descriptor, 0); if (address == MAP_FAILED) xbt_die("Couldn't find a free region for memory mapping"); + status = shm_unlink(path); + if (status) + xbt_die("Impossible to unlink temporary file for memory mapping"); + //initialize the values memcpy(address, TOPAGE(smpi_start_data_exe), smpi_size_data_exe); @@ -723,3 +816,32 @@ void smpi_destroy_global_memory_segments(){ xbt_free(smpi_privatisation_regions); #endif } + +extern "C" { /** These functions will be called from the user code **/ + smpi_trace_call_location_t* smpi_trace_get_call_location() { + return smpi_process_get_call_location(); + } + + void smpi_trace_set_call_location(const char* file, const int line) { + smpi_trace_call_location_t* loc = smpi_process_get_call_location(); + + loc->previous_filename = loc->filename; + loc->previous_linenumber = loc->linenumber; + loc->filename = file; + loc->linenumber = line; + } + + /** + * Required for Fortran bindings + */ + void smpi_trace_set_call_location_(const char* file, int* line) { + smpi_trace_set_call_location(file, *line); + } + + /** + * Required for Fortran if -fsecond-underscore is activated + */ + void smpi_trace_set_call_location__(const char* file, int* line) { + smpi_trace_set_call_location(file, *line); + } +}