X-Git-Url: http://info.iut-bm.univ-fcomte.fr/pub/gitweb/simgrid.git/blobdiff_plain/7b2fe943182bff869b3ae80333a4f2d2bf0fb7cf..bfc956026c22595af39ca5c73b7e250e16d85aea:/src/smpi/smpi_bench.c diff --git a/src/smpi/smpi_bench.c b/src/smpi/smpi_bench.c index 15fdb676a4..d35c50c8d9 100644 --- a/src/smpi/smpi_bench.c +++ b/src/smpi/smpi_bench.c @@ -69,18 +69,17 @@ xbt_dict_t allocs = NULL; /* Allocated on first use */ xbt_dict_t allocs_metadata = NULL; /* Allocated on first use */ xbt_dict_t samples = NULL; /* Allocated on first use */ xbt_dict_t calls = NULL; /* Allocated on first use */ -__thread int smpi_current_rank = 0; /* Updated after each MPI call */ double smpi_cpu_threshold; double smpi_running_power; -int* fds; -void** mappings; -int loaded_page = -1; +int smpi_loaded_page = -1; char* start_data_exe = NULL; int size_data_exe = 0; int smpi_privatize_global_variables; +smpi_privatisation_region_t smpi_privatisation_regions; + typedef struct { int fd; int count; @@ -118,7 +117,7 @@ static void* shm_map(int fd, size_t size, shared_data_t* data) { xbt_die("Could not map fd %d: %s", fd, strerror(errno)); } if(!allocs_metadata) { - allocs_metadata = xbt_dict_new_homogeneous(xbt_free); + allocs_metadata = xbt_dict_new_homogeneous(xbt_free_f); } snprintf(loc, PTR_STRLEN, "%p", mem); meta = xbt_new(shared_metadata_t, 1); @@ -186,63 +185,61 @@ void smpi_execute(double duration) } } -void switch_data_segment(int dest); +void smpi_switch_data_segment(int dest); void smpi_bench_begin(void) { - switch_data_segment(smpi_process_index()); + smpi_switch_data_segment(smpi_process_index()); xbt_os_threadtimer_start(smpi_process_timer()); - smpi_current_rank = smpi_process_index(); } void smpi_bench_end(void) { xbt_os_timer_t timer = smpi_process_timer(); xbt_os_threadtimer_stop(timer); -// switch_data_segment(smpi_process_count()); +// smpi_switch_data_segment(smpi_process_count()); if (smpi_process_get_sampling()) { XBT_CRITICAL("Cannot do recursive benchmarks."); XBT_CRITICAL("Are you trying to make a call to MPI within a SMPI_SAMPLE_ block?"); xbt_backtrace_display_current(); xbt_die("Aborting."); } - smpi_execute(xbt_os_timer_elapsed(timer)); + // Simulate the benchmarked computation unless disabled via command-line argument + if (sg_cfg_get_boolean("smpi/simulate_computation")) { + smpi_execute(xbt_os_timer_elapsed(timer)); + } } -unsigned int smpi_sleep(unsigned int secs) +/* Private sleep function used by smpi_sleep() and smpi_usleep() */ +static unsigned int private_sleep(double secs) { - smx_action_t action; - smpi_bench_end(); - double flops = (double) secs*simcall_host_get_speed(SIMIX_host_self()); - XBT_DEBUG("Sleep for: %f flops", flops); - action = simcall_host_execute("computation", SIMIX_host_self(), flops, 1, 0, 0); + XBT_DEBUG("Sleep for: %lf secs", secs); #ifdef HAVE_TRACING - simcall_set_category (action, TRACE_internal_smpi_get_category()); - #endif - simcall_host_execution_wait(action); + int rank = smpi_comm_rank(MPI_COMM_WORLD); + instr_extra_data extra = xbt_new0(s_instr_extra_data_t,1); + extra->type=TRACING_SLEEPING; + extra->sleep_duration=secs; + TRACE_smpi_sleeping_in(rank, extra); +#endif + simcall_process_sleep(secs); +#ifdef HAVE_TRACING + TRACE_smpi_sleeping_out(rank); +#endif smpi_bench_begin(); - return secs; + return 0; } -int smpi_usleep(useconds_t usecs) +unsigned int smpi_sleep(unsigned int secs) { - smx_action_t action; - - smpi_bench_end(); - - double flops = (double) (usecs/1000000.0)*simcall_host_get_speed(SIMIX_host_self()); - XBT_DEBUG("Sleep for: %f flops", flops); - action = simcall_host_execute("computation", SIMIX_host_self(), flops, 1, 0, 0); - #ifdef HAVE_TRACING - simcall_set_category (action, TRACE_internal_smpi_get_category()); - #endif - simcall_host_execution_wait(action); + return private_sleep((double)secs); +} - smpi_bench_begin(); - return 0; +int smpi_usleep(useconds_t usecs) +{ + return (int)private_sleep((double)usecs / 1000000.0); } @@ -507,7 +504,7 @@ void smpi_shared_free(void *ptr) shared_metadata_t* meta; shared_data_t* data; if (sg_cfg_get_boolean("smpi/use_shared_malloc")){ - + if (!allocs) { XBT_WARN("Cannot free: nothing was allocated"); return; @@ -605,28 +602,27 @@ void* smpi_shared_set_call(const char* func, const char* input, void* data) { -void switch_data_segment(int dest){ +void smpi_switch_data_segment(int dest){ if(size_data_exe == 0)//no need to switch return; - if (loaded_page==dest)//no need to switch either + if (smpi_loaded_page==dest)//no need to switch either return; - #ifdef HAVE_MMAP int i; - if(loaded_page==-1){//initial switch, do the copy from the real page here + if(smpi_loaded_page==-1){//initial switch, do the copy from the real page here for (i=0; i< SIMIX_process_count(); i++){ - memcpy(mappings[i],TOPAGE(start_data_exe),size_data_exe); + memcpy(smpi_privatisation_regions[i].address,TOPAGE(start_data_exe),size_data_exe); } } - int current= fds[dest]; + int current = smpi_privatisation_regions[dest].file_descriptor; XBT_VERB("Switching data frame to the one of process %d", dest); void* tmp = mmap (TOPAGE(start_data_exe), size_data_exe, PROT_READ | PROT_WRITE, MAP_FIXED | MAP_SHARED, current, 0); if (tmp != TOPAGE(start_data_exe)) xbt_die("Couldn't map the new region"); - loaded_page=dest; + smpi_loaded_page=dest; #endif } @@ -687,7 +683,7 @@ void smpi_get_executable_global_size(){ found++; }else if(strcmp(lfields[1], ".bss") == 0){ //the beginning of bss is not exactly the end of data if not aligned, grow bss reported size accordingly - //TODO : check if this is OK, as some segments may be inserted between them.. + //TODO : check if this is OK, as some segments may be inserted between them.. size_bss_binary = ((char*) strtoul(lfields[4], NULL, 16) - (start_data_exe + size_data_binary)) + strtoul(lfields[2], NULL, 16); found++; @@ -721,18 +717,19 @@ void smpi_initialize_global_memory_segments(){ return; } - fds= (int*)xbt_malloc((smpi_process_count())*sizeof(int)); - mappings= (void**)xbt_malloc((smpi_process_count())*sizeof(void*)); - + smpi_privatisation_regions = (smpi_privatisation_region_t) malloc( + sizeof(struct s_smpi_privatisation_region) * sizeof(int)); for (i=0; i< SIMIX_process_count(); i++){ //create SIMIX_process_count() mappings of this size with the same data inside - void *address = NULL, *tmp = NULL; + void *address = NULL; char path[] = "/dev/shm/my-buffer-XXXXXX"; int status; + int file_descriptor= mkstemp (path); if (file_descriptor < 0) xbt_die("Impossible to create temporary file for memory mapping"); + status = unlink (path); if (status) xbt_die("Impossible to unlink temporary file for memory mapping"); @@ -742,21 +739,16 @@ void smpi_initialize_global_memory_segments(){ xbt_die("Impossible to set the size of the temporary file for memory mapping"); /* Ask for a free region */ - address = mmap (NULL, size_data_exe, PROT_NONE, MAP_ANONYMOUS | MAP_PRIVATE, -1, 0); - + address = mmap (NULL, size_data_exe, PROT_READ | PROT_WRITE, MAP_SHARED, file_descriptor, 0); if (address == MAP_FAILED) xbt_die("Couldn't find a free region for memory mapping"); - tmp = mmap (address, size_data_exe, PROT_READ | PROT_WRITE, MAP_FIXED | MAP_SHARED, file_descriptor, 0); - - if (tmp != address) - xbt_die("Couldn't obtain the right address"); //initialize the values memcpy(address,TOPAGE(start_data_exe),size_data_exe); //store the address of the mapping for further switches - fds[i]=file_descriptor; - mappings[i]= address; + smpi_privatisation_regions[i].file_descriptor = file_descriptor; + smpi_privatisation_regions[i].address = address; } #endif @@ -769,15 +761,13 @@ void smpi_destroy_global_memory_segments(){ #ifdef HAVE_MMAP int i; for (i=0; i< smpi_process_count(); i++){ - if(munmap(mappings[i],size_data_exe) < 0) { - XBT_WARN("Unmapping of fd %d failed: %s", fds[i], strerror(errno)); + if(munmap(smpi_privatisation_regions[i].address,size_data_exe) < 0) { + XBT_WARN("Unmapping of fd %d failed: %s", + smpi_privatisation_regions[i].file_descriptor, strerror(errno)); } - close(fds[i]); + close(smpi_privatisation_regions[i].file_descriptor); } - xbt_free(mappings); - xbt_free(fds); - + xbt_free(smpi_privatisation_regions); #endif } -