X-Git-Url: http://info.iut-bm.univ-fcomte.fr/pub/gitweb/simgrid.git/blobdiff_plain/b61e0df4e0f5d85fbc1df364660fc71d9461adc6..50b36cfb6864e719576327d1289cf9ba31d652da:/src/mc/mc_checkpoint.c diff --git a/src/mc/mc_checkpoint.c b/src/mc/mc_checkpoint.c index cece2e82ad..3d92e45243 100644 --- a/src/mc/mc_checkpoint.c +++ b/src/mc/mc_checkpoint.c @@ -5,13 +5,20 @@ * under the terms of the license (GNU LGPL) which comes with this package. */ #define _GNU_SOURCE -#define UNW_LOCAL_ONLY + +#include #include #include +#include + +#include "internal_config.h" +#include "mc_memory_map.h" #include "mc_private.h" #include "xbt/module.h" #include +#include "../smpi/private.h" +#include #include "xbt/mmalloc/mmprivate.h" @@ -21,213 +28,319 @@ #include #include "mc_private.h" +#include + +#include "mc_snapshot.h" +#include "mc_object_info.h" +#include "mc_mmu.h" +#include "mc_unw.h" +#include "mc_protocol.h" +#include "mc_smx.h" XBT_LOG_NEW_DEFAULT_SUBCATEGORY(mc_checkpoint, mc, "Logging specific to mc_checkpoint"); -char *libsimgrid_path; - /************************************ Free functions **************************************/ /*****************************************************************************************/ -static void MC_snapshot_stack_free(mc_snapshot_stack_t s){ - if(s){ +static void MC_snapshot_stack_free(mc_snapshot_stack_t s) +{ + if (s) { xbt_dynar_free(&(s->local_variables)); xbt_dynar_free(&(s->stack_frames)); + mc_unw_destroy_context(s->context); + xbt_free(s->context); xbt_free(s); } } -static void MC_snapshot_stack_free_voidp(void *s){ - MC_snapshot_stack_free((mc_snapshot_stack_t) * (void **) s); +static void MC_snapshot_stack_free_voidp(void *s) +{ + mc_snapshot_stack_t stack = (mc_snapshot_stack_t) * (void **) s; + MC_snapshot_stack_free(stack); } -static void local_variable_free(local_variable_t v){ +static void local_variable_free(local_variable_t v) +{ xbt_free(v->name); xbt_free(v); } -static void local_variable_free_voidp(void *v){ +static void local_variable_free_voidp(void *v) +{ local_variable_free((local_variable_t) * (void **) v); } -static void MC_region_destroy(mc_mem_region_t reg) +void MC_region_destroy(mc_mem_region_t region) { - xbt_free(reg->data); - xbt_free(reg); + if (!region) + return; + switch(region->storage_type) { + case MC_REGION_STORAGE_TYPE_NONE: + break; + case MC_REGION_STORAGE_TYPE_FLAT: + xbt_free(region->flat.data); + break; + case MC_REGION_STORAGE_TYPE_CHUNKED: + mc_free_page_snapshot_region(region->chunked.page_numbers, mc_page_count(region->size)); + xbt_free(region->chunked.page_numbers); + break; + case MC_REGION_STORAGE_TYPE_PRIVATIZED: + { + size_t regions_count = region->privatized.regions_count; + for (size_t i=0; i!=regions_count; ++i) { + MC_region_destroy(region->privatized.regions[i]); + } + free(region->privatized.regions); + break; + } + } + xbt_free(region); } -void MC_free_snapshot(mc_snapshot_t snapshot){ - unsigned int i; - for(i=0; i < NB_REGIONS; i++) - MC_region_destroy(snapshot->regions[i]); - +void MC_free_snapshot(mc_snapshot_t snapshot) +{ + for (size_t i = 0; i < snapshot->snapshot_regions_count; i++) { + MC_region_destroy(snapshot->snapshot_regions[i]); + } + xbt_free(snapshot->snapshot_regions); xbt_free(snapshot->stack_sizes); xbt_dynar_free(&(snapshot->stacks)); xbt_dynar_free(&(snapshot->to_ignore)); + xbt_dynar_free(&snapshot->ignored_data); xbt_free(snapshot); } - /******************************* Snapshot regions ********************************/ /*********************************************************************************/ -static mc_mem_region_t MC_region_new(int type, void *start_addr, size_t size) +static mc_mem_region_t mc_region_new_dense( + mc_region_type_t region_type, + void *start_addr, void* permanent_addr, size_t size, mc_mem_region_t ref_reg) { - mc_mem_region_t new_reg = xbt_new(s_mc_mem_region_t, 1); - new_reg->start_addr = start_addr; - new_reg->size = size; - new_reg->data = xbt_malloc(size); - memcpy(new_reg->data, start_addr, size); - - XBT_DEBUG("New region : type : %d, data : %p (real addr %p), size : %zu", type, new_reg->data, start_addr, size); - - return new_reg; + mc_mem_region_t region = xbt_new(s_mc_mem_region_t, 1); + region->region_type = region_type; + region->storage_type = MC_REGION_STORAGE_TYPE_FLAT; + region->start_addr = start_addr; + region->permanent_addr = permanent_addr; + region->size = size; + region->flat.data = xbt_malloc(size); + MC_process_read(&mc_model_checker->process, MC_ADDRESS_SPACE_READ_FLAGS_NONE, + region->flat.data, permanent_addr, size, + MC_PROCESS_INDEX_DISABLED); + XBT_DEBUG("New region : type : %d, data : %p (real addr %p), size : %zu", + region_type, region->flat.data, permanent_addr, size); + return region; } -static void MC_region_restore(mc_mem_region_t reg) +/** @brief Take a snapshot of a given region + * + * @param type + * @param start_addr Address of the region in the simulated process + * @param permanent_addr Permanent address of this data (for privatized variables, this is the virtual address of the privatized mapping) + * @param size Size of the data* + * @param ref_reg Reference corresponding region + */ +static mc_mem_region_t MC_region_new(mc_region_type_t type, void *start_addr, void* permanent_addr, size_t size, mc_mem_region_t ref_reg) { - /*FIXME: check if start_addr is still mapped, if it is not, then map it - before copying the data */ - - memcpy(reg->start_addr, reg->data, reg->size); - return; + if (_sg_mc_sparse_checkpoint) { + return mc_region_new_sparse(type, start_addr, permanent_addr, size, ref_reg); + } else { + return mc_region_new_dense(type, start_addr, permanent_addr, size, ref_reg); + } } -static void MC_snapshot_add_region(mc_snapshot_t snapshot, int type, void *start_addr, size_t size) +/** @brief Restore a region from a snapshot + * + * If we are using per page snapshots, it is possible to use the reference + * region in order to do an incremental restoration of the region: the + * softclean pages which are shared between the two snapshots do not need + * to be restored. + * + * @param reg Target region + * @param reg_reg Current region (if not NULL), used for lazy per page restoration + */ +static void MC_region_restore(mc_mem_region_t region, mc_mem_region_t ref_region) { - mc_mem_region_t new_reg = MC_region_new(type, start_addr, size); - snapshot->regions[type] = new_reg; - return; -} - -static void MC_get_memory_regions(mc_snapshot_t snapshot){ - - void* start_heap = ((xbt_mheap_t)std_heap)->base; - void* end_heap = ((xbt_mheap_t)std_heap)->breakval; - MC_snapshot_add_region(snapshot, 0, start_heap, (char*) end_heap - (char*) start_heap); - snapshot->heap_bytes_used = mmalloc_get_bytes_used(std_heap); - - MC_snapshot_add_region(snapshot, 1, mc_libsimgrid_info->start_rw, mc_libsimgrid_info->end_rw - mc_libsimgrid_info->start_rw); - MC_snapshot_add_region(snapshot, 2, mc_binary_info->start_rw, mc_binary_info->end_rw - mc_binary_info->start_rw); -} - -/** @brief Finds the range of the different memory segments and binary paths */ -void MC_init_memory_map_info(){ - - unsigned int i = 0; - s_map_region_t reg; - memory_map_t maps = MC_get_memory_map(); - - maestro_stack_start = NULL; - maestro_stack_end = NULL; - libsimgrid_path = NULL; - - while (i < maps->mapsize) { - reg = maps->regions[i]; - if (maps->regions[i].pathname == NULL) { - // Nothing to do - } - else if ((reg.prot & PROT_WRITE) && !memcmp(maps->regions[i].pathname, "[stack]", 7)){ - maestro_stack_start = reg.start_addr; - maestro_stack_end = reg.end_addr; - } else if ((reg.prot & PROT_READ) && (reg.prot & PROT_EXEC) && !memcmp(basename(maps->regions[i].pathname), "libsimgrid", 10)){ - if(libsimgrid_path == NULL) - libsimgrid_path = strdup(maps->regions[i].pathname); + switch(region->storage_type) { + case MC_REGION_STORAGE_TYPE_NONE: + default: + xbt_die("Storage type not supported"); + break; + + case MC_REGION_STORAGE_TYPE_FLAT: + MC_process_write(&mc_model_checker->process, region->flat.data, + region->permanent_addr, region->size); + break; + + case MC_REGION_STORAGE_TYPE_CHUNKED: + mc_region_restore_sparse(&mc_model_checker->process, region, ref_region); + break; + + case MC_REGION_STORAGE_TYPE_PRIVATIZED: + { + bool has_ref_regions = ref_region && + ref_region->storage_type == MC_REGION_STORAGE_TYPE_PRIVATIZED; + size_t process_count = region->privatized.regions_count; + for (size_t i = 0; i < process_count; i++) { + MC_region_restore(region->privatized.regions[i], + has_ref_regions ? ref_region->privatized.regions[i] : NULL); + } + break; } - i++; } - - xbt_assert(maestro_stack_start, "maestro_stack_start"); - xbt_assert(maestro_stack_end, "maestro_stack_end"); - xbt_assert(libsimgrid_path, "libsimgrid_path&"); - - MC_free_memory_map(maps); - } -/** \brief Fill/lookup the "subtype" field. - */ -static void MC_resolve_subtype(mc_object_info_t info, dw_type_t type) { - - if(type->dw_type_id==NULL) - return; - type->subtype = xbt_dict_get_or_null(info->types, type->dw_type_id); - if(type->subtype==NULL) - return; - if(type->subtype->byte_size != 0) - return; - if(type->subtype->name==NULL) - return; - // Try to find a more complete description of the type: - // We need to fix in order to support C++. +// FIXME, multiple privatisation regions +// FIXME, cross-process +static inline +void* MC_privatization_address(mc_process_t process, int process_index) +{ + xbt_assert(process_index >= 0); + return smpi_privatisation_regions[process_index].address; +} - dw_type_t subtype = xbt_dict_get_or_null(info->full_types_by_name, type->subtype->name); - if(subtype!=NULL) { - type->subtype = subtype; +static mc_mem_region_t MC_region_new_privatized( + mc_region_type_t region_type, void *start_addr, void* permanent_addr, size_t size, + mc_mem_region_t ref_reg) +{ + size_t process_count = MC_smpi_process_count(); + mc_mem_region_t region = xbt_new(s_mc_mem_region_t, 1); + region->region_type = region_type; + region->storage_type = MC_REGION_STORAGE_TYPE_PRIVATIZED; + region->start_addr = start_addr; + region->permanent_addr = permanent_addr; + region->size = size; + region->privatized.regions_count = process_count; + region->privatized.regions = xbt_new(mc_mem_region_t, process_count); + + for (size_t i = 0; i < process_count; i++) { + mc_mem_region_t ref_subreg = NULL; + if (ref_reg && ref_reg->storage_type == MC_REGION_STORAGE_TYPE_PRIVATIZED) + ref_subreg = ref_reg->privatized.regions[i]; + region->privatized.regions[i] = + MC_region_new(region_type, start_addr, + MC_privatization_address(&mc_model_checker->process, i), size, + ref_subreg); } + return region; } -void MC_post_process_types(mc_object_info_t info) { - xbt_dict_cursor_t cursor = NULL; - char *origin; - dw_type_t type; +static void MC_snapshot_add_region(int index, mc_snapshot_t snapshot, mc_region_type_t type, + mc_object_info_t object_info, + void *start_addr, void* permanent_addr, size_t size) +{ + if (type == MC_REGION_TYPE_DATA) + xbt_assert(object_info, "Missing object info for object."); + else if (type == MC_REGION_TYPE_HEAP) + xbt_assert(!object_info, "Unexpected object info for heap region."); + + mc_mem_region_t ref_reg = NULL; + if (mc_model_checker->parent_snapshot) + ref_reg = mc_model_checker->parent_snapshot->snapshot_regions[index]; + + mc_mem_region_t region; + const bool privatization_aware = MC_object_info_is_privatized(object_info); + if (privatization_aware && MC_smpi_process_count()) + region = MC_region_new_privatized(type, start_addr, permanent_addr, size, ref_reg); + else + region = MC_region_new(type, start_addr, permanent_addr, size, ref_reg); + + region->object_info = object_info; + snapshot->snapshot_regions[index] = region; + return; +} - // Lookup "subtype" field: - xbt_dict_foreach(info->types, cursor, origin, type){ - MC_resolve_subtype(info, type); +static void MC_get_memory_regions(mc_process_t process, mc_snapshot_t snapshot) +{ + const size_t n = process->object_infos_size; + snapshot->snapshot_regions_count = n + 1; + snapshot->snapshot_regions = xbt_new0(mc_mem_region_t, n + 1); + + for (size_t i = 0; i!=n; ++i) { + mc_object_info_t object_info = process->object_infos[i]; + MC_snapshot_add_region(i, snapshot, MC_REGION_TYPE_DATA, object_info, + object_info->start_rw, object_info->start_rw, + object_info->end_rw - object_info->start_rw); + } - dw_type_t member; - unsigned int i = 0; - if(type->members!=NULL) xbt_dynar_foreach(type->members, i, member) { - MC_resolve_subtype(info, member); - } + xbt_mheap_t heap = MC_process_get_heap(process); + void *start_heap = heap->base; + void *end_heap = heap->breakval; + + MC_snapshot_add_region(n, snapshot, MC_REGION_TYPE_HEAP, NULL, + start_heap, start_heap, + (char *) end_heap - (char *) start_heap); + snapshot->heap_bytes_used = mmalloc_get_bytes_used_remote( + heap->heaplimit, + MC_process_get_malloc_info(process)); + +#ifdef HAVE_SMPI + if (smpi_privatize_global_variables && MC_smpi_process_count()) { + // FIXME, cross-process + snapshot->privatization_index = smpi_loaded_page; + } else +#endif + { + snapshot->privatization_index = MC_PROCESS_INDEX_MISSING; } } /** \brief Fills the position of the segments (executable, read-only, read/write). * - * TODO, use dl_iterate_phdr to be more robust + * `dl_iterate_phdr` would be more robust but would not work in cross-process. * */ -void MC_find_object_address(memory_map_t maps, mc_object_info_t result) { - +void MC_find_object_address(memory_map_t maps, mc_object_info_t result) +{ unsigned int i = 0; s_map_region_t reg; - const char* name = basename(result->file_name); + const char *name = basename(result->file_name); while (i < maps->mapsize) { reg = maps->regions[i]; - if (maps->regions[i].pathname == NULL || strcmp(basename(maps->regions[i].pathname), name)) { + if (maps->regions[i].pathname == NULL + || strcmp(basename(maps->regions[i].pathname), name)) { // Nothing to do - } - else if ((reg.prot & PROT_WRITE)){ - xbt_assert(!result->start_rw, - "Multiple read-write segments for %s, not supported", - maps->regions[i].pathname); - result->start_rw = reg.start_addr; - result->end_rw = reg.end_addr; - // .bss is usually after the .data: - s_map_region_t* next = &(maps->regions[i+1]); - if(next->pathname == NULL && (next->prot & PROT_WRITE) && next->start_addr == reg.end_addr) { - result->end_rw = maps->regions[i+1].end_addr; - } - } else if ((reg.prot & PROT_READ) && (reg.prot & PROT_EXEC)){ - xbt_assert(!result->start_exec, - "Multiple executable segments for %s, not supported", - maps->regions[i].pathname); - result->start_exec = reg.start_addr; - result->end_exec = reg.end_addr; - } - else if((reg.prot & PROT_READ) && !(reg.prot & PROT_EXEC)) { - xbt_assert(!result->start_ro, - "Multiple read only segments for %s, not supported", - maps->regions[i].pathname); - result->start_ro = reg.start_addr; - result->end_ro = reg.end_addr; + } else if ((reg.prot & PROT_WRITE)) { + xbt_assert(!result->start_rw, + "Multiple read-write segments for %s, not supported", + maps->regions[i].pathname); + result->start_rw = reg.start_addr; + result->end_rw = reg.end_addr; + // .bss is usually after the .data: + s_map_region_t *next = &(maps->regions[i + 1]); + if (next->pathname == NULL && (next->prot & PROT_WRITE) + && next->start_addr == reg.end_addr) { + result->end_rw = maps->regions[i + 1].end_addr; + } + } else if ((reg.prot & PROT_READ) && (reg.prot & PROT_EXEC)) { + xbt_assert(!result->start_exec, + "Multiple executable segments for %s, not supported", + maps->regions[i].pathname); + result->start_exec = reg.start_addr; + result->end_exec = reg.end_addr; + } else if ((reg.prot & PROT_READ) && !(reg.prot & PROT_EXEC)) { + xbt_assert(!result->start_ro, + "Multiple read only segments for %s, not supported", + maps->regions[i].pathname); + result->start_ro = reg.start_addr; + result->end_ro = reg.end_addr; } i++; } + result->start = result->start_rw; + if ((const void*) result->start_ro > result->start) + result->start = result->start_ro; + if ((const void*) result->start_exec > result->start) + result->start = result->start_exec; + + result->end = result->end_rw; + if (result->end_ro && (const void*) result->end_ro < result->end) + result->end = result->end_ro; + if (result->end_exec && (const void*) result->end_exec > result->end) + result->end = result->end_exec; + xbt_assert(result->file_name); xbt_assert(result->start_rw); xbt_assert(result->start_exec); @@ -245,28 +358,35 @@ void MC_find_object_address(memory_map_t maps, mc_object_info_t result) { * \param ip Instruction pointer * \return true if the variable is valid * */ -static bool mc_valid_variable(dw_variable_t var, dw_frame_t frame, const void* ip) { +static bool mc_valid_variable(dw_variable_t var, dw_frame_t scope, + const void *ip) +{ // The variable is not yet valid: - if((const void*)((const char*) frame->low_pc + var->start_scope) > ip) + if ((const void *) ((const char *) scope->low_pc + var->start_scope) > ip) return false; else return true; } -static void mc_fill_local_variables_values(mc_stack_frame_t stack_frame, dw_frame_t scope, xbt_dynar_t result) { - void* ip = (void*) stack_frame->ip; - if(ip < scope->low_pc || ip>= scope->high_pc) +static void mc_fill_local_variables_values(mc_stack_frame_t stack_frame, + dw_frame_t scope, int process_index, xbt_dynar_t result) +{ + mc_process_t process = &mc_model_checker->process; + + void *ip = (void *) stack_frame->ip; + if (ip < scope->low_pc || ip >= scope->high_pc) return; unsigned cursor = 0; dw_variable_t current_variable; - xbt_dynar_foreach(scope->variables, cursor, current_variable){ + xbt_dynar_foreach(scope->variables, cursor, current_variable) { - if(!mc_valid_variable(current_variable, stack_frame->frame, (void*) stack_frame->ip)) + if (!mc_valid_variable(current_variable, scope, (void *) stack_frame->ip)) continue; int region_type; - if((long)stack_frame->ip > (long)mc_libsimgrid_info->start_exec) + // FIXME, get rid of `region_type` + if ((long) stack_frame->ip > (long) process->libsimgrid_info->start_exec) region_type = 1; else region_type = 2; @@ -276,15 +396,30 @@ static void mc_fill_local_variables_values(mc_stack_frame_t stack_frame, dw_fram new_var->ip = stack_frame->ip; new_var->name = xbt_strdup(current_variable->name); new_var->type = current_variable->type; - new_var->region= region_type; + new_var->region = region_type; - /* if(current_variable->address!=NULL) { + if (current_variable->address != NULL) { new_var->address = current_variable->address; - } else */ - if(current_variable->locations.size != 0){ - new_var->address = (void*) mc_dwarf_resolve_locations(¤t_variable->locations, - current_variable->object_info, - &(stack_frame->unw_cursor), (void*)stack_frame->frame_base, NULL); + } else if (current_variable->locations.size != 0) { + s_mc_location_t location; + // FIXME, cross-process support + mc_dwarf_resolve_locations(&location, ¤t_variable->locations, + current_variable->object_info, + &(stack_frame->unw_cursor), + (void *) stack_frame->frame_base, + NULL, process_index); + + switch(mc_get_location_type(&location)) { + case MC_LOCATION_TYPE_ADDRESS: + new_var->address = location.memory_location; + break; + case MC_LOCATION_TYPE_REGISTER: + default: + xbt_die("Cannot handle non-address variable"); + } + + } else { + xbt_die("No address"); } xbt_dynar_push(result, &new_var); @@ -293,69 +428,91 @@ static void mc_fill_local_variables_values(mc_stack_frame_t stack_frame, dw_fram // Recursive processing of nested scopes: dw_frame_t nested_scope = NULL; xbt_dynar_foreach(scope->scopes, cursor, nested_scope) { - mc_fill_local_variables_values(stack_frame, nested_scope, result); + mc_fill_local_variables_values(stack_frame, nested_scope, process_index, result); } } -static xbt_dynar_t MC_get_local_variables_values(xbt_dynar_t stack_frames){ +static xbt_dynar_t MC_get_local_variables_values(xbt_dynar_t stack_frames, int process_index) +{ unsigned cursor1 = 0; mc_stack_frame_t stack_frame; - xbt_dynar_t variables = xbt_dynar_new(sizeof(local_variable_t), local_variable_free_voidp); + xbt_dynar_t variables = + xbt_dynar_new(sizeof(local_variable_t), local_variable_free_voidp); - xbt_dynar_foreach(stack_frames,cursor1,stack_frame) { - mc_fill_local_variables_values(stack_frame, stack_frame->frame, variables); + xbt_dynar_foreach(stack_frames, cursor1, stack_frame) { + mc_fill_local_variables_values(stack_frame, stack_frame->frame, process_index, variables); } return variables; } -static void MC_stack_frame_free_voipd(void *s){ - mc_stack_frame_t stack_frame = *(mc_stack_frame_t*)s; - if(stack_frame) { +static void MC_stack_frame_free_voipd(void *s) +{ + mc_stack_frame_t stack_frame = *(mc_stack_frame_t *) s; + if (stack_frame) { xbt_free(stack_frame->frame_name); xbt_free(stack_frame); } } -static xbt_dynar_t MC_unwind_stack_frames(void *stack_context) { - xbt_dynar_t result = xbt_dynar_new(sizeof(mc_stack_frame_t), MC_stack_frame_free_voipd); +static xbt_dynar_t MC_unwind_stack_frames(mc_unw_context_t stack_context) +{ + mc_process_t process = &mc_model_checker->process; + xbt_dynar_t result = + xbt_dynar_new(sizeof(mc_stack_frame_t), MC_stack_frame_free_voipd); unw_cursor_t c; - int ret; - for(ret = unw_init_local(&c, (unw_context_t *)stack_context); ret >= 0; ret = unw_step(&c)){ - mc_stack_frame_t stack_frame = xbt_new(s_mc_stack_frame_t, 1); - xbt_dynar_push(result, &stack_frame); + // TODO, check condition check (unw_init_local==0 means end of frame) + if (mc_unw_init_cursor(&c, stack_context) != 0) { - stack_frame->unw_cursor = c; + xbt_die("Could not initialize stack unwinding"); - unw_word_t ip, sp; + } else + while (1) { - unw_get_reg(&c, UNW_REG_IP, &ip); - unw_get_reg(&c, UNW_REG_SP, &sp); + mc_stack_frame_t stack_frame = xbt_new(s_mc_stack_frame_t, 1); + xbt_dynar_push(result, &stack_frame); - stack_frame->ip = ip; - stack_frame->sp = sp; + stack_frame->unw_cursor = c; - // TODO, use real addresses in frame_t instead of fixing it here + unw_word_t ip, sp; - dw_frame_t frame = MC_find_function_by_ip((void*) ip); - stack_frame->frame = frame; + unw_get_reg(&c, UNW_REG_IP, &ip); + unw_get_reg(&c, UNW_REG_SP, &sp); - if(frame) { - stack_frame->frame_name = xbt_strdup(frame->name); - stack_frame->frame_base = (unw_word_t)mc_find_frame_base(frame, frame->object_info, &c); - } else { - stack_frame->frame_base = 0; - } + stack_frame->ip = ip; + stack_frame->sp = sp; - /* Stop before context switch with maestro */ - if(frame!=NULL && frame->name!=NULL && !strcmp(frame->name, "smx_ctx_sysv_wrapper")) - break; - } + // TODO, use real addresses in frame_t instead of fixing it here + + dw_frame_t frame = MC_process_find_function(process, (void *) ip); + stack_frame->frame = frame; + + if (frame) { + stack_frame->frame_name = xbt_strdup(frame->name); + stack_frame->frame_base = + (unw_word_t) mc_find_frame_base(frame, frame->object_info, &c); + } else { + stack_frame->frame_base = 0; + stack_frame->frame_name = NULL; + } + + /* Stop before context switch with maestro */ + if (frame != NULL && frame->name != NULL + && !strcmp(frame->name, "smx_ctx_sysv_wrapper")) + break; - if(xbt_dynar_length(result) == 0){ + int ret = unw_step(&c); + if (ret == 0) { + xbt_die("Unexpected end of stack."); + } else if (ret < 0) { + xbt_die("Error while unwinding stack"); + } + } + + if (xbt_dynar_length(result) == 0) { XBT_INFO("unw_init_local failed"); xbt_abort(); } @@ -363,42 +520,60 @@ static xbt_dynar_t MC_unwind_stack_frames(void *stack_context) { return result; }; -static xbt_dynar_t MC_take_snapshot_stacks(mc_snapshot_t *snapshot, void *heap){ +static xbt_dynar_t MC_take_snapshot_stacks(mc_snapshot_t * snapshot) +{ - xbt_dynar_t res = xbt_dynar_new(sizeof(s_mc_snapshot_stack_t), MC_snapshot_stack_free_voidp); + xbt_dynar_t res = + xbt_dynar_new(sizeof(s_mc_snapshot_stack_t), + MC_snapshot_stack_free_voidp); unsigned int cursor = 0; stack_region_t current_stack; - - xbt_dynar_foreach(stacks_areas, cursor, current_stack){ + + // FIXME, cross-process support (stack_areas) + xbt_dynar_foreach(stacks_areas, cursor, current_stack) { mc_snapshot_stack_t st = xbt_new(s_mc_snapshot_stack_t, 1); - st->stack_frames = MC_unwind_stack_frames(current_stack->context); - st->local_variables = MC_get_local_variables_values(st->stack_frames); + + unw_context_t* original_context = (unw_context_t*) current_stack->context; + + st->context = xbt_new0(s_mc_unw_context_t, 1); + if (mc_unw_init_context(st->context, &mc_model_checker->process, + original_context) < 0) { + xbt_die("Could not initialise the libunwind context."); + } + + st->stack_frames = MC_unwind_stack_frames(st->context); + st->local_variables = MC_get_local_variables_values(st->stack_frames, current_stack->process_index); + st->process_index = current_stack->process_index; unw_word_t sp = xbt_dynar_get_as(st->stack_frames, 0, mc_stack_frame_t)->sp; - st->stack_pointer = ((char *)heap + (size_t)(((char *)((long)sp) - (char*)std_heap))); - st->real_address = current_stack->address; xbt_dynar_push(res, &st); - (*snapshot)->stack_sizes = xbt_realloc((*snapshot)->stack_sizes, (cursor + 1) * sizeof(size_t)); - (*snapshot)->stack_sizes[cursor] = current_stack->size - ((char *)st->stack_pointer - (char *)((char *)heap + ((char *)current_stack->address - (char *)std_heap))); + (*snapshot)->stack_sizes = + xbt_realloc((*snapshot)->stack_sizes, (cursor + 1) * sizeof(size_t)); + (*snapshot)->stack_sizes[cursor] = + (char*) current_stack->address + current_stack->size - (char*) sp; } return res; } -static xbt_dynar_t MC_take_snapshot_ignore(){ - - if(mc_heap_comparison_ignore == NULL) +// FIXME, cross-process support (mc_heap_comparison_ignore) +static xbt_dynar_t MC_take_snapshot_ignore() +{ + + if (mc_heap_comparison_ignore == NULL) return NULL; - xbt_dynar_t cpy = xbt_dynar_new(sizeof(mc_heap_ignore_region_t), heap_ignore_region_free_voidp); + xbt_dynar_t cpy = + xbt_dynar_new(sizeof(mc_heap_ignore_region_t), + heap_ignore_region_free_voidp); unsigned int cursor = 0; mc_heap_ignore_region_t current_region; - xbt_dynar_foreach(mc_heap_comparison_ignore, cursor, current_region){ + xbt_dynar_foreach(mc_heap_comparison_ignore, cursor, current_region) { mc_heap_ignore_region_t new_region = NULL; new_region = xbt_new0(s_mc_heap_ignore_region_t, 1); new_region->address = current_region->address; @@ -412,110 +587,267 @@ static xbt_dynar_t MC_take_snapshot_ignore(){ } -static void MC_dump_checkpoint_ignore(mc_snapshot_t snapshot){ - +static void mc_free_snapshot_ignored_data_pvoid(void* data) { + mc_snapshot_ignored_data_t ignored_data = (mc_snapshot_ignored_data_t) data; + free(ignored_data->data); +} + +static void MC_snapshot_handle_ignore(mc_snapshot_t snapshot) +{ + xbt_assert(snapshot->process); + snapshot->ignored_data = xbt_dynar_new(sizeof(s_mc_snapshot_ignored_data_t), mc_free_snapshot_ignored_data_pvoid); + + // Copy the memory: unsigned int cursor = 0; mc_checkpoint_ignore_region_t region; - size_t offset; - - xbt_dynar_foreach(mc_checkpoint_ignore, cursor, region){ - if(region->addr > snapshot->regions[0]->start_addr && (char *)(region->addr) < (char *)snapshot->regions[0]->start_addr + STD_HEAP_SIZE){ - offset = (char *)region->addr - (char *)snapshot->regions[0]->start_addr; - memset((char *)snapshot->regions[0]->data + offset, 0, region->size); - }else if(region->addr > snapshot->regions[2]->start_addr && (char *)(region->addr) < (char*)snapshot->regions[2]->start_addr + snapshot->regions[2]->size){ - offset = (char *)region->addr - (char *)snapshot->regions[2]->start_addr; - memset((char *)snapshot->regions[2]->data + offset, 0, region->size); - }else if(region->addr > snapshot->regions[1]->start_addr && (char *)(region->addr) < (char*)snapshot->regions[1]->start_addr + snapshot->regions[1]->size){ - offset = (char *)region->addr - (char *)snapshot->regions[1]->start_addr; - memset((char *)snapshot->regions[1]->data + offset, 0, region->size); - } + // FIXME, cross-process support (mc_checkpoint_ignore) + xbt_dynar_foreach (mc_model_checker->process.checkpoint_ignore, cursor, region) { + s_mc_snapshot_ignored_data_t ignored_data; + ignored_data.start = region->addr; + ignored_data.size = region->size; + ignored_data.data = malloc(region->size); + // TODO, we should do this once per privatization segment: + MC_process_read(snapshot->process, + MC_ADDRESS_SPACE_READ_FLAGS_NONE, + ignored_data.data, region->addr, region->size, MC_PROCESS_INDEX_DISABLED); + xbt_dynar_push(snapshot->ignored_data, &ignored_data); + } + + // Zero the memory: + xbt_dynar_foreach (mc_model_checker->process.checkpoint_ignore, cursor, region) { + MC_process_clear_memory(snapshot->process, region->addr, region->size); + } + +} + +static void MC_snapshot_ignore_restore(mc_snapshot_t snapshot) +{ + unsigned int cursor = 0; + s_mc_snapshot_ignored_data_t ignored_data; + xbt_dynar_foreach (snapshot->ignored_data, cursor, ignored_data) { + MC_process_write(snapshot->process, + ignored_data.data, ignored_data.start, ignored_data.size); } +} + +/** @brief Can we remove this snapshot? + * + * Some snapshots cannot be removed (yet) because we need them + * at this point. + * + * @param snapshot + */ +int mc_important_snapshot(mc_snapshot_t snapshot) +{ + // We need this snapshot in order to know which + // pages needs to be stored in the next snapshot. + // This field is only non-NULL when using soft-dirty + // page tracking. + if (snapshot == mc_model_checker->parent_snapshot) + return true; + return false; } +static void MC_get_current_fd(mc_snapshot_t snapshot) +{ + + snapshot->total_fd = 0; + + const size_t fd_dir_path_size = 20; + char fd_dir_path[fd_dir_path_size]; + if (snprintf(fd_dir_path, fd_dir_path_size, + "/proc/%lli/fd", (long long int) snapshot->process->pid) > fd_dir_path_size) + xbt_die("Unexpected buffer is too small for fd_dir_path"); + + DIR* fd_dir = opendir(fd_dir_path); + if (fd_dir == NULL) + xbt_die("Cannot open directory '/proc/self/fd'\n"); + + size_t total_fd = 0; + struct dirent* fd_number; + while ((fd_number = readdir(fd_dir))) { + + int fd_value = atoi(fd_number->d_name); + + if(fd_value < 3) + continue; + + const size_t source_size = 25; + char source[25]; + if (snprintf(source, source_size, "/proc/%lli/fd/%s", + (long long int) snapshot->process->pid, fd_number->d_name) > source_size) + xbt_die("Unexpected buffer is too small for fd %s", fd_number->d_name); + + const size_t link_size = 200; + char link[200]; + int res = readlink(source, link, link_size); + if (res<0) { + xbt_die("Could not read link for %s", source); + } + if (res==200) { + xbt_die("Buffer to small for link of %s", source); + } + link[res] = '\0'; + + if(smpi_is_privatisation_file(link)) + continue; + + // This is (probably) the DIR* we are reading: + // TODO, read all the file entries at once and close the DIR.* + if(strcmp(fd_dir_path, link) == 0) + continue; + + // We don't handle them. + // It does not mean we should silently ignore them however. + if (strncmp(link, "pipe:", 5) == 0 || strncmp(link, "socket:", 7) == 0) + continue; + + // If dot_output enabled, do not handle the corresponding file + if (dot_output != NULL && strcmp(basename(link), _sg_mc_dot_output_file) == 0) + continue; + + // This is probably a shared memory used by lttng-ust: + if(strncmp("/dev/shm/ust-shm-tmp-", link, 21)==0) + continue; + + // Add an entry for this FD in the snapshot: + fd_infos_t fd = xbt_new0(s_fd_infos_t, 1); + fd->filename = strdup(link); + fd->number = fd_value; + fd->flags = fcntl(fd_value, F_GETFL) | fcntl(fd_value, F_GETFD) ; + fd->current_position = lseek(fd_value, 0, SEEK_CUR); + snapshot->current_fd = xbt_realloc(snapshot->current_fd, (total_fd + 1) * sizeof(fd_infos_t)); + snapshot->current_fd[total_fd] = fd; + total_fd++; + } + + snapshot->total_fd = total_fd; + closedir (fd_dir); +} -mc_snapshot_t MC_take_snapshot(int num_state){ +static s_mc_address_space_class_t mc_snapshot_class = { + .read = (void*) &MC_snapshot_read +}; +mc_snapshot_t MC_take_snapshot(int num_state) +{ + mc_process_t mc_process = &mc_model_checker->process; mc_snapshot_t snapshot = xbt_new0(s_mc_snapshot_t, 1); - snapshot->nb_processes = xbt_swag_size(simix_global->process_list); + snapshot->process = mc_process; + snapshot->address_space.address_space_class = &mc_snapshot_class; + + snapshot->enabled_processes = xbt_dynar_new(sizeof(int), NULL); + + smx_process_t process; + MC_EACH_SIMIX_PROCESS(process, + xbt_dynar_push_as(snapshot->enabled_processes, int, (int)process->pid)); + + MC_snapshot_handle_ignore(snapshot); + + if (_sg_mc_snapshot_fds) + MC_get_current_fd(snapshot); + + const bool use_soft_dirty = _sg_mc_sparse_checkpoint + && _sg_mc_soft_dirty + && MC_process_is_self(mc_process); /* Save the std heap and the writable mapped pages of libsimgrid and binary */ - MC_get_memory_regions(snapshot); + MC_get_memory_regions(mc_process, snapshot); + if (use_soft_dirty) + mc_softdirty_reset(); snapshot->to_ignore = MC_take_snapshot_ignore(); - if(_sg_mc_visited > 0 || strcmp(_sg_mc_property_file,"")){ - snapshot->stacks = MC_take_snapshot_stacks(&snapshot, snapshot->regions[0]->data); - if(_sg_mc_hash && snapshot->stacks!=NULL) { + if (_sg_mc_visited > 0 || strcmp(_sg_mc_property_file, "")) { + snapshot->stacks = + MC_take_snapshot_stacks(&snapshot); + if (_sg_mc_hash && snapshot->stacks != NULL) { snapshot->hash = mc_hash_processes_state(num_state, snapshot->stacks); } else { snapshot->hash = 0; } - } - else { + } else { snapshot->hash = 0; } - if(num_state > 0) - MC_dump_checkpoint_ignore(snapshot); - + MC_snapshot_ignore_restore(snapshot); + if (use_soft_dirty) + mc_model_checker->parent_snapshot = snapshot; return snapshot; - } -void MC_restore_snapshot(mc_snapshot_t snapshot){ - unsigned int i; - for(i=0; i < NB_REGIONS; i++){ - MC_region_restore(snapshot->regions[i]); +static inline +void MC_restore_snapshot_regions(mc_snapshot_t snapshot) +{ + mc_snapshot_t parent_snapshot = mc_model_checker->parent_snapshot; + + const size_t n = snapshot->snapshot_regions_count; + for (size_t i = 0; i < n; i++) { + // For privatized, variables we decided it was not necessary to take the snapshot: + if (snapshot->snapshot_regions[i]) + MC_region_restore(snapshot->snapshot_regions[i], + parent_snapshot ? parent_snapshot->snapshot_regions[i] : NULL); } -} - -void* mc_translate_address(uintptr_t addr, mc_snapshot_t snapshot) { - - // If not in a process state/clone: - if(!snapshot) { - return (uintptr_t*) addr; +#ifdef HAVE_SMPI + if(snapshot->privatization_index >= 0) { + // We just rewrote the global variables. + // The privatisation segment SMPI thinks + // is mapped might be inconsistent with the segment which + // is really mapped in memory (kernel state). + // We ask politely SMPI to map the segment anyway, + // even if it thinks it is the current one: + smpi_really_switch_data_segment(snapshot->privatization_index); } +#endif +} - // If it is in a snapshot: - for(size_t i=0; i!=NB_REGIONS; ++i) { - mc_mem_region_t region = snapshot->regions[i]; - uintptr_t start = (uintptr_t) region->start_addr; - uintptr_t end = start + region->size; - - // The address is in this region: - if(addr >= start && addr < end) { - uintptr_t offset = addr - start; - return (void*) ((uintptr_t)region->data + offset); +static inline +void MC_restore_snapshot_fds(mc_snapshot_t snapshot) +{ + if (mc_mode == MC_MODE_SERVER) + xbt_die("FD snapshot not implemented in client/server mode."); + + int new_fd; + size_t i; + for(i=0; i < snapshot->total_fd; i++){ + + new_fd = open(snapshot->current_fd[i]->filename, snapshot->current_fd[i]->flags); + if (new_fd <0) { + xbt_die("Could not reopen the file %s fo restoring the file descriptor", + snapshot->current_fd[i]->filename); } - + if(new_fd != -1 && new_fd != snapshot->current_fd[i]->number){ + dup2(new_fd, snapshot->current_fd[i]->number); + //fprintf(stderr, "%p\n", fdopen(snapshot->current_fd[i]->number, "rw")); + close(new_fd); + }; + lseek(snapshot->current_fd[i]->number, snapshot->current_fd[i]->current_position, SEEK_SET); } - - // It is not in a snapshot: - return (void*) addr; } -uintptr_t mc_untranslate_address(void* addr, mc_snapshot_t snapshot) { - if(!snapshot) { - return (uintptr_t) addr; +void MC_restore_snapshot(mc_snapshot_t snapshot) +{ + const bool use_soft_dirty = _sg_mc_sparse_checkpoint + && _sg_mc_soft_dirty + && MC_process_is_self(&mc_model_checker->process); + + MC_restore_snapshot_regions(snapshot); + if (_sg_mc_snapshot_fds) + MC_restore_snapshot_fds(snapshot); + if (use_soft_dirty) { + mc_softdirty_reset(); } - - for(size_t i=0; i!=NB_REGIONS; ++i) { - mc_mem_region_t region = snapshot->regions[i]; - if(addr>=region->data && addr<=(void*)(((char*)region->data)+region->size)) { - size_t offset = (size_t) ((char*) addr - (char*) region->data); - return ((uintptr_t) region->start_addr) + offset; - } + MC_snapshot_ignore_restore(snapshot); + if (use_soft_dirty) { + mc_model_checker->parent_snapshot = snapshot; } - return (uintptr_t) addr; + mc_model_checker->process.cache_flags = 0; } -mc_snapshot_t SIMIX_pre_mc_snapshot(smx_simcall_t simcall){ +mc_snapshot_t simcall_HANDLER_mc_snapshot(smx_simcall_t simcall) +{ return MC_take_snapshot(1); } - -void *MC_snapshot(void){ - return simcall_mc_snapshot(); -}