X-Git-Url: http://info.iut-bm.univ-fcomte.fr/pub/gitweb/simgrid.git/blobdiff_plain/c65a2fd02f74c12e469150dfbae04366f4be484c..477470a3c0b62c557dba9f40f2f781224a6c73e6:/src/smpi/include/private.hpp diff --git a/src/smpi/include/private.hpp b/src/smpi/include/private.hpp index 9b276231ac..a4e1fdab68 100644 --- a/src/smpi/include/private.hpp +++ b/src/smpi/include/private.hpp @@ -26,8 +26,9 @@ constexpr unsigned MPI_REQ_RMA = 0x200; constexpr unsigned MPI_REQ_ACCUMULATE = 0x400; constexpr unsigned MPI_REQ_GENERALIZED = 0x800; constexpr unsigned MPI_REQ_COMPLETE = 0x1000; +constexpr unsigned MPI_REQ_BSEND = 0x2000; -enum class SmpiProcessState { UNINITIALIZED, INITIALIZING, INITIALIZED, FINALIZED }; +enum class SmpiProcessState { UNINITIALIZED, INITIALIZING, INITIALIZED /*(=MPI_Init called)*/, FINALIZED }; constexpr int COLL_TAG_REDUCE = -112; constexpr int COLL_TAG_SCATTER = -223; @@ -38,10 +39,12 @@ constexpr int COLL_TAG_ALLGATHERV = -667; constexpr int COLL_TAG_BARRIER = -778; constexpr int COLL_TAG_REDUCE_SCATTER = -889; constexpr int COLL_TAG_ALLTOALLV = -1000; +constexpr int COLL_TAG_ALLTOALLW = -1020; constexpr int COLL_TAG_ALLTOALL = -1112; constexpr int COLL_TAG_GATHERV = -2223; constexpr int COLL_TAG_BCAST = -3334; constexpr int COLL_TAG_ALLREDUCE = -4445; + // SMPI_RMA_TAG has to be the smallest one, as it will be decremented for accumulate ordering. constexpr int SMPI_RMA_TAG = -6666; @@ -56,10 +59,11 @@ extern XBT_PUBLIC int mpi_statuses_ignore_; #define FORT_ADDR(addr, val, val2) \ (((void *)(addr) == (void*) &(val2)) \ ? (val) : (void *)(addr)) -#define FORT_BOTTOM(addr) FORT_ADDR(addr, MPI_BOTTOM, mpi_bottom_) -#define FORT_IN_PLACE(addr) FORT_ADDR(addr, MPI_IN_PLACE, mpi_in_place_) -#define FORT_STATUS_IGNORE(addr) static_cast(FORT_ADDR(addr, MPI_STATUS_IGNORE, mpi_status_ignore_)) -#define FORT_STATUSES_IGNORE(addr) static_cast(FORT_ADDR(addr, MPI_STATUSES_IGNORE, mpi_statuses_ignore_)) +#define FORT_BOTTOM(addr) FORT_ADDR((addr), MPI_BOTTOM, mpi_bottom_) +#define FORT_IN_PLACE(addr) FORT_ADDR((addr), MPI_IN_PLACE, mpi_in_place_) +#define FORT_STATUS_IGNORE(addr) static_cast(FORT_ADDR((addr), MPI_STATUS_IGNORE, mpi_status_ignore_)) +#define FORT_STATUSES_IGNORE(addr) \ + static_cast(FORT_ADDR((addr), MPI_STATUSES_IGNORE, mpi_statuses_ignore_)) extern XBT_PRIVATE MPI_Comm MPI_COMM_UNINITIALIZED; @@ -71,12 +75,12 @@ typedef SMPI_Dist_Graph_topology* MPIR_Dist_Graph_Topology; XBT_PRIVATE simgrid::smpi::ActorExt* smpi_process(); XBT_PRIVATE simgrid::smpi::ActorExt* smpi_process_remote(simgrid::s4u::ActorPtr actor); -XBT_PRIVATE int smpi_process_count(); +XBT_PRIVATE int smpi_get_universe_size(); + +XBT_PRIVATE void smpi_deployment_register_process(const std::string& instance_id, int rank, simgrid::s4u::Actor* actor); +XBT_PRIVATE void smpi_deployment_unregister_process(const std::string& instance_id); -XBT_PRIVATE void smpi_deployment_register_process(const std::string& instance_id, int rank, - simgrid::s4u::ActorPtr actor); XBT_PRIVATE MPI_Comm* smpi_deployment_comm_world(const std::string& instance_id); -XBT_PRIVATE simgrid::s4u::Barrier* smpi_deployment_finalization_barrier(const std::string& instance_id); XBT_PRIVATE void smpi_deployment_cleanup_instances(); XBT_PRIVATE void smpi_comm_copy_buffer_callback(simgrid::kernel::activity::CommImpl* comm, void* buff, @@ -86,22 +90,32 @@ XBT_PRIVATE void smpi_comm_null_copy_buffer_callback(simgrid::kernel::activity:: size_t buff_size); XBT_PRIVATE int smpi_enabled(); -XBT_PRIVATE void smpi_global_init(); -XBT_PRIVATE void smpi_global_destroy(); XBT_PRIVATE double smpi_mpi_wtime(); XBT_PRIVATE void smpi_mpi_init(); +enum class SharedMallocType { NONE, LOCAL, GLOBAL }; +enum class SmpiPrivStrategies { NONE = 0, MMAP = 1, DLOPEN = 2, DEFAULT = DLOPEN }; + +XBT_PRIVATE double smpi_cfg_host_speed(); +XBT_PRIVATE bool smpi_cfg_simulate_computation(); +XBT_PRIVATE SharedMallocType smpi_cfg_shared_malloc(); +XBT_PRIVATE double smpi_cfg_cpu_thresh(); +XBT_PRIVATE SmpiPrivStrategies smpi_cfg_privatization(); +XBT_PRIVATE int smpi_cfg_async_small_thresh(); +XBT_PRIVATE int smpi_cfg_detached_send_thresh(); +XBT_PRIVATE bool smpi_cfg_grow_injected_times(); +XBT_PRIVATE double smpi_cfg_iprobe_cpu_usage(); +XBT_PRIVATE bool smpi_cfg_trace_call_location(); +XBT_PRIVATE bool smpi_cfg_trace_call_use_absolute_path(); +XBT_PRIVATE std::string smpi_cfg_comp_adjustment_file(); +XBT_PRIVATE std::string smpi_cfg_papi_events_file(); +XBT_PRIVATE double smpi_cfg_auto_shared_malloc_thresh(); + // utilities -extern XBT_PRIVATE double smpi_cpu_threshold; -extern XBT_PRIVATE double smpi_host_speed; extern XBT_PRIVATE char* smpi_data_exe_start; // start of the data+bss segment of the executable extern XBT_PRIVATE int smpi_data_exe_size; // size of the data+bss segment of the executable -enum class SharedMallocType { NONE, LOCAL, GLOBAL }; -extern XBT_PRIVATE SharedMallocType smpi_cfg_shared_malloc; // Whether to activate shared malloc - XBT_PRIVATE void smpi_switch_data_segment(simgrid::s4u::ActorPtr actor); -XBT_PRIVATE void smpi_really_switch_data_segment(simgrid::s4u::ActorPtr actor); XBT_PRIVATE void smpi_prepare_global_memory_segment(); XBT_PRIVATE void smpi_backup_global_memory_segment(); @@ -110,6 +124,7 @@ XBT_PRIVATE void smpi_bench_destroy(); XBT_PRIVATE void smpi_bench_begin(); XBT_PRIVATE void smpi_bench_end(); XBT_PRIVATE void smpi_shared_destroy(); +XBT_PRIVATE double smpi_adjust_comp_speed(); XBT_PRIVATE unsigned char* smpi_get_tmp_sendbuffer(size_t size); XBT_PRIVATE unsigned char* smpi_get_tmp_recvbuffer(size_t size); @@ -342,12 +357,12 @@ void mpi_graph_neighbors_count_(int* comm, int* rank, int* nneighbors, int* ierr void mpi_graphdims_get_(int* comm, int* nnodes, int* nedges, int* ierr); void mpi_topo_test_(int* comm, int* top_type, int* ierr); void mpi_error_class_(int* errorcode, int* errorclass, int* ierr); -void mpi_errhandler_create_(void* function, void* errhandler, int* ierr); -void mpi_errhandler_free_(void* errhandler, int* ierr); -void mpi_errhandler_get_(int* comm, void* errhandler, int* ierr); -void mpi_errhandler_set_(int* comm, void* errhandler, int* ierr); -void mpi_comm_set_errhandler_(int* comm, void* errhandler, int* ierr); -void mpi_comm_get_errhandler_(int* comm, void* errhandler, int* ierr); +void mpi_errhandler_create_(void* function, int* errhandler, int* ierr); +void mpi_errhandler_free_(int* errhandler, int* ierr); +void mpi_errhandler_get_(int* comm, int* errhandler, int* ierr); +void mpi_errhandler_set_(int* comm, int* errhandler, int* ierr); +void mpi_comm_set_errhandler_(int* comm, int* errhandler, int* ierr); +void mpi_comm_get_errhandler_(int* comm, int* errhandler, int* ierr); void mpi_type_contiguous_(int* count, int* old_type, int* newtype, int* ierr); void mpi_cancel_(int* request, int* ierr); void mpi_buffer_attach_(void* buffer, int* size, int* ierr); @@ -360,14 +375,14 @@ void mpi_pack_external_(char* datarep, void* inbuf, int* incount, int* datatype, MPI_Aint* position, int* ierr); void mpi_unpack_external_(char* datarep, void* inbuf, MPI_Aint* insize, MPI_Aint* position, void* outbuf, int* outcount, int* datatype, int* ierr); -void mpi_type_hindexed_(int* count, int* blocklens, MPI_Aint* indices, int* old_type, int* newtype, int* ierr); +void mpi_type_hindexed_(int* count, int* blocklens, int* indices, int* old_type, int* newtype, int* ierr); void mpi_type_create_hindexed_(int* count, int* blocklens, MPI_Aint* indices, int* old_type, int* newtype, int* ierr); void mpi_type_create_hindexed_block_(int* count, int* blocklength, MPI_Aint* indices, int* old_type, int* newtype, int* ierr); void mpi_type_indexed_(int* count, int* blocklens, int* indices, int* old_type, int* newtype, int* ierr); void mpi_type_create_indexed_(int* count, int* blocklens, int* indices, int* old_type, int* newtype, int* ierr); void mpi_type_create_indexed_block_(int* count, int* blocklength, int* indices, int* old_type, int* newtype, int* ierr); -void mpi_type_struct_(int* count, int* blocklens, MPI_Aint* indices, int* old_types, int* newtype, int* ierr); +void mpi_type_struct_(int* count, int* blocklens, int* indices, int* old_types, int* newtype, int* ierr); void mpi_type_create_struct_(int* count, int* blocklens, MPI_Aint* indices, int* old_types, int* newtype, int* ierr); void mpi_ssend_(void* buf, int* count, int* datatype, int* dest, int* tag, int* comm, int* ierr); void mpi_ssend_init_(void* buf, int* count, int* datatype, int* dest, int* tag, int* comm, int* request, int* ierr); @@ -408,7 +423,7 @@ void mpi_comm_split_type_(int* comm, int* split_type, int* key, int* info, int* void mpi_comm_set_info_(int* comm, int* info, int* ierr); void mpi_comm_get_info_(int* comm, int* info, int* ierr); void mpi_info_get_(int* info, char* key, int* valuelen, char* value, int* flag, int* ierr, unsigned int keylen); -void mpi_comm_create_errhandler_(void* function, void* errhandler, int* ierr); +void mpi_comm_create_errhandler_(void* function, int* errhandler, int* ierr); void mpi_add_error_class_(int* errorclass, int* ierr); void mpi_add_error_code_(int* errorclass, int* errorcode, int* ierr); void mpi_add_error_string_(int* errorcode, char* string, int* ierr); @@ -448,6 +463,9 @@ void mpi_file_write_(int* fh, void* buf, int* count, int* datatype, MPI_Status* void smpi_init_fortran_types(); } // extern "C" +XBT_PRIVATE int smpi_temp_shm_get(); +XBT_PRIVATE void* smpi_temp_shm_mmap(int fd, size_t size); + struct s_smpi_privatization_region_t { void* address; int file_descriptor; @@ -455,7 +473,6 @@ struct s_smpi_privatization_region_t { typedef s_smpi_privatization_region_t* smpi_privatization_region_t; extern XBT_PRIVATE int smpi_loaded_page; -extern XBT_PRIVATE int smpi_universe_size; XBT_PRIVATE smpi_privatization_region_t smpi_init_global_memory_segment_process(); /** @@ -479,8 +496,62 @@ extern std::unordered_map location2speedup; /** @brief Returns the last call location (filename, linenumber). Process-specific. */ XBT_PUBLIC smpi_trace_call_location_t* smpi_trace_get_call_location(); -enum class SmpiPrivStrategies { NONE = 0, MMAP = 1, DLOPEN = 2, DEFAULT = DLOPEN }; - -extern XBT_PRIVATE SmpiPrivStrategies smpi_privatize_global_variables; - +XBT_PRIVATE void private_execute_flops(double flops); + + +#define CHECK_ARGS(test, errcode, ...) \ + if (test) { \ + if((errcode) != MPI_SUCCESS) \ + XBT_WARN(__VA_ARGS__); \ + return (errcode); \ + } + +#define CHECK_MPI_NULL(num, val, err, ptr) \ + CHECK_ARGS((ptr) == (val), (err), \ + "%s: param %d %s cannot be %s", __func__, (num), #ptr, #val); +#define CHECK_NULL(num,err,buf) \ + CHECK_ARGS((buf) == nullptr, (err), \ + "%s: param %d %s cannot be NULL", __func__, (num), #buf); +#define CHECK_NEGATIVE(num, err, val) \ + CHECK_ARGS((val) < 0, (err), \ + "%s: param %d %s cannot be negative", __func__, (num), #val); +#define CHECK_COMM2(num, comm) \ + CHECK_MPI_NULL((num), MPI_COMM_NULL, MPI_ERR_COMM, (comm)) +#define CHECK_COMM(num) \ + CHECK_COMM2((num), comm) +#define CHECK_REQUEST(num) \ + CHECK_ARGS(request == nullptr, MPI_ERR_REQUEST, \ + "%s: param %d request cannot be NULL",__func__, (num)); +#define CHECK_BUFFER(num,buf,count) \ + CHECK_ARGS((buf) == nullptr && (count) > 0, MPI_ERR_BUFFER, \ + "%s: param %d %s cannot be NULL if %s > 0",__func__, (num), #buf, #count); +#define CHECK_COUNT(num, count) \ + CHECK_NEGATIVE((num), MPI_ERR_COUNT, (count)) +#define CHECK_TYPE(num, datatype) \ + CHECK_ARGS(((datatype) == MPI_DATATYPE_NULL|| not (datatype)->is_valid()), MPI_ERR_TYPE, \ + "%s: param %d %s cannot be MPI_DATATYPE_NULL or invalid", __func__, (num), #datatype); +#define CHECK_OP(num) \ + CHECK_MPI_NULL((num), MPI_OP_NULL, MPI_ERR_OP, op) +#define CHECK_ROOT(num)\ + CHECK_ARGS((root < 0 || root >= comm->size()), MPI_ERR_ROOT, \ + "%s: param %d root (=%d) cannot be negative or larger than communicator size (=%d)", __func__, (num), root, \ + comm->size()); +#define CHECK_PROC(num,proc) \ + CHECK_MPI_NULL((num), MPI_PROC_NULL, MPI_SUCCESS, (proc)) +#define CHECK_INFO(num,info) \ + CHECK_MPI_NULL((num), MPI_INFO_NULL, MPI_ERR_INFO, (info)) +#define CHECK_TAG(num,tag) \ + CHECK_ARGS(((tag) < 0 && (tag) != MPI_ANY_TAG), MPI_ERR_TAG, \ + "%s: param %d %s (=%d) cannot be negative", __func__, (num), #tag, (tag)); +#define CHECK_FILE(num, fh) \ + CHECK_MPI_NULL((num), MPI_FILE_NULL, MPI_ERR_FILE, (fh)) +#define CHECK_OFFSET(num, offset) \ + CHECK_NEGATIVE((num), MPI_ERR_DISP, (offset)) +#define CHECK_GROUP(num, group) \ + CHECK_MPI_NULL((num), MPI_GROUP_NULL, MPI_ERR_GROUP, (group)) +#define CHECK_WIN(num, win) \ + CHECK_MPI_NULL((num), MPI_WIN_NULL, MPI_ERR_WIN, (win)) +#define CHECK_RANK(num, rank, comm) \ + CHECK_ARGS(((rank) >= (comm)->group()->size() || (rank) <0), MPI_ERR_RANK, \ + "%s: param %d %s (=%d) cannot be < 0 or > %d", __func__, (num), #rank, (rank), (comm)->group()->size() ); #endif