X-Git-Url: http://info.iut-bm.univ-fcomte.fr/pub/gitweb/simgrid.git/blobdiff_plain/12572db97b786e78f79c1b119151fae53287b633..dacc7f742e213df2a54511bfc5dc7b350987b014:/src/smpi/internals/smpi_replay.cpp diff --git a/src/smpi/internals/smpi_replay.cpp b/src/smpi/internals/smpi_replay.cpp index 9e6883dec1..42c8904076 100644 --- a/src/smpi/internals/smpi_replay.cpp +++ b/src/smpi/internals/smpi_replay.cpp @@ -12,6 +12,8 @@ #include "smpi_request.hpp" #include "xbt/replay.hpp" +#include +#include #include #include @@ -24,13 +26,16 @@ static int active_processes = 0; static std::unordered_map*> reqq; static MPI_Datatype MPI_DEFAULT_TYPE; -static MPI_Datatype MPI_CURRENT_TYPE; static int sendbuffer_size = 0; static char* sendbuffer = nullptr; static int recvbuffer_size = 0; static char* recvbuffer = nullptr; +class ReplayActionArg { + ReplayActionArg() {} +}; + static void log_timed_action (const char *const *action, double clock){ if (XBT_LOG_ISENABLED(smpi_replay, xbt_log_priority_verbose)){ char *name = xbt_str_join_array(action, " "); @@ -91,53 +96,15 @@ static double parse_double(const char *string) //TODO: this logic should be moved inside the datatype class, to support all predefined types and get rid of is_replayable. static MPI_Datatype decode_datatype(const char *const action) { - switch(atoi(action)) { - case 0: - return MPI_DOUBLE; - break; - case 1: - return MPI_INT; - break; - case 2: - return MPI_CHAR; - break; - case 3: - return MPI_SHORT; - break; - case 4: - return MPI_LONG; - break; - case 5: - return MPI_FLOAT; - break; - case 6: - return MPI_BYTE; - break; - default: - return MPI_DEFAULT_TYPE; - break; - } + return simgrid::smpi::Datatype::decode(action); } const char* encode_datatype(MPI_Datatype datatype) { - if (datatype==MPI_BYTE) - return ""; - if(datatype==MPI_DOUBLE) - return "0"; - if(datatype==MPI_INT) - return "1"; - if(datatype==MPI_CHAR) - return "2"; - if(datatype==MPI_SHORT) - return "3"; - if(datatype==MPI_LONG) - return "4"; - if(datatype==MPI_FLOAT) - return "5"; - // default - not implemented. - // do not warn here as we pass in this function even for other trace formats - return "-1"; + if (datatype == nullptr) /* this actually does seem to be possible, had this in the scatter2 test */ + return "-1"; + + return datatype->encode(); } #define CHECK_ACTION_PARAMS(action, mandatory, optional) {\ @@ -213,7 +180,7 @@ static void action_send(const char *const *action) double size=parse_double(action[3]); double clock = smpi_process()->simulated_elapsed(); - MPI_CURRENT_TYPE = (action[4]) ? decode_datatype(action[4]) : MPI_DEFAULT_TYPE; + MPI_Datatype MPI_CURRENT_TYPE = (action[4]) ? decode_datatype(action[4]) : MPI_DEFAULT_TYPE; int my_proc_id = Actor::self()->getPid(); int dst_traced = MPI_COMM_WORLD->group()->actor(to)->getPid(); @@ -237,7 +204,7 @@ static void action_Isend(const char *const *action) double size=parse_double(action[3]); double clock = smpi_process()->simulated_elapsed(); - MPI_CURRENT_TYPE = (action[4]) ? decode_datatype(action[4]) : MPI_DEFAULT_TYPE; + MPI_Datatype MPI_CURRENT_TYPE = (action[4]) ? decode_datatype(action[4]) : MPI_DEFAULT_TYPE; int my_proc_id = Actor::self()->getPid(); int dst_traced = MPI_COMM_WORLD->group()->actor(to)->getPid(); @@ -262,7 +229,7 @@ static void action_recv(const char *const *action) { double clock = smpi_process()->simulated_elapsed(); MPI_Status status; - MPI_CURRENT_TYPE = (action[4]) ? decode_datatype(action[4]) : MPI_DEFAULT_TYPE; + MPI_Datatype MPI_CURRENT_TYPE = (action[4]) ? decode_datatype(action[4]) : MPI_DEFAULT_TYPE; int my_proc_id = Actor::self()->getPid(); int src_traced = MPI_COMM_WORLD->group()->actor(from)->getPid(); @@ -293,7 +260,7 @@ static void action_Irecv(const char *const *action) double size=parse_double(action[3]); double clock = smpi_process()->simulated_elapsed(); - MPI_CURRENT_TYPE = (action[4]) ? decode_datatype(action[4]) : MPI_DEFAULT_TYPE; + MPI_Datatype MPI_CURRENT_TYPE = (action[4]) ? decode_datatype(action[4]) : MPI_DEFAULT_TYPE; int my_proc_id = Actor::self()->getPid(); TRACE_smpi_comm_in(my_proc_id, __FUNCTION__, @@ -420,9 +387,7 @@ static void action_bcast(const char *const *action) double clock = smpi_process()->simulated_elapsed(); int root = (action[3]) ? atoi(action[3]) : 0; /* Initialize MPI_CURRENT_TYPE in order to decrease the number of the checks */ - MPI_CURRENT_TYPE= MPI_DEFAULT_TYPE; - - MPI_CURRENT_TYPE = (action[3] && action[4]) ? decode_datatype(action[4]) : MPI_DEFAULT_TYPE; + MPI_Datatype MPI_CURRENT_TYPE = (action[3] && action[4]) ? decode_datatype(action[4]) : MPI_DEFAULT_TYPE; int my_proc_id = Actor::self()->getPid(); TRACE_smpi_comm_in(my_proc_id, __FUNCTION__, @@ -445,7 +410,7 @@ static void action_reduce(const char *const *action) double clock = smpi_process()->simulated_elapsed(); int root = (action[4]) ? atoi(action[4]) : 0; - MPI_CURRENT_TYPE = (action[4] && action[5]) ? decode_datatype(action[5]) : MPI_DEFAULT_TYPE; + MPI_Datatype MPI_CURRENT_TYPE = (action[4] && action[5]) ? decode_datatype(action[5]) : MPI_DEFAULT_TYPE; int my_proc_id = Actor::self()->getPid(); TRACE_smpi_comm_in(my_proc_id, __FUNCTION__, @@ -466,7 +431,7 @@ static void action_allReduce(const char *const *action) { double comm_size = parse_double(action[2]); double comp_size = parse_double(action[3]); - MPI_CURRENT_TYPE = (action[4]) ? decode_datatype(action[4]) : MPI_DEFAULT_TYPE; + MPI_Datatype MPI_CURRENT_TYPE = (action[4]) ? decode_datatype(action[4]) : MPI_DEFAULT_TYPE; double clock = smpi_process()->simulated_elapsed(); int my_proc_id = Actor::self()->getPid(); @@ -488,7 +453,7 @@ static void action_allToAll(const char *const *action) { int comm_size = MPI_COMM_WORLD->size(); int send_size = parse_double(action[2]); int recv_size = parse_double(action[3]); - MPI_CURRENT_TYPE = (action[4] && action[5]) ? decode_datatype(action[4]) : MPI_DEFAULT_TYPE; + MPI_Datatype MPI_CURRENT_TYPE = (action[4] && action[5]) ? decode_datatype(action[4]) : MPI_DEFAULT_TYPE; MPI_Datatype MPI_CURRENT_TYPE2{(action[4] && action[5]) ? decode_datatype(action[5]) : MPI_DEFAULT_TYPE}; void *send = smpi_get_tmp_sendbuffer(send_size*comm_size* MPI_CURRENT_TYPE->size()); @@ -521,7 +486,7 @@ static void action_gather(const char *const *action) { int comm_size = MPI_COMM_WORLD->size(); int send_size = parse_double(action[2]); int recv_size = parse_double(action[3]); - MPI_CURRENT_TYPE = (action[5] && action[6]) ? decode_datatype(action[5]) : MPI_DEFAULT_TYPE; + MPI_Datatype MPI_CURRENT_TYPE = (action[5] && action[6]) ? decode_datatype(action[5]) : MPI_DEFAULT_TYPE; MPI_Datatype MPI_CURRENT_TYPE2{(action[5] && action[6]) ? decode_datatype(action[6]) : MPI_DEFAULT_TYPE}; void *send = smpi_get_tmp_sendbuffer(send_size* MPI_CURRENT_TYPE->size()); @@ -558,7 +523,7 @@ static void action_scatter(const char* const* action) int comm_size = MPI_COMM_WORLD->size(); int send_size = parse_double(action[2]); int recv_size = parse_double(action[3]); - MPI_CURRENT_TYPE = (action[5] && action[6]) ? decode_datatype(action[5]) : MPI_DEFAULT_TYPE; + MPI_Datatype MPI_CURRENT_TYPE = (action[5] && action[6]) ? decode_datatype(action[5]) : MPI_DEFAULT_TYPE; MPI_Datatype MPI_CURRENT_TYPE2{(action[5] && action[6]) ? decode_datatype(action[6]) : MPI_DEFAULT_TYPE}; void* send = smpi_get_tmp_sendbuffer(send_size * MPI_CURRENT_TYPE->size()); @@ -593,11 +558,10 @@ static void action_gatherv(const char *const *action) { int comm_size = MPI_COMM_WORLD->size(); CHECK_ACTION_PARAMS(action, comm_size+1, 2) int send_size = parse_double(action[2]); - int disps[comm_size]; - int recvcounts[comm_size]; - int recv_sum=0; + std::vector disps(comm_size, 0); + std::shared_ptr> recvcounts(new std::vector(comm_size)); - MPI_CURRENT_TYPE = + MPI_Datatype MPI_CURRENT_TYPE = (action[4 + comm_size] && action[5 + comm_size]) ? decode_datatype(action[4 + comm_size]) : MPI_DEFAULT_TYPE; MPI_Datatype MPI_CURRENT_TYPE2{ (action[4 + comm_size] && action[5 + comm_size]) ? decode_datatype(action[5 + comm_size]) : MPI_DEFAULT_TYPE}; @@ -605,10 +569,9 @@ static void action_gatherv(const char *const *action) { void *send = smpi_get_tmp_sendbuffer(send_size* MPI_CURRENT_TYPE->size()); void *recv = nullptr; for(int i=0;ibegin(), recvcounts->end(), 0); int root = (action[3 + comm_size]) ? atoi(action[3 + comm_size]) : 0; int rank = MPI_COMM_WORLD->rank(); @@ -616,13 +579,12 @@ static void action_gatherv(const char *const *action) { if(rank==root) recv = smpi_get_tmp_recvbuffer(recv_sum* MPI_CURRENT_TYPE2->size()); - std::vector* trace_recvcounts = new std::vector(recvcounts, recvcounts + comm_size); - TRACE_smpi_comm_in(rank, __FUNCTION__, new simgrid::instr::VarCollTIData( - "gatherV", root, send_size, nullptr, -1, trace_recvcounts, + "gatherV", root, send_size, nullptr, -1, recvcounts, encode_datatype(MPI_CURRENT_TYPE), encode_datatype(MPI_CURRENT_TYPE2))); - Colls::gatherv(send, send_size, MPI_CURRENT_TYPE, recv, recvcounts, disps, MPI_CURRENT_TYPE2, root, MPI_COMM_WORLD); + Colls::gatherv(send, send_size, MPI_CURRENT_TYPE, recv, recvcounts->data(), disps.data(), MPI_CURRENT_TYPE2, root, + MPI_COMM_WORLD); TRACE_smpi_comm_out(Actor::self()->getPid()); log_timed_action (action, clock); @@ -643,11 +605,10 @@ static void action_scatterv(const char* const* action) int comm_size = MPI_COMM_WORLD->size(); CHECK_ACTION_PARAMS(action, comm_size + 1, 2) int recv_size = parse_double(action[2 + comm_size]); - int disps[comm_size]; - int sendcounts[comm_size]; - int send_sum = 0; + std::vector disps(comm_size, 0); + std::shared_ptr> sendcounts(new std::vector(comm_size)); - MPI_CURRENT_TYPE = + MPI_Datatype MPI_CURRENT_TYPE = (action[4 + comm_size] && action[5 + comm_size]) ? decode_datatype(action[4 + comm_size]) : MPI_DEFAULT_TYPE; MPI_Datatype MPI_CURRENT_TYPE2{ (action[4 + comm_size] && action[5 + comm_size]) ? decode_datatype(action[5 + comm_size]) : MPI_DEFAULT_TYPE}; @@ -655,10 +616,9 @@ static void action_scatterv(const char* const* action) void* send = nullptr; void* recv = smpi_get_tmp_recvbuffer(recv_size * MPI_CURRENT_TYPE->size()); for (int i = 0; i < comm_size; i++) { - sendcounts[i] = atoi(action[i + 2]); - send_sum += sendcounts[i]; - disps[i] = 0; + (*sendcounts)[i] = atoi(action[i + 2]); } + int send_sum = std::accumulate(sendcounts->begin(), sendcounts->end(), 0); int root = (action[3 + comm_size]) ? atoi(action[3 + comm_size]) : 0; int rank = MPI_COMM_WORLD->rank(); @@ -666,13 +626,12 @@ static void action_scatterv(const char* const* action) if (rank == root) send = smpi_get_tmp_sendbuffer(send_sum * MPI_CURRENT_TYPE2->size()); - std::vector* trace_sendcounts = new std::vector(sendcounts, sendcounts + comm_size); + TRACE_smpi_comm_in(rank, __FUNCTION__, new simgrid::instr::VarCollTIData("gatherV", root, -1, sendcounts, recv_size, + nullptr, encode_datatype(MPI_CURRENT_TYPE), + encode_datatype(MPI_CURRENT_TYPE2))); - TRACE_smpi_comm_in(rank, __FUNCTION__, new simgrid::instr::VarCollTIData( - "gatherV", root, -1, trace_sendcounts, recv_size, nullptr, - encode_datatype(MPI_CURRENT_TYPE), encode_datatype(MPI_CURRENT_TYPE2))); - - Colls::scatterv(send, sendcounts, disps, MPI_CURRENT_TYPE, recv, recv_size, MPI_CURRENT_TYPE2, root, MPI_COMM_WORLD); + Colls::scatterv(send, sendcounts->data(), disps.data(), MPI_CURRENT_TYPE, recv, recv_size, MPI_CURRENT_TYPE2, root, + MPI_COMM_WORLD); TRACE_smpi_comm_out(Actor::self()->getPid()); log_timed_action(action, clock); @@ -690,27 +649,24 @@ static void action_reducescatter(const char *const *action) { int comm_size = MPI_COMM_WORLD->size(); CHECK_ACTION_PARAMS(action, comm_size+1, 1) int comp_size = parse_double(action[2+comm_size]); - int recvcounts[comm_size]; int my_proc_id = Actor::self()->getPid(); - int size = 0; - std::vector* trace_recvcounts = new std::vector; - MPI_CURRENT_TYPE = (action[3 + comm_size]) ? decode_datatype(action[3 + comm_size]) : MPI_DEFAULT_TYPE; + std::shared_ptr> recvcounts(new std::vector); + MPI_Datatype MPI_CURRENT_TYPE = (action[3 + comm_size]) ? decode_datatype(action[3 + comm_size]) : MPI_DEFAULT_TYPE; for(int i=0;ipush_back(recvcounts[i]); - size+=recvcounts[i]; + recvcounts->push_back(atoi(action[i + 2])); } + int size{std::accumulate(recvcounts->begin(), recvcounts->end(), 0)}; TRACE_smpi_comm_in(my_proc_id, __FUNCTION__, - new simgrid::instr::VarCollTIData("reduceScatter", -1, 0, nullptr, -1, trace_recvcounts, + new simgrid::instr::VarCollTIData("reduceScatter", -1, 0, nullptr, -1, recvcounts, std::to_string(comp_size), /* ugly hack to print comp_size */ encode_datatype(MPI_CURRENT_TYPE))); void *sendbuf = smpi_get_tmp_sendbuffer(size* MPI_CURRENT_TYPE->size()); void *recvbuf = smpi_get_tmp_recvbuffer(size* MPI_CURRENT_TYPE->size()); - Colls::reduce_scatter(sendbuf, recvbuf, recvcounts, MPI_CURRENT_TYPE, MPI_OP_NULL, MPI_COMM_WORLD); + Colls::reduce_scatter(sendbuf, recvbuf, recvcounts->data(), MPI_CURRENT_TYPE, MPI_OP_NULL, MPI_COMM_WORLD); smpi_execute_flops(comp_size); TRACE_smpi_comm_out(my_proc_id); @@ -731,7 +687,7 @@ static void action_allgather(const char *const *action) { int sendcount=atoi(action[2]); int recvcount=atoi(action[3]); - MPI_CURRENT_TYPE = (action[4] && action[5]) ? decode_datatype(action[4]) : MPI_DEFAULT_TYPE; + MPI_Datatype MPI_CURRENT_TYPE = (action[4] && action[5]) ? decode_datatype(action[4]) : MPI_DEFAULT_TYPE; MPI_Datatype MPI_CURRENT_TYPE2{(action[4] && action[5]) ? decode_datatype(action[5]) : MPI_DEFAULT_TYPE}; void *sendbuf = smpi_get_tmp_sendbuffer(sendcount* MPI_CURRENT_TYPE->size()); @@ -763,11 +719,10 @@ static void action_allgatherv(const char *const *action) { int comm_size = MPI_COMM_WORLD->size(); CHECK_ACTION_PARAMS(action, comm_size+1, 2) int sendcount=atoi(action[2]); - int recvcounts[comm_size]; - int disps[comm_size]; - int recv_sum=0; + std::shared_ptr> recvcounts(new std::vector(comm_size)); + std::vector disps(comm_size, 0); - MPI_CURRENT_TYPE = + MPI_Datatype MPI_CURRENT_TYPE = (action[3 + comm_size] && action[4 + comm_size]) ? decode_datatype(action[3 + comm_size]) : MPI_DEFAULT_TYPE; MPI_Datatype MPI_CURRENT_TYPE2{ (action[3 + comm_size] && action[4 + comm_size]) ? decode_datatype(action[4 + comm_size]) : MPI_DEFAULT_TYPE}; @@ -775,23 +730,20 @@ static void action_allgatherv(const char *const *action) { void *sendbuf = smpi_get_tmp_sendbuffer(sendcount* MPI_CURRENT_TYPE->size()); for(int i=0;ibegin(), recvcounts->end(), 0); void *recvbuf = smpi_get_tmp_recvbuffer(recv_sum* MPI_CURRENT_TYPE2->size()); int my_proc_id = Actor::self()->getPid(); - std::vector* trace_recvcounts = new std::vector(recvcounts, recvcounts + comm_size); - TRACE_smpi_comm_in(my_proc_id, __FUNCTION__, - new simgrid::instr::VarCollTIData("allGatherV", -1, sendcount, nullptr, -1, trace_recvcounts, + new simgrid::instr::VarCollTIData("allGatherV", -1, sendcount, nullptr, -1, recvcounts, encode_datatype(MPI_CURRENT_TYPE), encode_datatype(MPI_CURRENT_TYPE2))); - Colls::allgatherv(sendbuf, sendcount, MPI_CURRENT_TYPE, recvbuf, recvcounts, disps, MPI_CURRENT_TYPE2, - MPI_COMM_WORLD); + Colls::allgatherv(sendbuf, sendcount, MPI_CURRENT_TYPE, recvbuf, recvcounts->data(), disps.data(), MPI_CURRENT_TYPE2, + MPI_COMM_WORLD); TRACE_smpi_comm_out(my_proc_id); log_timed_action (action, clock); @@ -810,18 +762,14 @@ static void action_allToAllv(const char *const *action) { int comm_size = MPI_COMM_WORLD->size(); CHECK_ACTION_PARAMS(action, 2*comm_size+2, 2) - int send_size = 0; - int recv_size = 0; - int sendcounts[comm_size]; - std::vector* trace_sendcounts = new std::vector; - int recvcounts[comm_size]; - std::vector* trace_recvcounts = new std::vector; - int senddisps[comm_size]; - int recvdisps[comm_size]; - - MPI_CURRENT_TYPE = (action[4 + 2 * comm_size] && action[5 + 2 * comm_size]) - ? decode_datatype(action[4 + 2 * comm_size]) - : MPI_DEFAULT_TYPE; + std::shared_ptr> sendcounts(new std::vector(comm_size)); + std::shared_ptr> recvcounts(new std::vector(comm_size)); + std::vector senddisps(comm_size, 0); + std::vector recvdisps(comm_size, 0); + + MPI_Datatype MPI_CURRENT_TYPE = (action[4 + 2 * comm_size] && action[5 + 2 * comm_size]) + ? decode_datatype(action[4 + 2 * comm_size]) + : MPI_DEFAULT_TYPE; MPI_Datatype MPI_CURRENT_TYPE2{(action[4 + 2 * comm_size] && action[5 + 2 * comm_size]) ? decode_datatype(action[5 + 2 * comm_size]) : MPI_DEFAULT_TYPE}; @@ -833,23 +781,19 @@ static void action_allToAllv(const char *const *action) { void *recvbuf = smpi_get_tmp_recvbuffer(recv_buf_size* MPI_CURRENT_TYPE2->size()); for(int i=0;ipush_back(sendcounts[i]); - send_size += sendcounts[i]; - recvcounts[i] = atoi(action[i+4+comm_size]); - trace_recvcounts->push_back(recvcounts[i]); - recv_size += recvcounts[i]; - senddisps[i] = 0; - recvdisps[i] = 0; + (*sendcounts)[i] = atoi(action[3 + i]); + (*recvcounts)[i] = atoi(action[4 + comm_size + i]); } + int send_size = std::accumulate(sendcounts->begin(), sendcounts->end(), 0); + int recv_size = std::accumulate(recvcounts->begin(), recvcounts->end(), 0); TRACE_smpi_comm_in(my_proc_id, __FUNCTION__, - new simgrid::instr::VarCollTIData("allToAllV", -1, send_size, trace_sendcounts, recv_size, - trace_recvcounts, encode_datatype(MPI_CURRENT_TYPE), + new simgrid::instr::VarCollTIData("allToAllV", -1, send_size, sendcounts, recv_size, recvcounts, + encode_datatype(MPI_CURRENT_TYPE), encode_datatype(MPI_CURRENT_TYPE2))); - Colls::alltoallv(sendbuf, sendcounts, senddisps, MPI_CURRENT_TYPE,recvbuf, recvcounts, recvdisps, - MPI_CURRENT_TYPE, MPI_COMM_WORLD); + Colls::alltoallv(sendbuf, sendcounts->data(), senddisps.data(), MPI_CURRENT_TYPE, recvbuf, recvcounts->data(), + recvdisps.data(), MPI_CURRENT_TYPE, MPI_COMM_WORLD); TRACE_smpi_comm_out(my_proc_id); log_timed_action (action, clock);