Logo AND Algorithmique Numérique Distribuée

Public GIT Repository
Free exception, and fix warnings about variables possibly clobbered by longjmp.
[simgrid.git] / src / smpi / colls / smpi_automatic_selector.c
1 #include "colls_private.h"
2 #include "mc/mc_private.h"
3 #include <float.h>
4
// Attempt at a quick auto-tuning version of the collectives.
6
/*
 * TRACE_AUTO_COLL(cat)
 *
 * When HAVE_TRACING is defined and TRACE_is_enabled() returns true, emits a
 * Paje event on the container named "rank-<smpi_process_index()>". The event
 * type is named after the collective category `cat` (created on first use) and
 * the value is named after the algorithm being run.
 *
 * The macro reads `mpi_coll_<cat>_description[i]`, so a variable `i` indexing
 * that table must be in scope at the expansion site.
 *
 * It expands to a bare `if (...) { ... }` statement (no trailing semicolon is
 * expected by the existing call site), so it must not be used as the body of
 * an unbraced if/else.
 *
 * Without HAVE_TRACING it expands to nothing.
 */
#ifdef HAVE_TRACING
#define TRACE_AUTO_COLL(cat) if (TRACE_is_enabled()){\
        type_t type = PJ_type_get_or_null (#cat, PJ_type_get_root());\
        if (!type){\
            type=PJ_type_event_new(#cat, PJ_type_get_root());\
        }\
        char cont_name[25];\
        /* bounded write: never overruns cont_name whatever the index is */\
        snprintf(cont_name, sizeof cont_name, "rank-%d", smpi_process_index());\
        val_t value = PJ_value_get_or_new(mpi_coll_##cat##_description[i].name,"1.0 1.0 1.0", type);\
        new_pajeNewEvent (SIMIX_get_clock(), PJ_container_get(cont_name), type, value);\
      }
#else
#define TRACE_AUTO_COLL(cat)
#endif
21
22
/*
 * AUTOMATIC_COLL_BENCH(cat, ret, args, args2)
 *
 * Defines the function
 *     ret smpi_coll_tuned_<cat>_automatic(<args>)
 * which runs every algorithm listed in mpi_coll_<cat>_description[] (the table
 * is terminated by an entry whose .name is NULL), except the entries named
 * "automatic" and "default", and logs which one was the quickest.
 *
 *   cat    collective category, pasted into identifiers and log messages
 *   ret    return type of the generated function
 *   args   parenthesised parameter list of the generated function; it must
 *          declare a parameter named `comm`, which the body uses
 *   args2  parenthesised argument list forwarded to each algorithm
 *
 * For each candidate: all ranks synchronise on a barrier, the call is timed
 * with SIMIX_get_clock(), and the per-rank durations are MAX-reduced onto
 * rank 0. Each rank tracks its own quickest algorithm (min_coll); rank 0 also
 * tracks the algorithm with the smallest reduced maximum (global_coll).
 * A candidate that throws is skipped.
 * NOTE(review): a rank that catches an exception also skips the reduce for
 * that candidate while other ranks may still enter it -- confirm this cannot
 * desynchronise the communicator.
 *
 * Returns MPI_SUCCESS if at least one candidate completed on this rank,
 * MPI_ERR_INTERN otherwise. In the latter case nothing is looked up in the
 * description table (the indices are still -1).
 *
 * min_coll, global_coll and i are volatile because they are modified between
 * TRY and CATCH and read afterwards.
 */
#define AUTOMATIC_COLL_BENCH(cat, ret, args, args2)\
    ret smpi_coll_tuned_ ## cat ## _ ## automatic(COLL_UNPAREN args)\
{\
  double time1, time2, time_min=DBL_MAX;\
  volatile int min_coll=-1, global_coll=-1;\
  volatile int i;\
  xbt_ex_t ex;\
  double buf_in, buf_out, max_min=DBL_MAX;\
  for (i = 0; mpi_coll_##cat##_description[i].name; i++){\
      if(!strcmp(mpi_coll_##cat##_description[i].name, "automatic"))continue;\
      if(!strcmp(mpi_coll_##cat##_description[i].name, "default"))continue;\
      smpi_mpi_barrier(comm);\
      TRACE_AUTO_COLL(cat)\
      time1 = SIMIX_get_clock();\
      TRY{\
      ((int (*) args)\
          mpi_coll_##cat##_description[i].coll) args2 ;\
      }\
      CATCH(ex) {\
        xbt_ex_free(ex);\
        continue;\
      }\
      time2 = SIMIX_get_clock();\
      buf_out=time2-time1;\
      /* buf_in is only meaningful on the reduce root (rank 0) */\
      smpi_mpi_reduce((void*)&buf_out,(void*)&buf_in, 1, MPI_DOUBLE, MPI_MAX, 0,comm );\
      if(buf_out<time_min){\
          min_coll=i;\
          time_min=buf_out;\
      }\
      if(smpi_comm_rank(comm)==0){\
          if(buf_in<max_min){\
              max_min=buf_in;\
              global_coll=i;\
          }\
      }\
  }\
  if(min_coll==-1){\
      /* every candidate failed: do not index the table with -1 */\
      XBT_WARN("No %s algorithm could be benchmarked on rank %d",#cat, smpi_comm_rank(comm));\
      return MPI_ERR_INTERN;\
  }\
  if(smpi_comm_rank(comm)==0){\
      XBT_WARN("For rank 0, the quickest was %s : %f , but global was %s : %f at max",mpi_coll_##cat##_description[min_coll].name, time_min,(global_coll!=-1)?mpi_coll_##cat##_description[global_coll].name:"(none)", max_min);\
  }else{\
      XBT_WARN("The quickest %s was %s on rank %d and took %f",#cat,mpi_coll_##cat##_description[min_coll].name, smpi_comm_rank(comm), time_min);\
  }\
  return MPI_SUCCESS;\
}
65
66
67 COLL_APPLY(AUTOMATIC_COLL_BENCH, COLL_ALLGATHERV_SIG, (send_buff, send_count, send_type, recv_buff, recv_count, recv_disps, recv_type, comm));
68 COLL_APPLY(AUTOMATIC_COLL_BENCH, COLL_ALLREDUCE_SIG, (sbuf, rbuf, rcount, dtype, op, comm));
69 COLL_APPLY(AUTOMATIC_COLL_BENCH, COLL_GATHER_SIG, (send_buff, send_count, send_type, recv_buff, recv_count, recv_type, root, comm));
70 COLL_APPLY(AUTOMATIC_COLL_BENCH, COLL_ALLGATHER_SIG, (send_buff,send_count,send_type,recv_buff,recv_count,recv_type,comm));
71 COLL_APPLY(AUTOMATIC_COLL_BENCH, COLL_ALLTOALL_SIG,(send_buff, send_count, send_type, recv_buff, recv_count, recv_type,comm));
72 COLL_APPLY(AUTOMATIC_COLL_BENCH, COLL_ALLTOALLV_SIG, (send_buff, send_counts, send_disps, send_type, recv_buff, recv_counts, recv_disps, recv_type, comm));
73 COLL_APPLY(AUTOMATIC_COLL_BENCH, COLL_BCAST_SIG , (buf, count, datatype, root, comm));
74 COLL_APPLY(AUTOMATIC_COLL_BENCH, COLL_REDUCE_SIG,(buf,rbuf, count, datatype, op, root, comm));
75 COLL_APPLY(AUTOMATIC_COLL_BENCH, COLL_REDUCE_SCATTER_SIG ,(sbuf,rbuf, rcounts,dtype,op,comm));
76 COLL_APPLY(AUTOMATIC_COLL_BENCH, COLL_SCATTER_SIG ,(sendbuf, sendcount, sendtype,recvbuf, recvcount, recvtype,root, comm));
77 COLL_APPLY(AUTOMATIC_COLL_BENCH, COLL_BARRIER_SIG,(comm));