Logo AND Algorithmique Numérique Distribuée

Public GIT Repository
Merge branch 'master' of git+ssh://scm.gforge.inria.fr//gitroot/simgrid/simgrid
[simgrid.git] / src / smpi / colls / smpi_automatic_selector.cpp
1 /* Copyright (c) 2013-2017. The SimGrid Team.
2  * All rights reserved.                                                     */
3
4 /* This program is free software; you can redistribute it and/or modify it
5  * under the terms of the license (GNU LGPL) which comes with this package. */
6
7 #include <float.h>
8
9 #include <exception>
10
11 #include "colls_private.h"
12 #include "src/smpi/smpi_process.hpp"
13
14
// Attempt a quick auto-tuning of the collectives: run every registered algorithm, time it, and report the quickest one.
16
/* TRACE_AUTO_COLL(cat)
 *
 * When tracing is enabled, emits one Paje event announcing which algorithm of
 * collective `cat` is about to run on this process.
 *
 * The event type is looked up by the stringified name of `cat` under the root
 * type and created if missing; the event value is named after the algorithm,
 * and the container is "rank-<process index>".
 *
 * Note: the macro reads a variable named `i` from the scope in which it is
 * expanded (the index into Colls::mpi_coll_<cat>_description). It expands to a
 * complete `if { ... }` statement, so call sites use it without a trailing
 * semicolon.
 */
#define TRACE_AUTO_COLL(cat) if (TRACE_is_enabled()){\
         type_t existing_type = PJ_type_get_or_null (#cat, PJ_type_get_root());\
         /* get-or-create: only build a new event type when none exists yet */\
         type_t event_type = existing_type ? existing_type\
                                           : PJ_type_event_new(#cat, PJ_type_get_root());\
         char container_name[25];\
         snprintf(container_name, sizeof(container_name), "rank-%d", smpi_process()->index());\
         val_t algo_value = PJ_value_get_or_new(Colls::mpi_coll_##cat##_description[i].name,"1.0 1.0 1.0", event_type);\
         new_pajeNewEvent (SIMIX_get_clock(), PJ_container_get(container_name), event_type, algo_value);\
      }
27
/* AUTOMATIC_COLL_BENCH(cat, ret, args, args2)
 *
 * Defines `ret Coll_<cat>_automatic::<cat>(args)`, the "automatic" selector for
 * collective `cat`.
 *
 *   cat   - collective name (e.g. bcast); used to build the class name and to
 *           find the Colls::mpi_coll_<cat>_description table.
 *   ret   - return type of the generated function.
 *   args  - parenthesised parameter list (types and names) of the collective.
 *   args2 - parenthesised argument list forwarded to each candidate.
 *
 * The generated function walks the description table until an entry with a
 * null name, skipping the entries named "automatic" and "default". For each
 * remaining algorithm it:
 *   1. synchronises with Coll_barrier_default::barrier,
 *   2. emits a trace event (TRACE_AUTO_COLL),
 *   3. runs the algorithm and measures the elapsed SIMIX clock time,
 *   4. MAX-reduces the elapsed time onto rank 0.
 * Each rank remembers its own quickest algorithm; rank 0 additionally
 * remembers the algorithm whose reduced (maximum) time is the smallest.
 * Results are reported through XBT_WARN.
 *
 * Returns MPI_SUCCESS if at least one algorithm completed on this rank,
 * MPI_ERR_INTERN otherwise.
 *
 * The parameter list in `args` must contain a communicator named `comm`.
 */
#define AUTOMATIC_COLL_BENCH(cat, ret, args, args2)\
    ret Coll_ ## cat ## _automatic:: cat (COLL_UNPAREN args)\
{\
  double time1, time2, time_min=DBL_MAX;\
  int min_coll=-1, global_coll=-1;\
  int i; /* must keep this exact name: TRACE_AUTO_COLL reads `i` */\
  double buf_in, buf_out, max_min=DBL_MAX;\
  for (i = 0; Colls::mpi_coll_##cat##_description[i].name; i++){\
      /* "automatic" is this very selector; "default" is skipped as well */\
      if(!strcmp(Colls::mpi_coll_##cat##_description[i].name, "automatic"))continue;\
      if(!strcmp(Colls::mpi_coll_##cat##_description[i].name, "default"))continue;\
      Coll_barrier_default::barrier(comm);\
      TRACE_AUTO_COLL(cat)\
      time1 = SIMIX_get_clock();\
      try {\
      ((int (*) args)\
          Colls::mpi_coll_##cat##_description[i].coll) args2 ;\
      }\
      catch (const std::exception&) {\
        /* An algorithm that throws is simply dropped from the benchmark. */\
        /* NOTE(review): this also skips the reduce below; if only some   */\
        /* ranks throw, the others may wait in it forever - confirm.       */\
        continue;\
      }\
      time2 = SIMIX_get_clock();\
      buf_out=time2-time1;\
      Coll_reduce_default::reduce((void*)&buf_out,(void*)&buf_in, 1, MPI_DOUBLE, MPI_MAX, 0,comm );\
      if(time2-time1<time_min){\
          min_coll=i;\
          time_min=time2-time1;\
      }\
      /* buf_in is only read on rank 0, the root of the reduce above */\
      if(comm->rank()==0){\
          if(buf_in<max_min){\
              max_min=buf_in;\
              global_coll=i;\
          }\
      }\
  }\
  /* min_coll / global_coll stay at -1 when no algorithm completed; never   */\
  /* index the description table with -1, report a placeholder name instead */\
  const char* min_coll_name = (min_coll!=-1) ? Colls::mpi_coll_##cat##_description[min_coll].name : "none";\
  if(comm->rank()==0){\
      const char* global_coll_name = (global_coll!=-1) ? Colls::mpi_coll_##cat##_description[global_coll].name : "none";\
      XBT_WARN("For rank 0, the quickest was %s : %f , but global was %s : %f at max",min_coll_name, time_min,global_coll_name, max_min);\
  }else{\
      XBT_WARN("The quickest %s was %s on rank %d and took %f",#cat,min_coll_name, comm->rank(), time_min);\
  }\
  return (min_coll!=-1)?MPI_SUCCESS:MPI_ERR_INTERN;\
}
68
69 namespace simgrid{
70 namespace smpi{
71
72 COLL_APPLY(AUTOMATIC_COLL_BENCH, COLL_ALLGATHERV_SIG, (send_buff, send_count, send_type, recv_buff, recv_count, recv_disps, recv_type, comm));
73 COLL_APPLY(AUTOMATIC_COLL_BENCH, COLL_ALLREDUCE_SIG, (sbuf, rbuf, rcount, dtype, op, comm));
74 COLL_APPLY(AUTOMATIC_COLL_BENCH, COLL_GATHER_SIG, (send_buff, send_count, send_type, recv_buff, recv_count, recv_type, root, comm));
75 COLL_APPLY(AUTOMATIC_COLL_BENCH, COLL_ALLGATHER_SIG, (send_buff,send_count,send_type,recv_buff,recv_count,recv_type,comm));
76 COLL_APPLY(AUTOMATIC_COLL_BENCH, COLL_ALLTOALL_SIG,(send_buff, send_count, send_type, recv_buff, recv_count, recv_type,comm));
77 COLL_APPLY(AUTOMATIC_COLL_BENCH, COLL_ALLTOALLV_SIG, (send_buff, send_counts, send_disps, send_type, recv_buff, recv_counts, recv_disps, recv_type, comm));
78 COLL_APPLY(AUTOMATIC_COLL_BENCH, COLL_BCAST_SIG , (buf, count, datatype, root, comm));
79 COLL_APPLY(AUTOMATIC_COLL_BENCH, COLL_REDUCE_SIG,(buf,rbuf, count, datatype, op, root, comm));
80 COLL_APPLY(AUTOMATIC_COLL_BENCH, COLL_REDUCE_SCATTER_SIG ,(sbuf,rbuf, rcounts,dtype,op,comm));
81 COLL_APPLY(AUTOMATIC_COLL_BENCH, COLL_SCATTER_SIG ,(sendbuf, sendcount, sendtype,recvbuf, recvcount, recvtype,root, comm));
82 COLL_APPLY(AUTOMATIC_COLL_BENCH, COLL_BARRIER_SIG,(comm));
83
84 }
85 }