-#define AUTOMATIC_COLL_BENCH(cat, ret, args, args2)\
- ret Coll_ ## cat ## _automatic:: cat (COLL_UNPAREN args)\
-{\
- double time1, time2, time_min=DBL_MAX;\
- int min_coll=-1, global_coll=-1;\
- int i;\
- double buf_in, buf_out, max_min=DBL_MAX;\
- for (i = 0; Colls::mpi_coll_##cat##_description[i].name; i++){\
- if(!strcmp(Colls::mpi_coll_##cat##_description[i].name, "automatic"))continue;\
- if(!strcmp(Colls::mpi_coll_##cat##_description[i].name, "default"))continue;\
- Coll_barrier_default::barrier(comm);\
- TRACE_AUTO_COLL(cat)\
- time1 = SIMIX_get_clock();\
- try {\
- ((int (*) args)\
- Colls::mpi_coll_##cat##_description[i].coll) args2 ;\
- }\
- catch (std::exception& ex) {\
- continue;\
- }\
- time2 = SIMIX_get_clock();\
- buf_out=time2-time1;\
- Coll_reduce_default::reduce((void*)&buf_out,(void*)&buf_in, 1, MPI_DOUBLE, MPI_MAX, 0,comm );\
- if(time2-time1<time_min){\
- min_coll=i;\
- time_min=time2-time1;\
- }\
- if(comm->rank()==0){\
- if(buf_in<max_min){\
- max_min=buf_in;\
- global_coll=i;\
- }\
- }\
- }\
- if(comm->rank()==0){\
- XBT_WARN("For rank 0, the quickest was %s : %f , but global was %s : %f at max",Colls::mpi_coll_##cat##_description[min_coll].name, time_min,Colls::mpi_coll_##cat##_description[global_coll].name, max_min);\
- }else\
- XBT_WARN("The quickest %s was %s on rank %d and took %f",#cat,Colls::mpi_coll_##cat##_description[min_coll].name, comm->rank(), time_min);\
- return (min_coll!=-1)?MPI_SUCCESS:MPI_ERR_INTERN;\
-}
+#define AUTOMATIC_COLL_BENCH(cat, ret, args, args2) \
+ ret Coll_##cat##_automatic::cat(COLL_UNPAREN args) \
+ { \
+ double time1, time2, time_min = DBL_MAX; \
+ int min_coll = -1, global_coll = -1; \
+ int i; \
+ double buf_in, buf_out, max_min = DBL_MAX; \
+ for (i = 0; Colls::mpi_coll_##cat##_description[i].name; i++) { \
+ if (not strcmp(Colls::mpi_coll_##cat##_description[i].name, "automatic")) \
+ continue; \
+ if (not strcmp(Colls::mpi_coll_##cat##_description[i].name, "default")) \
+ continue; \
+ Coll_barrier_default::barrier(comm); \
+ TRACE_AUTO_COLL(cat) \
+ time1 = SIMIX_get_clock(); \
+ try { \
+ ((int(*) args)Colls::mpi_coll_##cat##_description[i].coll) args2; \
+ } catch (std::exception & ex) { \
+ continue; \
+ } \
+ time2 = SIMIX_get_clock(); \
+ buf_out = time2 - time1; \
+ Coll_reduce_default::reduce((void*)&buf_out, (void*)&buf_in, 1, MPI_DOUBLE, MPI_MAX, 0, comm); \
+ if (time2 - time1 < time_min) { \
+ min_coll = i; \
+ time_min = time2 - time1; \
+ } \
+ if (comm->rank() == 0) { \
+ if (buf_in < max_min) { \
+ max_min = buf_in; \
+ global_coll = i; \
+ } \
+ } \
+ } \
+ if (comm->rank() == 0) { \
+ XBT_WARN("For rank 0, the quickest was %s : %f , but global was %s : %f at max", \
+ Colls::mpi_coll_##cat##_description[min_coll].name, time_min, \
+ Colls::mpi_coll_##cat##_description[global_coll].name, max_min); \
+ } else \
+ XBT_WARN("The quickest %s was %s on rank %d and took %f", #cat, \
+ Colls::mpi_coll_##cat##_description[min_coll].name, comm->rank(), time_min); \
+ return (min_coll != -1) ? MPI_SUCCESS : MPI_ERR_INTERN; \
+ }