Logo AND Algorithmique Numérique Distribuée

Public GIT Repository
smpi: many classes died tonight, but that will save kittens in the long term.
[simgrid.git] / src / smpi / include / smpi_coll.hpp
1 /*High level handling of collective algorithms*/
2 /* Copyright (c) 2009-2019. The SimGrid Team.
3  * All rights reserved.                                                     */
4
5 /* This program is free software; you can redistribute it and/or modify it
6  * under the terms of the license (GNU LGPL) which comes with this package. */
7
8 #ifndef SMPI_COLL_HPP
9 #define SMPI_COLL_HPP
10
11 #include "private.hpp"
12 #include "xbt/base.h"
13
14 /** @brief MPI collective description */
15
/**
 * @brief Declare, inside a class body, the static members backing one collective category.
 *
 * For a category `cat` (e.g. gather) this expands to three static member declarations:
 *  - `set_<cat>(const std::string& name)`, a setter prototype taking a name,
 *  - `mpi_coll_<cat>_description[]`, an array of s_mpi_coll_description_t,
 *  - `<cat>`, a pointer to a function taking `args` and returning `ret`.
 *
 * @param cat   collective category name
 * @param ret   return type of the collective
 * @param args  parenthesised parameter list of the collective
 * @param args2 not used by this macro; it only absorbs the fourth argument supplied through COLL_APPLY
 *
 * The function pointer is declared with `ret` (not a hard-coded `int`) so that it always agrees with the
 * prototypes generated by COLL_PROTO from the same signature descriptor.
 */
#define COLL_DEFS(cat, ret, args, args2)                                                                               \
  static void _XBT_CONCAT(set_, cat)(const std::string& name);                                                         \
  static s_mpi_coll_description_t _XBT_CONCAT3(mpi_coll_, cat, _description)[];                                        \
  static ret(*cat) args;
20
/**
 * @brief Declare a static member function named `cat` with the given signature.
 *
 * @param cat   name of the function to declare
 * @param ret   return type of the function
 * @param args  parenthesised parameter list
 * @param args2 not used by this macro; it only absorbs the fourth argument supplied through COLL_APPLY
 *
 * The declaration uses `ret` (not a hard-coded `int`) so that the return type given in the signature
 * descriptor is honoured, as COLL_PROTO already does.
 */
#define COLL_SIG(cat, ret, args, args2)                                                                                \
  static ret cat args;
23
/**
 * @brief Build the brace-initializer of one s_mpi_coll_description_t table entry.
 *
 * The initializer has three items, in member order:
 *  - the stringified algorithm name,
 *  - the text "<cat> <name> collective",
 *  - the entity named by _XBT_CONCAT3(cat, __, name), converted to `void*`.
 *
 * @param cat  collective category name
 * @param ret  not used by this macro (part of the signature descriptor)
 * @param args not used by this macro (part of the signature descriptor)
 * @param name algorithm name
 *
 * A named reinterpret_cast replaces the former C-style cast: the conversion performed is the same, but it is
 * explicit and greppable.
 */
#define COLL_DESCRIPTION(cat, ret, args, name)                                                                         \
  {                                                                                                                    \
    _XBT_STRINGIFY(name)                                                                                               \
    , _XBT_STRINGIFY(cat) " " _XBT_STRINGIFY(name) " collective",                                                      \
        reinterpret_cast<void*>(_XBT_CONCAT3(cat, __, name))                                                           \
  }
29
/* Declare one collective implementation: a function returning `ret`, taking the parenthesised parameter list
 * `args`, and named by _XBT_CONCAT3(cat, __, name).
 * NOTE(review): _XBT_CONCAT3 comes from xbt/base.h (not shown here); presumably it pastes its three arguments,
 * giving names of the form <cat>__<name> -- confirm. */
30 #define COLL_PROTO(cat, ret, args, name)                                                                               \
31   ret _XBT_CONCAT3(cat, __, name) args;
32
/* Expands to its arguments unchanged; usable to strip the parentheses around a parameter list. */
33 #define COLL_UNPAREN(...)  __VA_ARGS__
34
/* Invoke `action` on a signature descriptor and an algorithm name. `sig` is one of the COLL_*_SIG macros, which
 * expand to three comma-separated items, so `action` effectively receives four arguments. */
35 #define COLL_APPLY(action, sig, name) action(sig, name)
/* Separator choices for the list macros below: a comma, or nothing at all. */
36 #define COLL_COMMA ,
37 #define COLL_NOsep
/* Swallows any arguments and expands to nothing. */
38 #define COLL_NOTHING(...)
39
/* Signature descriptors, one per collective category. Each expands to three comma-separated items -- the category
 * name, the return type and the parenthesised parameter list -- which become the first three arguments of the
 * macro invoked through COLL_APPLY. */
/* gather: rooted collective (has a `root` parameter). */
40 #define COLL_GATHER_SIG gather, int, \
41                       (const void *send_buff, int send_count, MPI_Datatype send_type, \
42                        void *recv_buff, int recv_count, MPI_Datatype recv_type, \
43                            int root, MPI_Comm comm)
/* allgather: same parameters as gather, without `root`. */
44 #define COLL_ALLGATHER_SIG allgather, int, \
45                       (const void *send_buff, int send_count, MPI_Datatype send_type, \
46                        void *recv_buff, int recv_count, MPI_Datatype recv_type, \
47                            MPI_Comm comm)
/* allgatherv: receive side described by count and displacement arrays. */
48 #define COLL_ALLGATHERV_SIG allgatherv, int, \
49                       (const void *send_buff, int send_count, MPI_Datatype send_type, \
50                        void *recv_buff, const int *recv_count, const int *recv_disps, \
51                MPI_Datatype recv_type, MPI_Comm comm)
/* alltoall: scalar send/receive counts. */
52 #define COLL_ALLTOALL_SIG alltoall, int, \
53                      (const void *send_buff, int send_count, MPI_Datatype send_type, \
54                       void *recv_buff, int recv_count, MPI_Datatype recv_type, \
55                           MPI_Comm comm)
/* alltoallv: count and displacement arrays on both the send and the receive side. */
56 #define COLL_ALLTOALLV_SIG alltoallv, int, \
57                      (const void *send_buff, const int *send_counts, const int *send_disps, MPI_Datatype send_type, \
58                       void *recv_buff, const int *recv_counts, const int *recv_disps, MPI_Datatype recv_type, \
59                           MPI_Comm comm)
/* bcast: single non-const buffer plus `root`. */
60 #define COLL_BCAST_SIG bcast, int, \
61                   (void *buf, int count, MPI_Datatype datatype, \
62                    int root, MPI_Comm comm)
/* reduce: input buffer, result buffer, operation and `root`. */
63 #define COLL_REDUCE_SIG reduce, int, \
64                    (const void *buf, void *rbuf, int count, MPI_Datatype datatype, \
65                         MPI_Op op, int root, MPI_Comm comm)
/* allreduce: like reduce, without `root`. */
66 #define COLL_ALLREDUCE_SIG allreduce, int, \
67                       (const void *sbuf, void *rbuf, int rcount, \
68                            MPI_Datatype dtype, MPI_Op op, MPI_Comm comm)
/* reduce_scatter: receive counts given as an array. */
69 #define COLL_REDUCE_SCATTER_SIG reduce_scatter, int, \
70                       (const void *sbuf, void *rbuf, const int *rcounts,\
71                     MPI_Datatype dtype,MPI_Op  op,MPI_Comm  comm)
/* scatter: rooted collective (has a `root` parameter). */
72 #define COLL_SCATTER_SIG scatter, int, \
73                 (const void *sendbuf, int sendcount, MPI_Datatype sendtype,\
74                 void *recvbuf, int recvcount, MPI_Datatype recvtype,\
75                 int root, MPI_Comm comm)
/* barrier: only takes the communicator. */
76 #define COLL_BARRIER_SIG barrier, int, \
77                 (MPI_Comm comm)
78
79 namespace simgrid{
80 namespace smpi{
81
/* One entry of a collective description table. COLL_DESCRIPTION produces initializers for this struct, filling the
 * members in declaration order. */
82 struct s_mpi_coll_description_t {
83   std::string name;         // algorithm name (COLL_DESCRIPTION stores the stringified `name` argument)
84   std::string description;  // text of the form "<cat> <name> collective" when built by COLL_DESCRIPTION
85   void *coll;               // type-erased implementation; COLL_DESCRIPTION stores the function cast to void*
86 };
87
/* Holder of the collective entry points. Every member is static: helpers working on description tables, the
 * per-category members generated by COLL_DEFS, the collectives with a single implementation, and the
 * non-blocking (i-prefixed) collectives. */
88 class Colls{
89 public:
  /* Helpers taking a description table. Their implementations are not part of this header.
   * NOTE(review): find_coll_description presumably returns the index of `name` in `table` -- confirm. */
90   static XBT_PUBLIC void coll_help(const char* category, s_mpi_coll_description_t* table);
91   static XBT_PUBLIC int find_coll_description(s_mpi_coll_description_t* table, const std::string& name,
92                                               const char* desc);
  /* NOTE(review): presumably selects the implementation of every category -- confirm in the implementation. */
93   static void set_collectives();
94
95   // for each collective type, create the set_* prototype, the description array and the function pointer
  /* The commented-out lines below show what COLL_DEFS produces for the gather category. The third COLL_APPLY
   * argument ("") only fills COLL_DEFS' unused `args2` parameter. */
96 //  static void set_gather(const std::string& name);
97 //  static s_mpi_coll_description_t mpi_coll_gather_description[];
98 //  static int(*gather)(const void *send_buff, int send_count, MPI_Datatype send_type, void *recv_buff, int recv_count, MPI_Datatype recv_type,
99 //                      int root, MPI_Comm comm);
100   COLL_APPLY(COLL_DEFS, COLL_GATHER_SIG, "")
101   COLL_APPLY(COLL_DEFS, COLL_ALLGATHER_SIG, "")
102   COLL_APPLY(COLL_DEFS, COLL_ALLGATHERV_SIG, "")
103   COLL_APPLY(COLL_DEFS, COLL_REDUCE_SIG, "")
104   COLL_APPLY(COLL_DEFS, COLL_ALLREDUCE_SIG, "")
105   COLL_APPLY(COLL_DEFS, COLL_REDUCE_SCATTER_SIG, "")
106   COLL_APPLY(COLL_DEFS, COLL_SCATTER_SIG, "")
107   COLL_APPLY(COLL_DEFS, COLL_BARRIER_SIG, "")
108   COLL_APPLY(COLL_DEFS, COLL_BCAST_SIG, "")
109   COLL_APPLY(COLL_DEFS, COLL_ALLTOALL_SIG, "")
110   COLL_APPLY(COLL_DEFS, COLL_ALLTOALLV_SIG, "")
111
112   // These rarely used collectives only have one implementation in SMPI
  /* Unlike the categories above, they are declared as plain static functions, not as function pointers. */
113   static int gatherv(const void* sendbuf, int sendcount, MPI_Datatype sendtype, void* recvbuf, const int* recvcounts, const int* displs,
114                      MPI_Datatype recvtype, int root, MPI_Comm comm);
115   static int scatterv(const void* sendbuf, const int* sendcounts, const int* displs, MPI_Datatype sendtype, void* recvbuf, int recvcount,
116                       MPI_Datatype recvtype, int root, MPI_Comm comm);
117   static int scan(const void* sendbuf, void* recvbuf, int count, MPI_Datatype datatype, MPI_Op op, MPI_Comm comm);
118   static int exscan(const void* sendbuf, void* recvbuf, int count, MPI_Datatype datatype, MPI_Op op, MPI_Comm comm);
119   static int alltoallw
120          (const void* sendbuf, const int* sendcounts, const int* senddisps, const MPI_Datatype* sendtypes, void* recvbuf, const int* recvcounts,
121           const int* recvdisps, const MPI_Datatype* recvtypes, MPI_Comm comm);
122
123   //async collectives
  /* Each of these takes, after the communicator, an MPI_Request* and an `external` flag defaulting to 1.
   * NOTE(review): the meaning of `external` is not visible in this header -- confirm in the implementation. */
124   static int ibarrier(MPI_Comm comm, MPI_Request* request, int external=1);
125   static int ibcast(void *buf, int count, MPI_Datatype datatype, 
126                    int root, MPI_Comm comm, MPI_Request* request, int external=1);
127   static int igather (const void* sendbuf, int sendcount, MPI_Datatype sendtype, void* recvbuf, int recvcount,
128                                       MPI_Datatype recvtype, int root, MPI_Comm comm, MPI_Request *request, int external=1);
129   static int igatherv (const void* sendbuf, int sendcount, MPI_Datatype sendtype, void* recvbuf,
130                                        const int* recvcounts, const int* displs, MPI_Datatype recvtype, int root, MPI_Comm comm, MPI_Request *request, int external=1);
131   static int iallgather (const void* sendbuf, int sendcount, MPI_Datatype sendtype, void* recvbuf,
132                                          int recvcount, MPI_Datatype recvtype, MPI_Comm comm, MPI_Request *request, int external=1);
133   static int iallgatherv (const void* sendbuf, int sendcount, MPI_Datatype sendtype, void* recvbuf,
134                                           const int* recvcounts, const int* displs, MPI_Datatype recvtype, MPI_Comm comm, MPI_Request *request, int external=1);
135   static int iscatter (const void* sendbuf, int sendcount, MPI_Datatype sendtype, void* recvbuf,
136                                        int recvcount, MPI_Datatype recvtype, int root, MPI_Comm comm, MPI_Request *request, int external=1);
137   static int iscatterv (const void* sendbuf, const int* sendcounts, const int* displs, MPI_Datatype sendtype,
138                                         void* recvbuf, int recvcount, MPI_Datatype recvtype, int root, MPI_Comm comm, MPI_Request *request, int external=1);
139   static int ireduce
140          (const void* sendbuf, void* recvbuf, int count, MPI_Datatype datatype, MPI_Op op, int root, MPI_Comm comm, MPI_Request *request, int external=1);
141   static int iallreduce
142          (const void* sendbuf, void* recvbuf, int count, MPI_Datatype datatype, MPI_Op op, MPI_Comm comm, MPI_Request *request, int external=1);
143   static int iscan
144          (const void* sendbuf, void* recvbuf, int count, MPI_Datatype datatype, MPI_Op op, MPI_Comm comm, MPI_Request *request, int external=1);
145   static int iexscan
146          (const void* sendbuf, void* recvbuf, int count, MPI_Datatype datatype, MPI_Op op, MPI_Comm comm, MPI_Request *request, int external=1);
147   static int ireduce_scatter
148          (const void* sendbuf, void* recvbuf, const int* recvcounts, MPI_Datatype datatype, MPI_Op op, MPI_Comm comm, MPI_Request *request, int external=1);
149   static int ireduce_scatter_block
150          (const void* sendbuf, void* recvbuf, int recvcount, MPI_Datatype datatype, MPI_Op op, MPI_Comm comm, MPI_Request *request, int external=1);
151   static int ialltoall (const void* sendbuf, int sendcount, MPI_Datatype sendtype, void* recvbuf,
152                                         int recvcount, MPI_Datatype recvtype, MPI_Comm comm, MPI_Request *request, int external=1);
153   static int ialltoallv
154          (const void* sendbuf, const int* sendcounts, const int* senddisps, MPI_Datatype sendtype, void* recvbuf, const int* recvcounts,
155           const int* recvdisps, MPI_Datatype recvtype, MPI_Comm comm, MPI_Request *request, int external=1);
156   static int ialltoallw
157          (const void* sendbuf, const int* sendcounts, const int* senddisps, const MPI_Datatype* sendtypes, void* recvbuf, const int* recvcounts,
158           const int* recvdisps, const MPI_Datatype* recvtypes, MPI_Comm comm, MPI_Request *request, int external=1);
159
160
  /* Pointer to a function taking no argument and returning nothing.
   * NOTE(review): presumably called to release state left by a collective -- confirm where it is set and invoked. */
161   static void (*smpi_coll_cleanup_callback)();
162 };
163
164 /*************
165  * GATHER *
166  *************/
167
/* List of the gather algorithms. `action` is applied once per algorithm (through COLL_APPLY, with the gather
 * signature descriptor and the algorithm name); `COLL_sep` is placed between consecutive entries, not after the
 * last one. */
168 #define COLL_GATHERS(action, COLL_sep) \
169 COLL_APPLY(action, COLL_GATHER_SIG, default) COLL_sep \
170 COLL_APPLY(action, COLL_GATHER_SIG, ompi) COLL_sep \
171 COLL_APPLY(action, COLL_GATHER_SIG, ompi_basic_linear) COLL_sep \
172 COLL_APPLY(action, COLL_GATHER_SIG, ompi_binomial) COLL_sep \
173 COLL_APPLY(action, COLL_GATHER_SIG, ompi_linear_sync) COLL_sep \
174 COLL_APPLY(action, COLL_GATHER_SIG, mpich) COLL_sep \
175 COLL_APPLY(action, COLL_GATHER_SIG, mvapich2) COLL_sep \
176 COLL_APPLY(action, COLL_GATHER_SIG, mvapich2_two_level) COLL_sep \
177 COLL_APPLY(action, COLL_GATHER_SIG, impi) COLL_sep \
178 COLL_APPLY(action, COLL_GATHER_SIG, automatic)
179
/* Emit one COLL_PROTO prototype per gather algorithm; declarations need no separator. */
180 COLL_GATHERS(COLL_PROTO, COLL_NOsep)
181
182 /*************
183  * ALLGATHER *
184  *************/
185
/* List of the allgather algorithms. `action` is applied once per algorithm (through COLL_APPLY, with the allgather
 * signature descriptor and the algorithm name); `COLL_sep` is placed between consecutive entries, not after the
 * last one. */
186 #define COLL_ALLGATHERS(action, COLL_sep) \
187 COLL_APPLY(action, COLL_ALLGATHER_SIG, default) COLL_sep \
188 COLL_APPLY(action, COLL_ALLGATHER_SIG, 2dmesh) COLL_sep \
189 COLL_APPLY(action, COLL_ALLGATHER_SIG, 3dmesh) COLL_sep \
190 COLL_APPLY(action, COLL_ALLGATHER_SIG, bruck) COLL_sep \
191 COLL_APPLY(action, COLL_ALLGATHER_SIG, GB) COLL_sep \
192 COLL_APPLY(action, COLL_ALLGATHER_SIG, loosely_lr) COLL_sep \
193 COLL_APPLY(action, COLL_ALLGATHER_SIG, NTSLR) COLL_sep \
194 COLL_APPLY(action, COLL_ALLGATHER_SIG, NTSLR_NB) COLL_sep \
195 COLL_APPLY(action, COLL_ALLGATHER_SIG, pair) COLL_sep \
196 COLL_APPLY(action, COLL_ALLGATHER_SIG, rdb) COLL_sep \
197 COLL_APPLY(action, COLL_ALLGATHER_SIG, rhv) COLL_sep \
198 COLL_APPLY(action, COLL_ALLGATHER_SIG, ring) COLL_sep \
199 COLL_APPLY(action, COLL_ALLGATHER_SIG, SMP_NTS) COLL_sep \
200 COLL_APPLY(action, COLL_ALLGATHER_SIG, smp_simple) COLL_sep \
201 COLL_APPLY(action, COLL_ALLGATHER_SIG, spreading_simple) COLL_sep \
202 COLL_APPLY(action, COLL_ALLGATHER_SIG, ompi) COLL_sep \
203 COLL_APPLY(action, COLL_ALLGATHER_SIG, ompi_neighborexchange) COLL_sep \
204 COLL_APPLY(action, COLL_ALLGATHER_SIG, mvapich2) COLL_sep \
205 COLL_APPLY(action, COLL_ALLGATHER_SIG, mvapich2_smp) COLL_sep \
206 COLL_APPLY(action, COLL_ALLGATHER_SIG, mpich) COLL_sep \
207 COLL_APPLY(action, COLL_ALLGATHER_SIG, impi) COLL_sep \
208 COLL_APPLY(action, COLL_ALLGATHER_SIG, automatic)
209
/* Emit one COLL_PROTO prototype per allgather algorithm; declarations need no separator. */
210 COLL_ALLGATHERS(COLL_PROTO, COLL_NOsep)
211
212 /**************
213  * ALLGATHERV *
214  **************/
215
/* List of the allgatherv algorithms. `action` is applied once per algorithm (through COLL_APPLY, with the
 * allgatherv signature descriptor and the algorithm name); `COLL_sep` is placed between consecutive entries, not
 * after the last one. */
216 #define COLL_ALLGATHERVS(action, COLL_sep) \
217 COLL_APPLY(action, COLL_ALLGATHERV_SIG, default) COLL_sep \
218 COLL_APPLY(action, COLL_ALLGATHERV_SIG, GB) COLL_sep \
219 COLL_APPLY(action, COLL_ALLGATHERV_SIG, pair) COLL_sep \
220 COLL_APPLY(action, COLL_ALLGATHERV_SIG, ring) COLL_sep \
221 COLL_APPLY(action, COLL_ALLGATHERV_SIG, ompi) COLL_sep \
222 COLL_APPLY(action, COLL_ALLGATHERV_SIG, ompi_neighborexchange) COLL_sep \
223 COLL_APPLY(action, COLL_ALLGATHERV_SIG, ompi_bruck) COLL_sep \
224 COLL_APPLY(action, COLL_ALLGATHERV_SIG, mpich) COLL_sep \
225 COLL_APPLY(action, COLL_ALLGATHERV_SIG, mpich_rdb) COLL_sep \
226 COLL_APPLY(action, COLL_ALLGATHERV_SIG, mpich_ring) COLL_sep \
227 COLL_APPLY(action, COLL_ALLGATHERV_SIG, mvapich2) COLL_sep \
228 COLL_APPLY(action, COLL_ALLGATHERV_SIG, impi) COLL_sep \
229 COLL_APPLY(action, COLL_ALLGATHERV_SIG, automatic)
230
/* Emit one COLL_PROTO prototype per allgatherv algorithm; declarations need no separator. */
231 COLL_ALLGATHERVS(COLL_PROTO, COLL_NOsep)
232
233 /*************
234  * ALLREDUCE *
235  *************/
236
/* List of the allreduce algorithms. `action` is applied once per algorithm (through COLL_APPLY, with the allreduce
 * signature descriptor and the algorithm name); `COLL_sep` is placed between consecutive entries, not after the
 * last one. */
237 #define COLL_ALLREDUCES(action, COLL_sep) \
238 COLL_APPLY(action, COLL_ALLREDUCE_SIG, default) COLL_sep \
239 COLL_APPLY(action, COLL_ALLREDUCE_SIG, lr) COLL_sep \
240 COLL_APPLY(action, COLL_ALLREDUCE_SIG, rab1) COLL_sep \
241 COLL_APPLY(action, COLL_ALLREDUCE_SIG, rab2) COLL_sep \
242 COLL_APPLY(action, COLL_ALLREDUCE_SIG, rab_rdb) COLL_sep \
243 COLL_APPLY(action, COLL_ALLREDUCE_SIG, rdb) COLL_sep \
244 COLL_APPLY(action, COLL_ALLREDUCE_SIG, smp_binomial) COLL_sep \
245 COLL_APPLY(action, COLL_ALLREDUCE_SIG, smp_binomial_pipeline) COLL_sep \
246 COLL_APPLY(action, COLL_ALLREDUCE_SIG, smp_rdb) COLL_sep \
247 COLL_APPLY(action, COLL_ALLREDUCE_SIG, smp_rsag) COLL_sep \
248 COLL_APPLY(action, COLL_ALLREDUCE_SIG, smp_rsag_lr) COLL_sep \
249 COLL_APPLY(action, COLL_ALLREDUCE_SIG, smp_rsag_rab) COLL_sep \
250 COLL_APPLY(action, COLL_ALLREDUCE_SIG, redbcast) COLL_sep \
251 COLL_APPLY(action, COLL_ALLREDUCE_SIG, ompi) COLL_sep \
252 COLL_APPLY(action, COLL_ALLREDUCE_SIG, ompi_ring_segmented) COLL_sep \
253 COLL_APPLY(action, COLL_ALLREDUCE_SIG, mpich) COLL_sep \
254 COLL_APPLY(action, COLL_ALLREDUCE_SIG, mvapich2) COLL_sep \
255 COLL_APPLY(action, COLL_ALLREDUCE_SIG, mvapich2_rs) COLL_sep \
256 COLL_APPLY(action, COLL_ALLREDUCE_SIG, mvapich2_two_level) COLL_sep \
257 COLL_APPLY(action, COLL_ALLREDUCE_SIG, impi) COLL_sep \
258 COLL_APPLY(action, COLL_ALLREDUCE_SIG, rab) COLL_sep \
259 COLL_APPLY(action, COLL_ALLREDUCE_SIG, automatic)
260
/* Emit one COLL_PROTO prototype per allreduce algorithm; declarations need no separator. */
261 COLL_ALLREDUCES(COLL_PROTO, COLL_NOsep)
262
263 /************
264  * ALLTOALL *
265  ************/
266
/* List of the alltoall algorithms. `action` is applied once per algorithm (through COLL_APPLY, with the alltoall
 * signature descriptor and the algorithm name); `COLL_sep` is placed between consecutive entries, not after the
 * last one. */
267 #define COLL_ALLTOALLS(action, COLL_sep) \
268 COLL_APPLY(action, COLL_ALLTOALL_SIG, default) COLL_sep \
269 COLL_APPLY(action, COLL_ALLTOALL_SIG, 2dmesh) COLL_sep \
270 COLL_APPLY(action, COLL_ALLTOALL_SIG, 3dmesh) COLL_sep \
271 COLL_APPLY(action, COLL_ALLTOALL_SIG, basic_linear) COLL_sep \
272 COLL_APPLY(action, COLL_ALLTOALL_SIG, bruck) COLL_sep \
273 COLL_APPLY(action, COLL_ALLTOALL_SIG, pair) COLL_sep \
274 COLL_APPLY(action, COLL_ALLTOALL_SIG, pair_rma) COLL_sep \
275 COLL_APPLY(action, COLL_ALLTOALL_SIG, pair_light_barrier) COLL_sep \
276 COLL_APPLY(action, COLL_ALLTOALL_SIG, pair_mpi_barrier) COLL_sep \
277 COLL_APPLY(action, COLL_ALLTOALL_SIG, pair_one_barrier) COLL_sep \
278 COLL_APPLY(action, COLL_ALLTOALL_SIG, rdb) COLL_sep \
279 COLL_APPLY(action, COLL_ALLTOALL_SIG, ring) COLL_sep \
280 COLL_APPLY(action, COLL_ALLTOALL_SIG, ring_light_barrier) COLL_sep \
281 COLL_APPLY(action, COLL_ALLTOALL_SIG, ring_mpi_barrier) COLL_sep \
282 COLL_APPLY(action, COLL_ALLTOALL_SIG, ring_one_barrier) COLL_sep \
283 COLL_APPLY(action, COLL_ALLTOALL_SIG, mvapich2) COLL_sep \
284 COLL_APPLY(action, COLL_ALLTOALL_SIG, mvapich2_scatter_dest) COLL_sep \
285 COLL_APPLY(action, COLL_ALLTOALL_SIG, ompi) COLL_sep \
286 COLL_APPLY(action, COLL_ALLTOALL_SIG, mpich) COLL_sep \
287 COLL_APPLY(action, COLL_ALLTOALL_SIG, impi) COLL_sep \
288 COLL_APPLY(action, COLL_ALLTOALL_SIG, automatic)
289
/* Emit one COLL_PROTO prototype per alltoall algorithm; declarations need no separator. */
290 COLL_ALLTOALLS(COLL_PROTO, COLL_NOsep)
291
292 /*************
293  * ALLTOALLV *
294  *************/
295
/* List of the alltoallv algorithms. `action` is applied once per algorithm (through COLL_APPLY, with the alltoallv
 * signature descriptor and the algorithm name); `COLL_sep` is placed between consecutive entries, not after the
 * last one. */
296 #define COLL_ALLTOALLVS(action, COLL_sep) \
297 COLL_APPLY(action, COLL_ALLTOALLV_SIG, default) COLL_sep \
298 COLL_APPLY(action, COLL_ALLTOALLV_SIG, bruck) COLL_sep \
299 COLL_APPLY(action, COLL_ALLTOALLV_SIG, pair) COLL_sep \
300 COLL_APPLY(action, COLL_ALLTOALLV_SIG, pair_light_barrier) COLL_sep \
301 COLL_APPLY(action, COLL_ALLTOALLV_SIG, pair_mpi_barrier) COLL_sep \
302 COLL_APPLY(action, COLL_ALLTOALLV_SIG, pair_one_barrier) COLL_sep \
303 COLL_APPLY(action, COLL_ALLTOALLV_SIG, ring) COLL_sep \
304 COLL_APPLY(action, COLL_ALLTOALLV_SIG, ring_light_barrier) COLL_sep \
305 COLL_APPLY(action, COLL_ALLTOALLV_SIG, ring_mpi_barrier) COLL_sep \
306 COLL_APPLY(action, COLL_ALLTOALLV_SIG, ring_one_barrier) COLL_sep \
307 COLL_APPLY(action, COLL_ALLTOALLV_SIG, ompi) COLL_sep \
308 COLL_APPLY(action, COLL_ALLTOALLV_SIG, mpich) COLL_sep \
309 COLL_APPLY(action, COLL_ALLTOALLV_SIG, ompi_basic_linear) COLL_sep \
310 COLL_APPLY(action, COLL_ALLTOALLV_SIG, mvapich2) COLL_sep \
311 COLL_APPLY(action, COLL_ALLTOALLV_SIG, impi) COLL_sep \
312 COLL_APPLY(action, COLL_ALLTOALLV_SIG, automatic)
313
/* Emit one COLL_PROTO prototype per alltoallv algorithm; declarations need no separator. */
314 COLL_ALLTOALLVS(COLL_PROTO, COLL_NOsep)
315
316 /*********
317  * BCAST *
318  *********/
319
/* List of the bcast algorithms. `action` is applied once per algorithm (through COLL_APPLY, with the bcast
 * signature descriptor and the algorithm name); `COLL_sep` is placed between consecutive entries, not after the
 * last one. */
320 #define COLL_BCASTS(action, COLL_sep) \
321 COLL_APPLY(action, COLL_BCAST_SIG, default) COLL_sep \
322 COLL_APPLY(action, COLL_BCAST_SIG, arrival_pattern_aware) COLL_sep \
323 COLL_APPLY(action, COLL_BCAST_SIG, arrival_pattern_aware_wait) COLL_sep \
324 COLL_APPLY(action, COLL_BCAST_SIG, arrival_scatter) COLL_sep \
325 COLL_APPLY(action, COLL_BCAST_SIG, binomial_tree) COLL_sep \
326 COLL_APPLY(action, COLL_BCAST_SIG, flattree) COLL_sep \
327 COLL_APPLY(action, COLL_BCAST_SIG, flattree_pipeline) COLL_sep \
328 COLL_APPLY(action, COLL_BCAST_SIG, NTSB) COLL_sep \
329 COLL_APPLY(action, COLL_BCAST_SIG, NTSL) COLL_sep \
330 COLL_APPLY(action, COLL_BCAST_SIG, NTSL_Isend) COLL_sep \
331 COLL_APPLY(action, COLL_BCAST_SIG, scatter_LR_allgather) COLL_sep \
332 COLL_APPLY(action, COLL_BCAST_SIG, scatter_rdb_allgather) COLL_sep \
333 COLL_APPLY(action, COLL_BCAST_SIG, SMP_binary) COLL_sep \
334 COLL_APPLY(action, COLL_BCAST_SIG, SMP_binomial) COLL_sep \
335 COLL_APPLY(action, COLL_BCAST_SIG, SMP_linear) COLL_sep \
336 COLL_APPLY(action, COLL_BCAST_SIG, ompi) COLL_sep \
337 COLL_APPLY(action, COLL_BCAST_SIG, ompi_split_bintree) COLL_sep \
338 COLL_APPLY(action, COLL_BCAST_SIG, ompi_pipeline) COLL_sep \
339 COLL_APPLY(action, COLL_BCAST_SIG, mpich) COLL_sep \
340 COLL_APPLY(action, COLL_BCAST_SIG, mvapich2)   COLL_sep \
341 COLL_APPLY(action, COLL_BCAST_SIG, mvapich2_inter_node)   COLL_sep \
342 COLL_APPLY(action, COLL_BCAST_SIG, mvapich2_intra_node)   COLL_sep \
343 COLL_APPLY(action, COLL_BCAST_SIG, mvapich2_knomial_intra_node)   COLL_sep \
344 COLL_APPLY(action, COLL_BCAST_SIG, impi)   COLL_sep \
345 COLL_APPLY(action, COLL_BCAST_SIG, automatic)
346
/* Emit one COLL_PROTO prototype per bcast algorithm; declarations need no separator. */
347 COLL_BCASTS(COLL_PROTO, COLL_NOsep)
348
349 /**********
350  * REDUCE *
351  **********/
352
/* List of the reduce algorithms. `action` is applied once per algorithm (through COLL_APPLY, with the reduce
 * signature descriptor and the algorithm name); `COLL_sep` is placed between consecutive entries, not after the
 * last one. */
353 #define COLL_REDUCES(action, COLL_sep) \
354 COLL_APPLY(action, COLL_REDUCE_SIG, default) COLL_sep \
355 COLL_APPLY(action, COLL_REDUCE_SIG, arrival_pattern_aware) COLL_sep \
356 COLL_APPLY(action, COLL_REDUCE_SIG, binomial) COLL_sep \
357 COLL_APPLY(action, COLL_REDUCE_SIG, flat_tree) COLL_sep \
358 COLL_APPLY(action, COLL_REDUCE_SIG, NTSL) COLL_sep \
359 COLL_APPLY(action, COLL_REDUCE_SIG, scatter_gather) COLL_sep \
360 COLL_APPLY(action, COLL_REDUCE_SIG, ompi) COLL_sep \
361 COLL_APPLY(action, COLL_REDUCE_SIG, ompi_chain) COLL_sep \
362 COLL_APPLY(action, COLL_REDUCE_SIG, ompi_pipeline) COLL_sep \
363 COLL_APPLY(action, COLL_REDUCE_SIG, ompi_basic_linear) COLL_sep \
364 COLL_APPLY(action, COLL_REDUCE_SIG, ompi_in_order_binary) COLL_sep \
365 COLL_APPLY(action, COLL_REDUCE_SIG, ompi_binary) COLL_sep \
366 COLL_APPLY(action, COLL_REDUCE_SIG, ompi_binomial) COLL_sep \
367 COLL_APPLY(action, COLL_REDUCE_SIG, mpich) COLL_sep \
368 COLL_APPLY(action, COLL_REDUCE_SIG, mvapich2) COLL_sep \
369 COLL_APPLY(action, COLL_REDUCE_SIG, mvapich2_knomial) COLL_sep \
370 COLL_APPLY(action, COLL_REDUCE_SIG, mvapich2_two_level) COLL_sep \
371 COLL_APPLY(action, COLL_REDUCE_SIG, impi) COLL_sep \
372 COLL_APPLY(action, COLL_REDUCE_SIG, rab) COLL_sep \
373 COLL_APPLY(action, COLL_REDUCE_SIG, automatic)
374
/* Emit one COLL_PROTO prototype per reduce algorithm; declarations need no separator. */
375 COLL_REDUCES(COLL_PROTO, COLL_NOsep)
376
377 /*************
378  * REDUCE_SCATTER *
379  *************/
380
/* List of the reduce_scatter algorithms. `action` is applied once per algorithm (through COLL_APPLY, with the
 * reduce_scatter signature descriptor and the algorithm name); `COLL_sep` is placed between consecutive entries,
 * not after the last one. */
381 #define COLL_REDUCE_SCATTERS(action, COLL_sep) \
382 COLL_APPLY(action, COLL_REDUCE_SCATTER_SIG, default) COLL_sep \
383 COLL_APPLY(action, COLL_REDUCE_SCATTER_SIG, ompi) COLL_sep \
384 COLL_APPLY(action, COLL_REDUCE_SCATTER_SIG, ompi_basic_recursivehalving) COLL_sep \
385 COLL_APPLY(action, COLL_REDUCE_SCATTER_SIG, ompi_ring)  COLL_sep \
386 COLL_APPLY(action, COLL_REDUCE_SCATTER_SIG, mpich) COLL_sep \
387 COLL_APPLY(action, COLL_REDUCE_SCATTER_SIG, mpich_pair) COLL_sep \
388 COLL_APPLY(action, COLL_REDUCE_SCATTER_SIG, mpich_rdb) COLL_sep \
389 COLL_APPLY(action, COLL_REDUCE_SCATTER_SIG, mpich_noncomm) COLL_sep \
390 COLL_APPLY(action, COLL_REDUCE_SCATTER_SIG, mvapich2) COLL_sep \
391 COLL_APPLY(action, COLL_REDUCE_SCATTER_SIG, impi) COLL_sep \
392 COLL_APPLY(action, COLL_REDUCE_SCATTER_SIG, automatic)
393
/* Emit one COLL_PROTO prototype per reduce_scatter algorithm; declarations need no separator. */
394 COLL_REDUCE_SCATTERS(COLL_PROTO, COLL_NOsep)
395
396 /*************
397  * SCATTER *
398  *************/
399
/* List of the scatter algorithms. `action` is applied once per algorithm (through COLL_APPLY, with the scatter
 * signature descriptor and the algorithm name); `COLL_sep` is placed between consecutive entries, not after the
 * last one. */
400 #define COLL_SCATTERS(action, COLL_sep) \
401 COLL_APPLY(action, COLL_SCATTER_SIG, default) COLL_sep \
402 COLL_APPLY(action, COLL_SCATTER_SIG, ompi) COLL_sep \
403 COLL_APPLY(action, COLL_SCATTER_SIG, ompi_basic_linear) COLL_sep \
404 COLL_APPLY(action, COLL_SCATTER_SIG, ompi_binomial)  COLL_sep \
405 COLL_APPLY(action, COLL_SCATTER_SIG, mpich)   COLL_sep \
406 COLL_APPLY(action, COLL_SCATTER_SIG, mvapich2)   COLL_sep \
407 COLL_APPLY(action, COLL_SCATTER_SIG, mvapich2_two_level_binomial)   COLL_sep \
408 COLL_APPLY(action, COLL_SCATTER_SIG, mvapich2_two_level_direct)   COLL_sep \
409 COLL_APPLY(action, COLL_SCATTER_SIG, impi)   COLL_sep \
410 COLL_APPLY(action, COLL_SCATTER_SIG, automatic)
411
/* Emit one COLL_PROTO prototype per scatter algorithm; declarations need no separator. */
412 COLL_SCATTERS(COLL_PROTO, COLL_NOsep)
413
414 /*************
415  * BARRIER *
416  *************/
417
/* List of the barrier algorithms. `action` is applied once per algorithm (through COLL_APPLY, with the barrier
 * signature descriptor and the algorithm name); `COLL_sep` is placed between consecutive entries, not after the
 * last one. */
418 #define COLL_BARRIERS(action, COLL_sep) \
419 COLL_APPLY(action, COLL_BARRIER_SIG, default) COLL_sep \
420 COLL_APPLY(action, COLL_BARRIER_SIG, ompi) COLL_sep \
421 COLL_APPLY(action, COLL_BARRIER_SIG, ompi_basic_linear) COLL_sep \
422 COLL_APPLY(action, COLL_BARRIER_SIG, ompi_two_procs)  COLL_sep \
423 COLL_APPLY(action, COLL_BARRIER_SIG, ompi_tree)  COLL_sep \
424 COLL_APPLY(action, COLL_BARRIER_SIG, ompi_bruck)  COLL_sep \
425 COLL_APPLY(action, COLL_BARRIER_SIG, ompi_recursivedoubling) COLL_sep \
426 COLL_APPLY(action, COLL_BARRIER_SIG, ompi_doublering) COLL_sep \
427 COLL_APPLY(action, COLL_BARRIER_SIG, mpich_smp)   COLL_sep \
428 COLL_APPLY(action, COLL_BARRIER_SIG, mpich)   COLL_sep \
429 COLL_APPLY(action, COLL_BARRIER_SIG, mvapich2_pair)   COLL_sep \
430 COLL_APPLY(action, COLL_BARRIER_SIG, mvapich2)   COLL_sep \
431 COLL_APPLY(action, COLL_BARRIER_SIG, impi)   COLL_sep \
432 COLL_APPLY(action, COLL_BARRIER_SIG, automatic)
433
/* Emit one COLL_PROTO prototype per barrier algorithm; declarations need no separator. */
434 COLL_BARRIERS(COLL_PROTO, COLL_NOsep)
435
436 }
437 }
438 #endif