X-Git-Url: http://info.iut-bm.univ-fcomte.fr/pub/gitweb/simgrid.git/blobdiff_plain/9f4593d014139381fd8977a84e76f0094fb2fac8..4bb593c5dd46c9fa83345dc65903620c917317df:/src/smpi/colls/colls.h diff --git a/src/smpi/colls/colls.h b/src/smpi/colls/colls.h index 4495b4d9ba..be58707f4f 100644 --- a/src/smpi/colls/colls.h +++ b/src/smpi/colls/colls.h @@ -1,15 +1,24 @@ +/* Copyright (c) 2013-2014. The SimGrid Team. + * All rights reserved. */ + +/* This program is free software; you can redistribute it and/or modify it + * under the terms of the license (GNU LGPL) which comes with this package. */ + #ifndef SMPI_COLLS_H #define SMPI_COLLS_H #include #include "smpi/mpi.h" -#include "smpi/private.h" +#include "src/smpi/private.h" +#include "xbt/ex.h" #include "xbt.h" +SG_BEGIN_DECL() + #define COLL_DESCRIPTION(cat, ret, args, name) \ {# name,\ # cat " " # name " collective",\ - smpi_coll_tuned_ ## cat ## _ ## name} + (void*)smpi_coll_tuned_ ## cat ## _ ## name} #define COLL_PROTO(cat, ret, args, name) \ ret smpi_coll_tuned_ ## cat ## _ ## name(COLL_UNPAREN args); @@ -32,7 +41,13 @@ COLL_APPLY(action, COLL_GATHER_SIG, ompi) COLL_sep \ COLL_APPLY(action, COLL_GATHER_SIG, ompi_basic_linear) COLL_sep \ COLL_APPLY(action, COLL_GATHER_SIG, ompi_binomial) COLL_sep \ -COLL_APPLY(action, COLL_GATHER_SIG, ompi_linear_sync) \ +COLL_APPLY(action, COLL_GATHER_SIG, ompi_linear_sync) COLL_sep \ +COLL_APPLY(action, COLL_GATHER_SIG, mpich) COLL_sep \ +COLL_APPLY(action, COLL_GATHER_SIG, mvapich2) COLL_sep \ +COLL_APPLY(action, COLL_GATHER_SIG, mvapich2_two_level) COLL_sep \ +COLL_APPLY(action, COLL_GATHER_SIG, impi) COLL_sep \ +COLL_APPLY(action, COLL_GATHER_SIG, automatic) + COLL_GATHERS(COLL_PROTO, COLL_NOsep) @@ -51,7 +66,6 @@ COLL_APPLY(action, COLL_ALLGATHER_SIG, 3dmesh) COLL_sep \ COLL_APPLY(action, COLL_ALLGATHER_SIG, bruck) COLL_sep \ COLL_APPLY(action, COLL_ALLGATHER_SIG, GB) COLL_sep \ COLL_APPLY(action, COLL_ALLGATHER_SIG, loosely_lr) COLL_sep \ -COLL_APPLY(action, 
COLL_ALLGATHER_SIG, lr) COLL_sep \ COLL_APPLY(action, COLL_ALLGATHER_SIG, NTSLR) COLL_sep \ COLL_APPLY(action, COLL_ALLGATHER_SIG, NTSLR_NB) COLL_sep \ COLL_APPLY(action, COLL_ALLGATHER_SIG, pair) COLL_sep \ @@ -62,7 +76,13 @@ COLL_APPLY(action, COLL_ALLGATHER_SIG, SMP_NTS) COLL_sep \ COLL_APPLY(action, COLL_ALLGATHER_SIG, smp_simple) COLL_sep \ COLL_APPLY(action, COLL_ALLGATHER_SIG, spreading_simple) COLL_sep \ COLL_APPLY(action, COLL_ALLGATHER_SIG, ompi) COLL_sep \ -COLL_APPLY(action, COLL_ALLGATHER_SIG, ompi_neighborexchange) +COLL_APPLY(action, COLL_ALLGATHER_SIG, ompi_neighborexchange) COLL_sep \ +COLL_APPLY(action, COLL_ALLGATHER_SIG, mvapich2) COLL_sep \ +COLL_APPLY(action, COLL_ALLGATHER_SIG, mvapich2_smp) COLL_sep \ +COLL_APPLY(action, COLL_ALLGATHER_SIG, mpich) COLL_sep \ +COLL_APPLY(action, COLL_ALLGATHER_SIG, impi) COLL_sep \ +COLL_APPLY(action, COLL_ALLGATHER_SIG, automatic) + COLL_ALLGATHERS(COLL_PROTO, COLL_NOsep) @@ -79,7 +99,14 @@ COLL_APPLY(action, COLL_ALLGATHERV_SIG, GB) COLL_sep \ COLL_APPLY(action, COLL_ALLGATHERV_SIG, pair) COLL_sep \ COLL_APPLY(action, COLL_ALLGATHERV_SIG, ring) COLL_sep \ COLL_APPLY(action, COLL_ALLGATHERV_SIG, ompi) COLL_sep \ -COLL_APPLY(action, COLL_ALLGATHERV_SIG, ompi_neighborexchange) +COLL_APPLY(action, COLL_ALLGATHERV_SIG, ompi_neighborexchange) COLL_sep \ +COLL_APPLY(action, COLL_ALLGATHERV_SIG, ompi_bruck) COLL_sep \ +COLL_APPLY(action, COLL_ALLGATHERV_SIG, mpich) COLL_sep \ +COLL_APPLY(action, COLL_ALLGATHERV_SIG, mpich_rdb) COLL_sep \ +COLL_APPLY(action, COLL_ALLGATHERV_SIG, mpich_ring) COLL_sep \ +COLL_APPLY(action, COLL_ALLGATHERV_SIG, mvapich2) COLL_sep \ +COLL_APPLY(action, COLL_ALLGATHERV_SIG, impi) COLL_sep \ +COLL_APPLY(action, COLL_ALLGATHERV_SIG, automatic) COLL_ALLGATHERVS(COLL_PROTO, COLL_NOsep) @@ -92,12 +119,9 @@ COLL_ALLGATHERVS(COLL_PROTO, COLL_NOsep) #define COLL_ALLREDUCES(action, COLL_sep) \ COLL_APPLY(action, COLL_ALLREDUCE_SIG, lr) COLL_sep \ -COLL_APPLY(action, COLL_ALLREDUCE_SIG, NTS) 
COLL_sep \ COLL_APPLY(action, COLL_ALLREDUCE_SIG, rab1) COLL_sep \ COLL_APPLY(action, COLL_ALLREDUCE_SIG, rab2) COLL_sep \ COLL_APPLY(action, COLL_ALLREDUCE_SIG, rab_rdb) COLL_sep \ -COLL_NOTHING(COLL_APPLY(action, COLL_ALLREDUCE_SIG, rab_reduce_scatter) COLL_sep) \ -COLL_APPLY(action, COLL_ALLREDUCE_SIG, rab_rsag) COLL_sep \ COLL_APPLY(action, COLL_ALLREDUCE_SIG, rdb) COLL_sep \ COLL_APPLY(action, COLL_ALLREDUCE_SIG, smp_binomial) COLL_sep \ COLL_APPLY(action, COLL_ALLREDUCE_SIG, smp_binomial_pipeline) COLL_sep \ @@ -107,7 +131,14 @@ COLL_APPLY(action, COLL_ALLREDUCE_SIG, smp_rsag_lr) COLL_sep \ COLL_APPLY(action, COLL_ALLREDUCE_SIG, smp_rsag_rab) COLL_sep \ COLL_APPLY(action, COLL_ALLREDUCE_SIG, redbcast) COLL_sep \ COLL_APPLY(action, COLL_ALLREDUCE_SIG, ompi) COLL_sep \ -COLL_APPLY(action, COLL_ALLREDUCE_SIG, ompi_ring_segmented) +COLL_APPLY(action, COLL_ALLREDUCE_SIG, ompi_ring_segmented) COLL_sep \ +COLL_APPLY(action, COLL_ALLREDUCE_SIG, mpich) COLL_sep \ +COLL_APPLY(action, COLL_ALLREDUCE_SIG, mvapich2) COLL_sep \ +COLL_APPLY(action, COLL_ALLREDUCE_SIG, mvapich2_rs) COLL_sep \ +COLL_APPLY(action, COLL_ALLREDUCE_SIG, mvapich2_two_level) COLL_sep \ +COLL_APPLY(action, COLL_ALLREDUCE_SIG, impi) COLL_sep \ +COLL_APPLY(action, COLL_ALLREDUCE_SIG, rab) COLL_sep \ +COLL_APPLY(action, COLL_ALLREDUCE_SIG, automatic) COLL_ALLREDUCES(COLL_PROTO, COLL_NOsep) @@ -118,13 +149,15 @@ COLL_ALLREDUCES(COLL_PROTO, COLL_NOsep) #define COLL_ALLTOALL_SIG alltoall, int, \ (void *send_buff, int send_count, MPI_Datatype send_type, \ void *recv_buff, int recv_count, MPI_Datatype recv_type, \ - MPI_Comm com) + MPI_Comm comm) #define COLL_ALLTOALLS(action, COLL_sep) \ COLL_APPLY(action, COLL_ALLTOALL_SIG, 2dmesh) COLL_sep \ COLL_APPLY(action, COLL_ALLTOALL_SIG, 3dmesh) COLL_sep \ -COLL_NOTHING(COLL_APPLY(action, COLL_ALLTOALL_SIG, bruck) COLL_sep) \ +COLL_APPLY(action, COLL_ALLTOALL_SIG, basic_linear) COLL_sep \ +COLL_APPLY(action, COLL_ALLTOALL_SIG, bruck) COLL_sep \ COLL_APPLY(action, 
COLL_ALLTOALL_SIG, pair) COLL_sep \ +COLL_APPLY(action, COLL_ALLTOALL_SIG, pair_rma) COLL_sep \ COLL_APPLY(action, COLL_ALLTOALL_SIG, pair_light_barrier) COLL_sep \ COLL_APPLY(action, COLL_ALLTOALL_SIG, pair_mpi_barrier) COLL_sep \ COLL_APPLY(action, COLL_ALLTOALL_SIG, pair_one_barrier) COLL_sep \ @@ -133,8 +166,12 @@ COLL_APPLY(action, COLL_ALLTOALL_SIG, ring) COLL_sep \ COLL_APPLY(action, COLL_ALLTOALL_SIG, ring_light_barrier) COLL_sep \ COLL_APPLY(action, COLL_ALLTOALL_SIG, ring_mpi_barrier) COLL_sep \ COLL_APPLY(action, COLL_ALLTOALL_SIG, ring_one_barrier) COLL_sep \ -COLL_APPLY(action, COLL_ALLTOALL_SIG, simple) COLL_sep \ -COLL_APPLY(action, COLL_ALLTOALL_SIG, ompi) +COLL_APPLY(action, COLL_ALLTOALL_SIG, mvapich2) COLL_sep \ +COLL_APPLY(action, COLL_ALLTOALL_SIG, mvapich2_scatter_dest) COLL_sep \ +COLL_APPLY(action, COLL_ALLTOALL_SIG, ompi) COLL_sep \ +COLL_APPLY(action, COLL_ALLTOALL_SIG, mpich) COLL_sep \ +COLL_APPLY(action, COLL_ALLTOALL_SIG, impi) COLL_sep \ +COLL_APPLY(action, COLL_ALLTOALL_SIG, automatic) COLL_ALLTOALLS(COLL_PROTO, COLL_NOsep) @@ -144,7 +181,7 @@ COLL_ALLTOALLS(COLL_PROTO, COLL_NOsep) #define COLL_ALLTOALLV_SIG alltoallv, int, \ (void *send_buff, int *send_counts, int *send_disps, MPI_Datatype send_type, \ void *recv_buff, int *recv_counts, int *recv_disps, MPI_Datatype recv_type, \ - MPI_Comm com) + MPI_Comm comm) #define COLL_ALLTOALLVS(action, COLL_sep) \ COLL_APPLY(action, COLL_ALLTOALLV_SIG, bruck) COLL_sep \ @@ -156,7 +193,12 @@ COLL_APPLY(action, COLL_ALLTOALLV_SIG, ring) COLL_sep \ COLL_APPLY(action, COLL_ALLTOALLV_SIG, ring_light_barrier) COLL_sep \ COLL_APPLY(action, COLL_ALLTOALLV_SIG, ring_mpi_barrier) COLL_sep \ COLL_APPLY(action, COLL_ALLTOALLV_SIG, ring_one_barrier) COLL_sep \ -COLL_APPLY(action, COLL_ALLTOALLV_SIG, ompi) +COLL_APPLY(action, COLL_ALLTOALLV_SIG, ompi) COLL_sep \ +COLL_APPLY(action, COLL_ALLTOALLV_SIG, mpich) COLL_sep \ +COLL_APPLY(action, COLL_ALLTOALLV_SIG, ompi_basic_linear) COLL_sep \ 
+COLL_APPLY(action, COLL_ALLTOALLV_SIG, mvapich2) COLL_sep \ +COLL_APPLY(action, COLL_ALLTOALLV_SIG, impi) COLL_sep \ +COLL_APPLY(action, COLL_ALLTOALLV_SIG, automatic) COLL_ALLTOALLVS(COLL_PROTO, COLL_NOsep) @@ -168,7 +210,6 @@ COLL_ALLTOALLVS(COLL_PROTO, COLL_NOsep) int root, MPI_Comm comm) #define COLL_BCASTS(action, COLL_sep) \ -COLL_APPLY(action, COLL_BCAST_SIG, arrival_nb) COLL_sep \ COLL_APPLY(action, COLL_BCAST_SIG, arrival_pattern_aware) COLL_sep \ COLL_APPLY(action, COLL_BCAST_SIG, arrival_pattern_aware_wait) COLL_sep \ COLL_APPLY(action, COLL_BCAST_SIG, arrival_scatter) COLL_sep \ @@ -185,7 +226,14 @@ COLL_APPLY(action, COLL_BCAST_SIG, SMP_binomial) COLL_sep \ COLL_APPLY(action, COLL_BCAST_SIG, SMP_linear) COLL_sep \ COLL_APPLY(action, COLL_BCAST_SIG, ompi) COLL_sep \ COLL_APPLY(action, COLL_BCAST_SIG, ompi_split_bintree) COLL_sep \ -COLL_APPLY(action, COLL_BCAST_SIG, ompi_pipeline) +COLL_APPLY(action, COLL_BCAST_SIG, ompi_pipeline) COLL_sep \ +COLL_APPLY(action, COLL_BCAST_SIG, mpich) COLL_sep \ +COLL_APPLY(action, COLL_BCAST_SIG, mvapich2) COLL_sep \ +COLL_APPLY(action, COLL_BCAST_SIG, mvapich2_inter_node) COLL_sep \ +COLL_APPLY(action, COLL_BCAST_SIG, mvapich2_intra_node) COLL_sep \ +COLL_APPLY(action, COLL_BCAST_SIG, mvapich2_knomial_intra_node) COLL_sep \ +COLL_APPLY(action, COLL_BCAST_SIG, impi) COLL_sep \ +COLL_APPLY(action, COLL_BCAST_SIG, automatic) COLL_BCASTS(COLL_PROTO, COLL_NOsep) @@ -209,8 +257,84 @@ COLL_APPLY(action, COLL_REDUCE_SIG, ompi_pipeline) COLL_sep \ COLL_APPLY(action, COLL_REDUCE_SIG, ompi_basic_linear) COLL_sep \ COLL_APPLY(action, COLL_REDUCE_SIG, ompi_in_order_binary) COLL_sep \ COLL_APPLY(action, COLL_REDUCE_SIG, ompi_binary) COLL_sep \ -COLL_APPLY(action, COLL_REDUCE_SIG, ompi_binomial) +COLL_APPLY(action, COLL_REDUCE_SIG, ompi_binomial) COLL_sep \ +COLL_APPLY(action, COLL_REDUCE_SIG, mpich) COLL_sep \ +COLL_APPLY(action, COLL_REDUCE_SIG, mvapich2) COLL_sep \ +COLL_APPLY(action, COLL_REDUCE_SIG, mvapich2_knomial) COLL_sep \ 
+COLL_APPLY(action, COLL_REDUCE_SIG, mvapich2_two_level) COLL_sep \ +COLL_APPLY(action, COLL_REDUCE_SIG, impi) COLL_sep \ +COLL_APPLY(action, COLL_REDUCE_SIG, rab) COLL_sep \ +COLL_APPLY(action, COLL_REDUCE_SIG, automatic) COLL_REDUCES(COLL_PROTO, COLL_NOsep) +/************* + * REDUCE_SCATTER * + *************/ +#define COLL_REDUCE_SCATTER_SIG reduce_scatter, int, \ + (void *sbuf, void *rbuf, int *rcounts,\ + MPI_Datatype dtype,MPI_Op op,MPI_Comm comm) + +#define COLL_REDUCE_SCATTERS(action, COLL_sep) \ +COLL_APPLY(action, COLL_REDUCE_SCATTER_SIG, ompi) COLL_sep \ +COLL_APPLY(action, COLL_REDUCE_SCATTER_SIG, ompi_basic_recursivehalving) COLL_sep \ +COLL_APPLY(action, COLL_REDUCE_SCATTER_SIG, ompi_ring) COLL_sep \ +COLL_APPLY(action, COLL_REDUCE_SCATTER_SIG, mpich) COLL_sep \ +COLL_APPLY(action, COLL_REDUCE_SCATTER_SIG, mpich_pair) COLL_sep \ +COLL_APPLY(action, COLL_REDUCE_SCATTER_SIG, mpich_rdb) COLL_sep \ +COLL_APPLY(action, COLL_REDUCE_SCATTER_SIG, mpich_noncomm) COLL_sep \ +COLL_APPLY(action, COLL_REDUCE_SCATTER_SIG, mvapich2) COLL_sep \ +COLL_APPLY(action, COLL_REDUCE_SCATTER_SIG, impi) COLL_sep \ +COLL_APPLY(action, COLL_REDUCE_SCATTER_SIG, automatic) + + + +COLL_REDUCE_SCATTERS(COLL_PROTO, COLL_NOsep) + + +/************* + * SCATTER * + *************/ +#define COLL_SCATTER_SIG scatter, int, \ + (void *sendbuf, int sendcount, MPI_Datatype sendtype,\ + void *recvbuf, int recvcount, MPI_Datatype recvtype,\ + int root, MPI_Comm comm) + +#define COLL_SCATTERS(action, COLL_sep) \ +COLL_APPLY(action, COLL_SCATTER_SIG, ompi) COLL_sep \ +COLL_APPLY(action, COLL_SCATTER_SIG, ompi_basic_linear) COLL_sep \ +COLL_APPLY(action, COLL_SCATTER_SIG, ompi_binomial) COLL_sep \ +COLL_APPLY(action, COLL_SCATTER_SIG, mpich) COLL_sep \ +COLL_APPLY(action, COLL_SCATTER_SIG, mvapich2) COLL_sep \ +COLL_APPLY(action, COLL_SCATTER_SIG, mvapich2_two_level_binomial) COLL_sep \ +COLL_APPLY(action, COLL_SCATTER_SIG, mvapich2_two_level_direct) COLL_sep \ +COLL_APPLY(action, 
COLL_SCATTER_SIG, impi) COLL_sep \ +COLL_APPLY(action, COLL_SCATTER_SIG, automatic) + +COLL_SCATTERS(COLL_PROTO, COLL_NOsep) + +/************* + * BARRIER * + *************/ +#define COLL_BARRIER_SIG barrier, int, \ + (MPI_Comm comm) + +#define COLL_BARRIERS(action, COLL_sep) \ +COLL_APPLY(action, COLL_BARRIER_SIG, ompi) COLL_sep \ +COLL_APPLY(action, COLL_BARRIER_SIG, ompi_basic_linear) COLL_sep \ +COLL_APPLY(action, COLL_BARRIER_SIG, ompi_two_procs) COLL_sep \ +COLL_APPLY(action, COLL_BARRIER_SIG, ompi_tree) COLL_sep \ +COLL_APPLY(action, COLL_BARRIER_SIG, ompi_bruck) COLL_sep \ +COLL_APPLY(action, COLL_BARRIER_SIG, ompi_recursivedoubling) COLL_sep \ +COLL_APPLY(action, COLL_BARRIER_SIG, ompi_doublering) COLL_sep \ +COLL_APPLY(action, COLL_BARRIER_SIG, mpich) COLL_sep \ +COLL_APPLY(action, COLL_BARRIER_SIG, mvapich2_pair) COLL_sep \ +COLL_APPLY(action, COLL_BARRIER_SIG, mvapich2) COLL_sep \ +COLL_APPLY(action, COLL_BARRIER_SIG, impi) COLL_sep \ +COLL_APPLY(action, COLL_BARRIER_SIG, automatic) + +COLL_BARRIERS(COLL_PROTO, COLL_NOsep) + +SG_END_DECL() + #endif