X-Git-Url: http://info.iut-bm.univ-fcomte.fr/pub/gitweb/simgrid.git/blobdiff_plain/e7ca102c2884a457fb10de086fbaf074506c02e1..6dc20ece02e7caea02aff55e3e3582b42c4cb4cf:/src/smpi/colls/smpi_mvapich2_selector_stampede.h diff --git a/src/smpi/colls/smpi_mvapich2_selector_stampede.h b/src/smpi/colls/smpi_mvapich2_selector_stampede.h index 07614eaa05..28baf73f26 100644 --- a/src/smpi/colls/smpi_mvapich2_selector_stampede.h +++ b/src/smpi/colls/smpi_mvapich2_selector_stampede.h @@ -10,6 +10,8 @@ /************ Alltoall variables and initializers */ #define MV2_MAX_NB_THRESHOLDS 32 + + typedef struct { int min; int max; @@ -47,6 +49,8 @@ static void init_mv2_alltoall_tables_stampede(){ int agg_table_sum = 0; mv2_alltoall_tuning_table **table_ptrs = NULL; mv2_alltoall_num_ppn_conf = 3; + if(smpi_coll_cleanup_callback==NULL) + smpi_coll_cleanup_callback=&smpi_coll_cleanup_mvapich2; mv2_alltoall_thresholds_table = xbt_malloc(sizeof(mv2_alltoall_tuning_table *) * mv2_alltoall_num_ppn_conf); table_ptrs = xbt_malloc(sizeof(mv2_alltoall_tuning_table *) @@ -591,6 +595,8 @@ MV2_Gather_function_ptr MV2_Gather_intra_node_function = NULL; static void init_mv2_gather_tables_stampede(){ + if(smpi_coll_cleanup_callback==NULL) + smpi_coll_cleanup_callback=&smpi_coll_cleanup_mvapich2; mv2_size_gather_tuning_table=7; mv2_gather_thresholds_table = xbt_malloc(mv2_size_gather_tuning_table* sizeof (mv2_gather_tuning_table)); @@ -676,6 +682,8 @@ mv2_allgatherv_tuning_table *mv2_allgatherv_thresholds_table = NULL; static void init_mv2_allgatherv_tables_stampede(){ + if(smpi_coll_cleanup_callback==NULL) + smpi_coll_cleanup_callback=&smpi_coll_cleanup_mvapich2; mv2_size_allgatherv_tuning_table = 6; mv2_allgatherv_thresholds_table = xbt_malloc(mv2_size_allgatherv_tuning_table * sizeof (mv2_allgatherv_tuning_table)); @@ -822,6 +830,8 @@ static int MPIR_Allreduce_reduce_shmem_MV2( void *sendbuf, static void init_mv2_allreduce_tables_stampede(){ + if(smpi_coll_cleanup_callback==NULL) + smpi_coll_cleanup_callback=&smpi_coll_cleanup_mvapich2; mv2_size_allreduce_tuning_table = 8; mv2_allreduce_thresholds_table = xbt_malloc(mv2_size_allreduce_tuning_table * sizeof (mv2_allreduce_tuning_table)); @@ -963,8 +973,8 @@ static void init_mv2_allreduce_tables_stampede(){ } -/* -Bcast deactivated for now, defaults to mpich one + + typedef struct { int min; int max; @@ -995,16 +1005,36 @@ int (*MV2_Bcast_function) (void *buffer, int count, MPI_Datatype datatype, int (*MV2_Bcast_intra_node_function) (void *buffer, int count, MPI_Datatype datatype, int root, MPI_Comm comm_ptr) = NULL; +int zcpy_knomial_factor = 2; +int mv2_pipelined_zcpy_knomial_factor = -1; +int bcast_segment_size = 8192; +int mv2_inter_node_knomial_factor = 4; +int mv2_intra_node_knomial_factor = 4; +#define mv2_bcast_two_level_system_size 64 +#define mv2_bcast_short_msg 16384 +#define mv2_bcast_large_msg 512*1024 + +#define INTRA_NODE_ROOT 0 + +#define MPIR_Pipelined_Bcast_Zcpy_MV2 smpi_coll_tuned_bcast_mpich +#define MPIR_Pipelined_Bcast_MV2 smpi_coll_tuned_bcast_mpich +#define MPIR_Bcast_binomial_MV2 smpi_coll_tuned_bcast_binomial_tree +#define MPIR_Bcast_scatter_ring_allgather_shm_MV2 smpi_coll_tuned_bcast_scatter_LR_allgather +#define MPIR_Bcast_scatter_doubling_allgather_MV2 smpi_coll_tuned_bcast_scatter_rdb_allgather +#define MPIR_Bcast_scatter_ring_allgather_MV2 smpi_coll_tuned_bcast_scatter_LR_allgather +#define MPIR_Shmem_Bcast_MV2 smpi_coll_tuned_bcast_mpich +#define MPIR_Bcast_tune_inter_node_helper_MV2 smpi_coll_tuned_bcast_mvapich2_inter_node +#define MPIR_Bcast_inter_node_helper_MV2 smpi_coll_tuned_bcast_mvapich2_inter_node +#define MPIR_Knomial_Bcast_intra_node_MV2 smpi_coll_tuned_bcast_mvapich2_knomial_intra_node +#define MPIR_Bcast_intra_MV2 smpi_coll_tuned_bcast_mvapich2_intra_node - */ - - -/* static void init_mv2_bcast_tables_stampede(){ //Stampede, - mv2_size_bcast_tuning_table=8; - mv2_bcast_thresholds_table = xbt_malloc(mv2_size_bcast_tuning_table * - sizeof (mv2_bcast_tuning_table)); + if(smpi_coll_cleanup_callback==NULL) + smpi_coll_cleanup_callback=&smpi_coll_cleanup_mvapich2; + mv2_size_bcast_tuning_table=8; + mv2_bcast_thresholds_table = xbt_malloc(mv2_size_bcast_tuning_table * + sizeof (mv2_bcast_tuning_table)); mv2_bcast_tuning_table mv2_tmp_bcast_thresholds_table[]={ { @@ -1207,7 +1237,7 @@ static void init_mv2_bcast_tables_stampede(){ memcpy(mv2_bcast_thresholds_table, mv2_tmp_bcast_thresholds_table, mv2_size_bcast_tuning_table * sizeof (mv2_bcast_tuning_table)); -}*/ +} /************ Reduce variables and initializers */ @@ -1239,8 +1269,8 @@ int mv2_size_reduce_tuning_table = 0; mv2_reduce_tuning_table *mv2_reduce_thresholds_table = NULL; -int mv2_reduce_intra_knomial_factor = 2; -int mv2_reduce_inter_knomial_factor = 2; +int mv2_reduce_intra_knomial_factor = -1; +int mv2_reduce_inter_knomial_factor = -1; int (*MV2_Reduce_function)( void *sendbuf, void *recvbuf, @@ -1264,10 +1294,12 @@ int (*MV2_Reduce_intra_function)( void *sendbuf, #define MPIR_Reduce_binomial_MV2 smpi_coll_tuned_reduce_binomial #define MPIR_Reduce_redscat_gather_MV2 smpi_coll_tuned_reduce_scatter_gather #define MPIR_Reduce_shmem_MV2 smpi_coll_tuned_reduce_ompi_basic_linear - +#define MPIR_Reduce_two_level_helper_MV2 smpi_coll_tuned_reduce_mvapich2_two_level static void init_mv2_reduce_tables_stampede(){ + if(smpi_coll_cleanup_callback==NULL) + smpi_coll_cleanup_callback=&smpi_coll_cleanup_mvapich2; /*Stampede*/ mv2_size_reduce_tuning_table = 8; mv2_reduce_thresholds_table = xbt_malloc(mv2_size_reduce_tuning_table * @@ -1510,6 +1542,8 @@ static int MPIR_Reduce_Scatter_Basic_MV2(void *sendbuf, static void init_mv2_reduce_scatter_tables_stampede(){ + if(smpi_coll_cleanup_callback==NULL) + smpi_coll_cleanup_callback=&smpi_coll_cleanup_mvapich2; mv2_size_red_scat_tuning_table = 6; mv2_red_scat_thresholds_table = xbt_malloc(mv2_size_red_scat_tuning_table * sizeof (mv2_red_scat_tuning_table)); @@ -1627,14 +1661,16 @@ int MPIR_Scatter_mcst_wrap_MV2(void *sendbuf, #define MPIR_Scatter_MV2_Binomial smpi_coll_tuned_scatter_ompi_binomial #define MPIR_Scatter_MV2_Direct smpi_coll_tuned_scatter_ompi_basic_linear -#define MPIR_Scatter_MV2_two_level_Binomial smpi_coll_tuned_scatter_ompi_binomial -#define MPIR_Scatter_MV2_two_level_Direct smpi_coll_tuned_scatter_ompi_basic_linear +#define MPIR_Scatter_MV2_two_level_Binomial smpi_coll_tuned_scatter_mvapich2_two_level_binomial +#define MPIR_Scatter_MV2_two_level_Direct smpi_coll_tuned_scatter_mvapich2_two_level_direct static void init_mv2_scatter_tables_stampede(){ - { + if(smpi_coll_cleanup_callback==NULL) + smpi_coll_cleanup_callback=&smpi_coll_cleanup_mvapich2; + int agg_table_sum = 0; int i; mv2_scatter_tuning_table **table_ptrs = NULL; @@ -1941,6 +1977,6 @@ static void init_mv2_scatter_tables_stampede(){ * mv2_size_scatter_tuning_table[i])); } xbt_free(table_ptrs); - } + }