int agg_table_sum = 0;
mv2_alltoall_tuning_table **table_ptrs = NULL;
mv2_alltoall_num_ppn_conf = 3;
+ if(smpi_coll_cleanup_callback==NULL)
+ smpi_coll_cleanup_callback=&smpi_coll_cleanup_mvapich2;
mv2_alltoall_thresholds_table = xbt_malloc(sizeof(mv2_alltoall_tuning_table *)
* mv2_alltoall_num_ppn_conf);
table_ptrs = xbt_malloc(sizeof(mv2_alltoall_tuning_table *)
static void init_mv2_allgather_tables_stampede(){
int i;
int agg_table_sum = 0;
+
+ if(smpi_coll_cleanup_callback==NULL)
+ smpi_coll_cleanup_callback=&smpi_coll_cleanup_mvapich2;
mv2_allgather_tuning_table **table_ptrs = NULL;
mv2_allgather_num_ppn_conf = 3;
mv2_allgather_thresholds_table
static void init_mv2_gather_tables_stampede(){
+ if(smpi_coll_cleanup_callback==NULL)
+ smpi_coll_cleanup_callback=&smpi_coll_cleanup_mvapich2;
mv2_size_gather_tuning_table=7;
mv2_gather_thresholds_table = xbt_malloc(mv2_size_gather_tuning_table*
sizeof (mv2_gather_tuning_table));
static void init_mv2_allgatherv_tables_stampede(){
+ if(smpi_coll_cleanup_callback==NULL)
+ smpi_coll_cleanup_callback=&smpi_coll_cleanup_mvapich2;
mv2_size_allgatherv_tuning_table = 6;
mv2_allgatherv_thresholds_table = xbt_malloc(mv2_size_allgatherv_tuning_table *
sizeof (mv2_allgatherv_tuning_table));
static void init_mv2_allreduce_tables_stampede(){
+ if(smpi_coll_cleanup_callback==NULL)
+ smpi_coll_cleanup_callback=&smpi_coll_cleanup_mvapich2;
mv2_size_allreduce_tuning_table = 8;
mv2_allreduce_thresholds_table = xbt_malloc(mv2_size_allreduce_tuning_table *
sizeof (mv2_allreduce_tuning_table));
int bcast_segment_size = 8192;
int mv2_inter_node_knomial_factor = 4;
int mv2_intra_node_knomial_factor = 4;
+#define mv2_bcast_two_level_system_size 64
+#define mv2_bcast_short_msg 16384
+#define mv2_bcast_large_msg (512*1024) /* parenthesized so the product stays one operand inside /, %, or other expressions */
+
#define INTRA_NODE_ROOT 0
#define MPIR_Pipelined_Bcast_Zcpy_MV2 smpi_coll_tuned_bcast_mpich
#define MPIR_Pipelined_Bcast_MV2 smpi_coll_tuned_bcast_mpich
-#define MPIR_Bcast_binomial_MV2 smpi_coll_tuned_bcast_mpich
-#define MPIR_Bcast_scatter_ring_allgather_shm_MV2 smpi_coll_tuned_bcast_mpich
-#define MPIR_Bcast_scatter_doubling_allgather_MV2 smpi_coll_tuned_bcast_mpich
-#define MPIR_Bcast_scatter_ring_allgather_MV2 smpi_coll_tuned_bcast_mpich
+#define MPIR_Bcast_binomial_MV2 smpi_coll_tuned_bcast_binomial_tree
+#define MPIR_Bcast_scatter_ring_allgather_shm_MV2 smpi_coll_tuned_bcast_scatter_LR_allgather
+#define MPIR_Bcast_scatter_doubling_allgather_MV2 smpi_coll_tuned_bcast_scatter_rdb_allgather
+#define MPIR_Bcast_scatter_ring_allgather_MV2 smpi_coll_tuned_bcast_scatter_LR_allgather
#define MPIR_Shmem_Bcast_MV2 smpi_coll_tuned_bcast_mpich
-#define MPIR_Bcast_tune_inter_node_helper_MV2 smpi_coll_tuned_bcast_mpich
-#define MPIR_Knomial_Bcast_intra_node_MV2 smpi_coll_tuned_bcast_mpich
-#define MPIR_Bcast_intra_MV2 smpi_coll_tuned_bcast_mpich
+#define MPIR_Bcast_tune_inter_node_helper_MV2 smpi_coll_tuned_bcast_mvapich2_inter_node
+#define MPIR_Bcast_inter_node_helper_MV2 smpi_coll_tuned_bcast_mvapich2_inter_node
+#define MPIR_Knomial_Bcast_intra_node_MV2 smpi_coll_tuned_bcast_mvapich2_knomial_intra_node
+#define MPIR_Bcast_intra_MV2 smpi_coll_tuned_bcast_mvapich2_intra_node
static void init_mv2_bcast_tables_stampede(){
//Stampede,
- mv2_size_bcast_tuning_table=8;
- mv2_bcast_thresholds_table = xbt_malloc(mv2_size_bcast_tuning_table *
- sizeof (mv2_bcast_tuning_table));
+ if(smpi_coll_cleanup_callback==NULL)
+ smpi_coll_cleanup_callback=&smpi_coll_cleanup_mvapich2;
+ mv2_size_bcast_tuning_table=8;
+ mv2_bcast_thresholds_table = xbt_malloc(mv2_size_bcast_tuning_table *
+ sizeof (mv2_bcast_tuning_table));
mv2_bcast_tuning_table mv2_tmp_bcast_thresholds_table[]={
{
mv2_reduce_tuning_table *mv2_reduce_thresholds_table = NULL;
-int mv2_reduce_intra_knomial_factor = 2;
-int mv2_reduce_inter_knomial_factor = 2;
+int mv2_reduce_intra_knomial_factor = -1;
+int mv2_reduce_inter_knomial_factor = -1;
int (*MV2_Reduce_function)( void *sendbuf,
void *recvbuf,
static void init_mv2_reduce_tables_stampede(){
+ if(smpi_coll_cleanup_callback==NULL)
+ smpi_coll_cleanup_callback=&smpi_coll_cleanup_mvapich2;
/*Stampede*/
mv2_size_reduce_tuning_table = 8;
mv2_reduce_thresholds_table = xbt_malloc(mv2_size_reduce_tuning_table *
static void init_mv2_reduce_scatter_tables_stampede(){
+ if(smpi_coll_cleanup_callback==NULL)
+ smpi_coll_cleanup_callback=&smpi_coll_cleanup_mvapich2;
mv2_size_red_scat_tuning_table = 6;
mv2_red_scat_thresholds_table = xbt_malloc(mv2_size_red_scat_tuning_table *
sizeof (mv2_red_scat_tuning_table));
static void init_mv2_scatter_tables_stampede(){
- {
+ if(smpi_coll_cleanup_callback==NULL)
+ smpi_coll_cleanup_callback=&smpi_coll_cleanup_mvapich2;
+
int agg_table_sum = 0;
int i;
mv2_scatter_tuning_table **table_ptrs = NULL;
* mv2_size_scatter_tuning_table[i]));
}
xbt_free(table_ptrs);
- }
+
}