X-Git-Url: http://info.iut-bm.univ-fcomte.fr/pub/gitweb/simgrid.git/blobdiff_plain/d53d00d608a60a6f05e77ea7b7cd5c4e544d7ab1..96cedde3cdbc0b8ffc3f096a1b65d021b0226f99:/src/smpi/colls/coll_tuned_topo.cpp diff --git a/src/smpi/colls/coll_tuned_topo.cpp b/src/smpi/colls/coll_tuned_topo.cpp index a5c53b10f2..c9527705db 100644 --- a/src/smpi/colls/coll_tuned_topo.cpp +++ b/src/smpi/colls/coll_tuned_topo.cpp @@ -1,4 +1,4 @@ -/* Copyright (c) 2013-2014. The SimGrid Team. +/* Copyright (c) 2013-2019. The SimGrid Team. * All rights reserved. */ /* This program is free software; you can redistribute it and/or modify it @@ -11,16 +11,16 @@ * Copyright (c) 2004-2005 The University of Tennessee and The University * of Tennessee Research Foundation. All rights * reserved. - * Copyright (c) 2004-2005 High Performance Computing Center Stuttgart, + * Copyright (c) 2004-2005 High Performance Computing Center Stuttgart, * University of Stuttgart. All rights reserved. * Copyright (c) 2004-2005 The Regents of the University of California. * All rights reserved. - * + * * Additional copyrights may follow */ -#include "colls_private.h" -#include "coll_tuned_topo.h" +#include "coll_tuned_topo.hpp" +#include "colls_private.hpp" /* * Some static helpers. */ @@ -52,7 +52,10 @@ static int calculate_num_nodes_up_to_level( int fanout, int level ) { /* just use geometric progression formula for sum: a^0+a^1+...a^(n-1) = (a^n-1)/(a-1) */ - return ((pown(fanout,level) - 1)/(fanout - 1)); + if (fanout > 1) + return ((pown(fanout, level) - 1) / (fanout - 1)); + else + return 0; // is this right ? } /* @@ -76,7 +79,7 @@ ompi_coll_tuned_topo_build_tree( int fanout, int schild, sparent; int level; /* location of my rank in the tree structure of size */ int delta; /* number of nodes on my level */ - int slimit; /* total number of nodes on levels above me */ + int slimit; /* total number of nodes on levels above me */ int shiftedrank; int i; ompi_coll_tree_t* tree; @@ -92,16 +95,16 @@ ompi_coll_tuned_topo_build_tree( int fanout, return NULL; } - /* - * Get size and rank of the process in this communicator + /* + * Get size and rank of the process in this communicator */ - size = smpi_comm_size(comm); - rank = smpi_comm_rank(comm); + size = comm->size(); + rank = comm->rank(); - tree = (ompi_coll_tree_t*)malloc(sizeof(ompi_coll_tree_t)); - if (!tree) { - XBT_DEBUG("coll:tuned:topo_build_tree PANIC::out of memory"); - return NULL; + tree = new ompi_coll_tree_t; + if (not tree) { + XBT_DEBUG("coll:tuned:topo_build_tree PANIC::out of memory"); + return NULL; } tree->tree_root = MPI_UNDEFINED; @@ -111,8 +114,8 @@ ompi_coll_tuned_topo_build_tree( int fanout, * Set root */ tree->tree_root = root; - - /* + + /* * Initialize tree */ tree->tree_fanout = fanout; @@ -128,11 +131,11 @@ ompi_coll_tuned_topo_build_tree( int fanout, if( size < 2 ) { return tree; } - + /* - * Shift all ranks by root, so that the algorithm can be + * Shift all ranks by root, so that the algorithm can be * designed as if root would be always 0 - * shiftedrank should be used in calculating distances + * shiftedrank should be used in calculating distances * and position in tree */ shiftedrank = rank - root; @@ -154,7 +157,7 @@ ompi_coll_tuned_topo_build_tree( int fanout, break; } } - + /* find my parent */ slimit = calculate_num_nodes_up_to_level( fanout, level ); sparent = shiftedrank; @@ -166,12 +169,12 @@ ompi_coll_tuned_topo_build_tree( int fanout, } } tree->tree_prev = (sparent+root)%size; - + return tree; } /* - * Constructs in-order binary tree which can be used for non-commutative reduce + * Constructs in-order binary tree which can be used for non-commutative reduce * operations. * Root of this tree is always rank (size-1) and fanout is 2. * Here are some of the examples of this tree: @@ -192,23 +195,22 @@ ompi_coll_tuned_topo_build_in_order_bintree( MPI_Comm comm ) int parent, lchild, rchild; ompi_coll_tree_t* tree; - /* - * Get size and rank of the process in this communicator + /* + * Get size and rank of the process in this communicator */ - size = smpi_comm_size(comm); - rank = smpi_comm_rank(comm); + size = comm->size(); + rank = comm->rank(); - tree = (ompi_coll_tree_t*)malloc(sizeof(ompi_coll_tree_t)); - if (!tree) { - XBT_DEBUG( - "coll:tuned:topo_build_tree PANIC::out of memory"); - return NULL; + tree = new ompi_coll_tree_t; + if (not tree) { + XBT_DEBUG("coll:tuned:topo_build_tree PANIC::out of memory"); + return NULL; } tree->tree_root = MPI_UNDEFINED; tree->tree_nextsize = MPI_UNDEFINED; - /* + /* * Initialize tree */ tree->tree_fanout = 2; @@ -219,10 +221,10 @@ ompi_coll_tuned_topo_build_in_order_bintree( MPI_Comm comm ) tree->tree_next[0] = -1; tree->tree_next[1] = -1; XBT_DEBUG( - "coll:tuned:topo_build_in_order_tree Building fo %d rt %d", + "coll:tuned:topo_build_in_order_tree Building fo %d rt %d", tree->tree_fanout, tree->tree_root); - /* + /* * Build the tree */ myrank = rank; @@ -238,18 +240,18 @@ ompi_coll_tuned_topo_build_in_order_bintree( MPI_Comm comm ) rchild = -1; if (size - 1 > 0) { lchild = parent - 1; - if (lchild > 0) { + if (lchild > 0) { rchild = rightsize - 1; } } - - /* The following cases are possible: myrank can be + + /* The following cases are possible: myrank can be - a parent, - belong to the left subtree, or - belong to the right subtee Each of the cases need to be handled differently. */ - + if (myrank == parent) { /* I am the parent: - compute real ranks of my children, and exit the loop. */ @@ -260,7 +262,7 @@ ompi_coll_tuned_topo_build_in_order_bintree( MPI_Comm comm ) if (myrank > rchild) { /* I belong to the left subtree: - If I am the left child, compute real rank of my parent - - Iterate down through tree: + - Iterate down through tree: compute new size, shift ranks down, and update delta. */ if (myrank == lchild) { @@ -274,8 +276,8 @@ ompi_coll_tuned_topo_build_in_order_bintree( MPI_Comm comm ) } else { /* I belong to the right subtree: - If I am the right child, compute real rank of my parent - - Iterate down through tree: - compute new size and parent, + - Iterate down through tree: + compute new size and parent, but the delta and rank do not need to change. */ if (myrank == rchild) { @@ -285,7 +287,7 @@ ompi_coll_tuned_topo_build_in_order_bintree( MPI_Comm comm ) parent = rchild; } } - + if (tree->tree_next[0] >= 0) { tree->tree_nextsize = 1; } if (tree->tree_next[1] >= 0) { tree->tree_nextsize += 1; } @@ -296,20 +298,20 @@ int ompi_coll_tuned_topo_destroy_tree( ompi_coll_tree_t** tree ) { ompi_coll_tree_t *ptr; - if ((!tree)||(!*tree)) { - return MPI_SUCCESS; + if ((tree == nullptr) || (*tree == nullptr)) { + return MPI_SUCCESS; } ptr = *tree; - free (ptr); + delete ptr; *tree = NULL; /* mark tree as gone */ return MPI_SUCCESS; } /* - * + * * Here are some of the examples of this tree: * size == 2 size = 4 size = 8 * 0 0 0 @@ -335,18 +337,18 @@ ompi_coll_tuned_topo_build_bmtree( MPI_Comm comm, XBT_DEBUG("coll:tuned:topo:build_bmtree rt %d", root); - /* - * Get size and rank of the process in this communicator + /* + * Get size and rank of the process in this communicator */ - size = smpi_comm_size(comm); - rank = smpi_comm_rank(comm); + size = comm->size(); + rank = comm->rank(); index = rank -root; - bmtree = (ompi_coll_tree_t*)malloc(sizeof(ompi_coll_tree_t)); - if (!bmtree) { - XBT_DEBUG("coll:tuned:topo:build_bmtree PANIC out of memory"); - return NULL; + bmtree = new ompi_coll_tree_t; + if (not bmtree) { + XBT_DEBUG("coll:tuned:topo:build_bmtree PANIC out of memory"); + return NULL; } bmtree->tree_bmtree = 1; @@ -391,7 +393,7 @@ ompi_coll_tuned_topo_build_bmtree( MPI_Comm comm, /* * Constructs in-order binomial tree which can be used for gather/scatter * operations. - * + * * Here are some of the examples of this tree: * size == 2 size = 4 size = 8 * 0 0 0 @@ -402,9 +404,7 @@ ompi_coll_tuned_topo_build_bmtree( MPI_Comm comm, * | * 7 */ -ompi_coll_tree_t* -ompi_coll_tuned_topo_build_in_order_bmtree( MPI_Comm comm, - int root ) +ompi_coll_tree_t* ompi_coll_tuned_topo_build_in_order_bmtree(MPI_Comm comm, int root) { int childs = 0; int rank, vrank; @@ -416,18 +416,18 @@ ompi_coll_tuned_topo_build_in_order_bmtree( MPI_Comm comm, XBT_DEBUG("coll:tuned:topo:build_in_order_bmtree rt %d", root); - /* - * Get size and rank of the process in this communicator + /* + * Get size and rank of the process in this communicator */ - size = smpi_comm_size(comm); - rank = smpi_comm_rank(comm); + size = comm->size(); + rank = comm->rank(); vrank = (rank - root + size) % size; - bmtree = (ompi_coll_tree_t*)xbt_malloc(sizeof(ompi_coll_tree_t)); - if (!bmtree) { - XBT_DEBUG("coll:tuned:topo:build_bmtree PANIC out of memory"); - return NULL; + bmtree = new ompi_coll_tree_t; + if (not bmtree) { + XBT_DEBUG("coll:tuned:topo:build_bmtree PANIC out of memory"); + return NULL; } bmtree->tree_bmtree = 1; @@ -438,25 +438,23 @@ ompi_coll_tuned_topo_build_in_order_bmtree( MPI_Comm comm, } if (root == rank) { - bmtree->tree_prev = root; + bmtree->tree_prev = root; } while (mask < size) { - remote = vrank ^ mask; - if (remote < vrank) { - bmtree->tree_prev = (remote + root) % size; - break; - } else if (remote < size) { - bmtree->tree_next[childs] = (remote + root) % size; - childs++; - if (childs==MAXTREEFANOUT) { - XBT_DEBUG( - "coll:tuned:topo:build_bmtree max fanout incorrect %d needed %d", - MAXTREEFANOUT, childs); - return NULL; - } - } - mask <<= 1; + remote = vrank ^ mask; + if (remote < vrank) { + bmtree->tree_prev = (remote + root) % size; + break; + } else if (remote < size) { + bmtree->tree_next[childs] = (remote + root) % size; + childs++; + if (childs == MAXTREEFANOUT) { + XBT_DEBUG("coll:tuned:topo:build_bmtree max fanout incorrect %d needed %d", MAXTREEFANOUT, childs); + return NULL; + } + } + mask <<= 1; } bmtree->tree_nextsize = childs; bmtree->tree_root = root; @@ -478,11 +476,11 @@ ompi_coll_tuned_topo_build_chain( int fanout, XBT_DEBUG("coll:tuned:topo:build_chain fo %d rt %d", fanout, root); - /* - * Get size and rank of the process in this communicator + /* + * Get size and rank of the process in this communicator */ - size = smpi_comm_size(comm); - rank = smpi_comm_rank(comm); + size = comm->size(); + rank = comm->rank(); if( fanout < 1 ) { XBT_DEBUG("coll:tuned:topo:build_chain WARNING invalid fanout of ZERO, forcing to 1 (pipeline)!"); @@ -494,29 +492,29 @@ ompi_coll_tuned_topo_build_chain( int fanout, } /* - * Allocate space for topology arrays if needed + * Allocate space for topology arrays if needed */ - chain = (ompi_coll_tree_t*)malloc( sizeof(ompi_coll_tree_t) ); - if (!chain) { - XBT_DEBUG("coll:tuned:topo:build_chain PANIC out of memory"); - fflush(stdout); - return NULL; + chain = new ompi_coll_tree_t; + if (not chain) { + XBT_DEBUG("coll:tuned:topo:build_chain PANIC out of memory"); + fflush(stdout); + return NULL; } chain->tree_root = MPI_UNDEFINED; chain->tree_nextsize = -1; for(i=0;itree_next[i] = -1; - /* + /* * Set root & numchain */ chain->tree_root = root; - if( (size - 1) < fanout ) { + if( (size - 1) < fanout ) { chain->tree_nextsize = size-1; fanout = size-1; } else { chain->tree_nextsize = fanout; } - + /* * Shift ranks */ @@ -587,13 +585,13 @@ ompi_coll_tuned_topo_build_chain( int fanout, chain->tree_nextsize = 1; } else { chain->tree_next[0] = -1; - chain->tree_nextsize = 0; + chain->tree_nextsize = 0; } } } - + /* - * Unshift values + * Unshift values */ if( rank == root ) { chain->tree_prev = -1;