X-Git-Url: http://info.iut-bm.univ-fcomte.fr/pub/gitweb/simgrid.git/blobdiff_plain/482cc3463d7b94d6c39816c23f0d1e972a289728..954676b700e711f38ec4d286d33d5427d3f4ca46:/src/smpi/colls/alltoall-bruck.c diff --git a/src/smpi/colls/alltoall-bruck.c b/src/smpi/colls/alltoall-bruck.c index 5745f2f19c..99a93b5cfa 100644 --- a/src/smpi/colls/alltoall-bruck.c +++ b/src/smpi/colls/alltoall-bruck.c @@ -1,3 +1,9 @@ +/* Copyright (c) 2013-2014. The SimGrid Team. + * All rights reserved. */ + +/* This program is free software; you can redistribute it and/or modify it + * under the terms of the license (GNU LGPL) which comes with this package. */ + /***************************************************************************** * Function: alltoall_bruck @@ -19,113 +25,91 @@ ****************************************************************************/ int -smpi_coll_tuned_alltoall_bruck(void * send_buff, int send_count, MPI_Datatype send_type, - void * recv_buff, int recv_count, MPI_Datatype recv_type, - MPI_Comm comm) +smpi_coll_tuned_alltoall_bruck(void *send_buff, int send_count, + MPI_Datatype send_type, void *recv_buff, + int recv_count, MPI_Datatype recv_type, + MPI_Comm comm) { MPI_Status status; MPI_Aint extent; MPI_Datatype new_type; - - int * blocks_length, * disps; + + int *blocks_length, *disps; int i, src, dst, rank, num_procs, count, remainder, block, position; - int pack_size, tag = 1, pof2 = 1, success = 1, failure = 0; - - - char * tmp_buff; - char * send_ptr = (char *) send_buff; - char * recv_ptr = (char *) recv_buff; - - MPI_Comm_size(comm, &num_procs); - MPI_Comm_rank(comm, &rank); - - MPI_Type_extent(recv_type, &extent); - - tmp_buff = (char *) malloc (num_procs * recv_count * extent); - if (!tmp_buff) - { - printf("alltoall-bruck:53: cannot allocate memory\n"); - MPI_Finalize(); - exit(failure); - } - - disps = (int *) malloc(sizeof(int) * num_procs); - if (!disps) - { - printf("alltoall-bruck:61: cannot allocate memory\n"); - MPI_Finalize(); - exit(failure); - } - - blocks_length = (int *) malloc(sizeof(int) * num_procs); - if (!blocks_length) - { - printf("alltoall-bruck:69: cannot allocate memory\n"); - MPI_Finalize(); - exit(failure); - } - - - MPI_Sendrecv(send_ptr + rank * send_count * extent, - (num_procs - rank) * send_count, send_type, rank, tag, - recv_ptr, (num_procs - rank) * recv_count, recv_type, rank, - tag, comm, &status); - - MPI_Sendrecv(send_ptr, rank * send_count, send_type, rank, tag, - recv_ptr + (num_procs - rank) * recv_count * extent, - rank * recv_count, recv_type, rank, tag, comm, &status); - - - - MPI_Pack_size(send_count * num_procs, send_type, comm, &pack_size); - - while (pof2 < num_procs) - { - dst = (rank + pof2) % num_procs; - src = (rank - pof2 + num_procs) % num_procs; - - - count = 0; - for (block = 1; block < num_procs; block++) - if (block & pof2) - { - blocks_length[count] = send_count; - disps[count] = block * send_count; - count++; - } - - MPI_Type_indexed(count, blocks_length, disps, recv_type, &new_type); - MPI_Type_commit(&new_type); - - position = 0; - MPI_Pack(recv_buff, 1, new_type, tmp_buff, pack_size, &position, comm); - - MPI_Sendrecv(tmp_buff, position, MPI_PACKED, dst, tag, recv_buff, 1, - new_type, src, tag, comm, &status); - MPI_Type_free(&new_type); - - pof2 *= 2; - } + int pack_size, tag = COLL_TAG_ALLTOALL, pof2 = 1; + + + char *tmp_buff; + char *send_ptr = (char *) send_buff; + char *recv_ptr = (char *) recv_buff; + + num_procs = smpi_comm_size(comm); + rank = smpi_comm_rank(comm); + + extent = smpi_datatype_get_extent(recv_type); + + tmp_buff = (char *) smpi_get_tmp_sendbuffer(num_procs * recv_count * extent); + disps = (int *) xbt_malloc(sizeof(int) * num_procs); + blocks_length = (int *) xbt_malloc(sizeof(int) * num_procs); + + smpi_mpi_sendrecv(send_ptr + rank * send_count * extent, + (num_procs - rank) * send_count, send_type, rank, tag, + recv_ptr, (num_procs - rank) * recv_count, recv_type, rank, + tag, comm, &status); + + smpi_mpi_sendrecv(send_ptr, rank * send_count, send_type, rank, tag, + recv_ptr + (num_procs - rank) * recv_count * extent, + rank * recv_count, recv_type, rank, tag, comm, &status); + + + + MPI_Pack_size(send_count * num_procs, send_type, comm, &pack_size); + + while (pof2 < num_procs) { + dst = (rank + pof2) % num_procs; + src = (rank - pof2 + num_procs) % num_procs; + + + count = 0; + for (block = 1; block < num_procs; block++) + if (block & pof2) { + blocks_length[count] = send_count; + disps[count] = block * send_count; + count++; + } + + MPI_Type_indexed(count, blocks_length, disps, recv_type, &new_type); + smpi_datatype_commit(&new_type); + + position = 0; + MPI_Pack(recv_buff, 1, new_type, tmp_buff, pack_size, &position, comm); + + smpi_mpi_sendrecv(tmp_buff, position, MPI_PACKED, dst, tag, recv_buff, 1, + new_type, src, tag, comm, &status); + smpi_datatype_free(&new_type); + + pof2 *= 2; + } free(disps); free(blocks_length); - - MPI_Sendrecv(recv_ptr + (rank + 1) * recv_count * extent, - (num_procs - rank - 1) * recv_count, send_type, - rank, tag, tmp_buff, (num_procs - rank - 1) * recv_count, - recv_type, rank, tag, comm, &status); - - MPI_Sendrecv(recv_ptr, (rank + 1) * recv_count, send_type, rank, tag, - tmp_buff + (num_procs - rank - 1) * recv_count * extent, - (rank + 1) * recv_count, recv_type, rank, tag, comm, &status); - - - for (i = 0; i < num_procs; i++) - MPI_Sendrecv(tmp_buff + i * recv_count * extent, recv_count, send_type, - rank, tag, - recv_ptr + (num_procs - i - 1) * recv_count * extent, - recv_count, recv_type, rank, tag, comm, &status); - - free(tmp_buff); - return success; + + smpi_mpi_sendrecv(recv_ptr + (rank + 1) * recv_count * extent, + (num_procs - rank - 1) * recv_count, send_type, + rank, tag, tmp_buff, (num_procs - rank - 1) * recv_count, + recv_type, rank, tag, comm, &status); + + smpi_mpi_sendrecv(recv_ptr, (rank + 1) * recv_count, send_type, rank, tag, + tmp_buff + (num_procs - rank - 1) * recv_count * extent, + (rank + 1) * recv_count, recv_type, rank, tag, comm, &status); + + + for (i = 0; i < num_procs; i++) + smpi_mpi_sendrecv(tmp_buff + i * recv_count * extent, recv_count, send_type, + rank, tag, + recv_ptr + (num_procs - i - 1) * recv_count * extent, + recv_count, recv_type, rank, tag, comm, &status); + + smpi_free_tmp_buffer(tmp_buff); + return MPI_SUCCESS; }