+ if (*datatype == MPI_CHAR) {
+ APPLY_FUNC(a, b, length, char, MIN_OP);
+ } else if (*datatype == MPI_SHORT) {
+ APPLY_FUNC(a, b, length, short, MIN_OP);
+ } else if (*datatype == MPI_INT) {
+ APPLY_FUNC(a, b, length, int, MIN_OP);
+ } else if (*datatype == MPI_LONG) {
+ APPLY_FUNC(a, b, length, long, MIN_OP);
+ } else if (*datatype == MPI_UNSIGNED_SHORT) {
+ APPLY_FUNC(a, b, length, unsigned short, MIN_OP);
+ } else if (*datatype == MPI_UNSIGNED) {
+ APPLY_FUNC(a, b, length, unsigned int, MIN_OP);
+ } else if (*datatype == MPI_UNSIGNED_LONG) {
+ APPLY_FUNC(a, b, length, unsigned long, MIN_OP);
+ } else if (*datatype == MPI_UNSIGNED_CHAR) {
+ APPLY_FUNC(a, b, length, unsigned char, MIN_OP);
+ } else if (*datatype == MPI_FLOAT) {
+ APPLY_FUNC(a, b, length, float, MIN_OP);
+ } else if (*datatype == MPI_DOUBLE) {
+ APPLY_FUNC(a, b, length, double, MIN_OP);
+ } else if (*datatype == MPI_LONG_DOUBLE) {
+ APPLY_FUNC(a, b, length, long double, MIN_OP);
+ }
+}
+
+/* Reduction callback registered for MPI_SUM via CREATE_MPI_OP.
+ *
+ * Selects the C element type matching *datatype and expands
+ * APPLY_FUNC(a, b, length, <type>, SUM_OP) for it.  When called through
+ * smpi_op_apply(), a is the input vector and b the in/out vector.
+ * APPLY_FUNC and SUM_OP are defined outside this function.
+ * A datatype that matches none of the cases below is silently ignored.
+ */
+static void sum_func(void *a, void *b, int *length,
+                     MPI_Datatype * datatype)
+{
+  const MPI_Datatype kind = *datatype;
+
+  /* signed integer types */
+  if (kind == MPI_CHAR) {
+    APPLY_FUNC(a, b, length, char, SUM_OP);
+    return;
+  }
+  if (kind == MPI_SHORT) {
+    APPLY_FUNC(a, b, length, short, SUM_OP);
+    return;
+  }
+  if (kind == MPI_INT) {
+    APPLY_FUNC(a, b, length, int, SUM_OP);
+    return;
+  }
+  if (kind == MPI_LONG) {
+    APPLY_FUNC(a, b, length, long, SUM_OP);
+    return;
+  }
+
+  /* unsigned integer types */
+  if (kind == MPI_UNSIGNED_SHORT) {
+    APPLY_FUNC(a, b, length, unsigned short, SUM_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED) {
+    APPLY_FUNC(a, b, length, unsigned int, SUM_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED_LONG) {
+    APPLY_FUNC(a, b, length, unsigned long, SUM_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED_CHAR) {
+    APPLY_FUNC(a, b, length, unsigned char, SUM_OP);
+    return;
+  }
+
+  /* real floating-point types */
+  if (kind == MPI_FLOAT) {
+    APPLY_FUNC(a, b, length, float, SUM_OP);
+    return;
+  }
+  if (kind == MPI_DOUBLE) {
+    APPLY_FUNC(a, b, length, double, SUM_OP);
+    return;
+  }
+  if (kind == MPI_LONG_DOUBLE) {
+    APPLY_FUNC(a, b, length, long double, SUM_OP);
+    return;
+  }
+
+  /* complex floating-point types */
+  if (kind == MPI_C_FLOAT_COMPLEX) {
+    APPLY_FUNC(a, b, length, float _Complex, SUM_OP);
+    return;
+  }
+  if (kind == MPI_C_DOUBLE_COMPLEX) {
+    APPLY_FUNC(a, b, length, double _Complex, SUM_OP);
+    return;
+  }
+  if (kind == MPI_C_LONG_DOUBLE_COMPLEX) {
+    APPLY_FUNC(a, b, length, long double _Complex, SUM_OP);
+  }
+}
+
+/* Reduction callback registered for MPI_PROD via CREATE_MPI_OP.
+ *
+ * Selects the C element type matching *datatype and expands
+ * APPLY_FUNC(a, b, length, <type>, PROD_OP) for it.  When called through
+ * smpi_op_apply(), a is the input vector and b the in/out vector.
+ * APPLY_FUNC and PROD_OP are defined outside this function.
+ * A datatype that matches none of the cases below is silently ignored.
+ */
+static void prod_func(void *a, void *b, int *length,
+                      MPI_Datatype * datatype)
+{
+  const MPI_Datatype kind = *datatype;
+
+  /* signed integer types */
+  if (kind == MPI_CHAR) {
+    APPLY_FUNC(a, b, length, char, PROD_OP);
+    return;
+  }
+  if (kind == MPI_SHORT) {
+    APPLY_FUNC(a, b, length, short, PROD_OP);
+    return;
+  }
+  if (kind == MPI_INT) {
+    APPLY_FUNC(a, b, length, int, PROD_OP);
+    return;
+  }
+  if (kind == MPI_LONG) {
+    APPLY_FUNC(a, b, length, long, PROD_OP);
+    return;
+  }
+
+  /* unsigned integer types */
+  if (kind == MPI_UNSIGNED_SHORT) {
+    APPLY_FUNC(a, b, length, unsigned short, PROD_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED) {
+    APPLY_FUNC(a, b, length, unsigned int, PROD_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED_LONG) {
+    APPLY_FUNC(a, b, length, unsigned long, PROD_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED_CHAR) {
+    APPLY_FUNC(a, b, length, unsigned char, PROD_OP);
+    return;
+  }
+
+  /* real floating-point types */
+  if (kind == MPI_FLOAT) {
+    APPLY_FUNC(a, b, length, float, PROD_OP);
+    return;
+  }
+  if (kind == MPI_DOUBLE) {
+    APPLY_FUNC(a, b, length, double, PROD_OP);
+    return;
+  }
+  if (kind == MPI_LONG_DOUBLE) {
+    APPLY_FUNC(a, b, length, long double, PROD_OP);
+    return;
+  }
+
+  /* complex floating-point types */
+  if (kind == MPI_C_FLOAT_COMPLEX) {
+    APPLY_FUNC(a, b, length, float _Complex, PROD_OP);
+    return;
+  }
+  if (kind == MPI_C_DOUBLE_COMPLEX) {
+    APPLY_FUNC(a, b, length, double _Complex, PROD_OP);
+    return;
+  }
+  if (kind == MPI_C_LONG_DOUBLE_COMPLEX) {
+    APPLY_FUNC(a, b, length, long double _Complex, PROD_OP);
+  }
+}
+
+/* Reduction callback registered for MPI_LAND via CREATE_MPI_OP.
+ *
+ * Selects the C element type matching *datatype (integer types and
+ * MPI_C_BOOL only) and expands APPLY_FUNC(a, b, length, <type>, LAND_OP).
+ * When called through smpi_op_apply(), a is the input vector and b the
+ * in/out vector.  APPLY_FUNC and LAND_OP are defined outside this function.
+ * Any other datatype is silently ignored.
+ */
+static void land_func(void *a, void *b, int *length,
+                      MPI_Datatype * datatype)
+{
+  const MPI_Datatype kind = *datatype;
+
+  if (kind == MPI_CHAR) {
+    APPLY_FUNC(a, b, length, char, LAND_OP);
+    return;
+  }
+  if (kind == MPI_SHORT) {
+    APPLY_FUNC(a, b, length, short, LAND_OP);
+    return;
+  }
+  if (kind == MPI_INT) {
+    APPLY_FUNC(a, b, length, int, LAND_OP);
+    return;
+  }
+  if (kind == MPI_LONG) {
+    APPLY_FUNC(a, b, length, long, LAND_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED_SHORT) {
+    APPLY_FUNC(a, b, length, unsigned short, LAND_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED) {
+    APPLY_FUNC(a, b, length, unsigned int, LAND_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED_LONG) {
+    APPLY_FUNC(a, b, length, unsigned long, LAND_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED_CHAR) {
+    APPLY_FUNC(a, b, length, unsigned char, LAND_OP);
+    return;
+  }
+  if (kind == MPI_C_BOOL) {
+    APPLY_FUNC(a, b, length, _Bool, LAND_OP);
+  }
+}
+
+/* Reduction callback registered for MPI_LOR via CREATE_MPI_OP.
+ *
+ * Selects the C element type matching *datatype (integer types and
+ * MPI_C_BOOL only) and expands APPLY_FUNC(a, b, length, <type>, LOR_OP).
+ * When called through smpi_op_apply(), a is the input vector and b the
+ * in/out vector.  APPLY_FUNC and LOR_OP are defined outside this function.
+ * Any other datatype is silently ignored.
+ */
+static void lor_func(void *a, void *b, int *length,
+                     MPI_Datatype * datatype)
+{
+  const MPI_Datatype kind = *datatype;
+
+  if (kind == MPI_CHAR) {
+    APPLY_FUNC(a, b, length, char, LOR_OP);
+    return;
+  }
+  if (kind == MPI_SHORT) {
+    APPLY_FUNC(a, b, length, short, LOR_OP);
+    return;
+  }
+  if (kind == MPI_INT) {
+    APPLY_FUNC(a, b, length, int, LOR_OP);
+    return;
+  }
+  if (kind == MPI_LONG) {
+    APPLY_FUNC(a, b, length, long, LOR_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED_SHORT) {
+    APPLY_FUNC(a, b, length, unsigned short, LOR_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED) {
+    APPLY_FUNC(a, b, length, unsigned int, LOR_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED_LONG) {
+    APPLY_FUNC(a, b, length, unsigned long, LOR_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED_CHAR) {
+    APPLY_FUNC(a, b, length, unsigned char, LOR_OP);
+    return;
+  }
+  if (kind == MPI_C_BOOL) {
+    APPLY_FUNC(a, b, length, _Bool, LOR_OP);
+  }
+}
+
+/* Reduction callback registered for MPI_LXOR via CREATE_MPI_OP.
+ *
+ * Selects the C element type matching *datatype (integer types and
+ * MPI_C_BOOL only) and expands APPLY_FUNC(a, b, length, <type>, LXOR_OP).
+ * When called through smpi_op_apply(), a is the input vector and b the
+ * in/out vector.  APPLY_FUNC and LXOR_OP are defined outside this function.
+ * Any other datatype is silently ignored.
+ */
+static void lxor_func(void *a, void *b, int *length,
+                      MPI_Datatype * datatype)
+{
+  const MPI_Datatype kind = *datatype;
+
+  if (kind == MPI_CHAR) {
+    APPLY_FUNC(a, b, length, char, LXOR_OP);
+    return;
+  }
+  if (kind == MPI_SHORT) {
+    APPLY_FUNC(a, b, length, short, LXOR_OP);
+    return;
+  }
+  if (kind == MPI_INT) {
+    APPLY_FUNC(a, b, length, int, LXOR_OP);
+    return;
+  }
+  if (kind == MPI_LONG) {
+    APPLY_FUNC(a, b, length, long, LXOR_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED_SHORT) {
+    APPLY_FUNC(a, b, length, unsigned short, LXOR_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED) {
+    APPLY_FUNC(a, b, length, unsigned int, LXOR_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED_LONG) {
+    APPLY_FUNC(a, b, length, unsigned long, LXOR_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED_CHAR) {
+    APPLY_FUNC(a, b, length, unsigned char, LXOR_OP);
+    return;
+  }
+  if (kind == MPI_C_BOOL) {
+    APPLY_FUNC(a, b, length, _Bool, LXOR_OP);
+  }
+}
+
+/* Reduction callback registered for MPI_BAND via CREATE_MPI_OP.
+ *
+ * Selects the C element type matching *datatype (integer types and
+ * MPI_BYTE, the latter handled as uint8_t) and expands
+ * APPLY_FUNC(a, b, length, <type>, BAND_OP).  When called through
+ * smpi_op_apply(), a is the input vector and b the in/out vector.
+ * APPLY_FUNC and BAND_OP are defined outside this function.
+ * Any other datatype is silently ignored.
+ */
+static void band_func(void *a, void *b, int *length,
+                      MPI_Datatype * datatype)
+{
+  const MPI_Datatype kind = *datatype;
+
+  if (kind == MPI_CHAR) {
+    APPLY_FUNC(a, b, length, char, BAND_OP);
+    return;
+  }
+  if (kind == MPI_SHORT) {
+    APPLY_FUNC(a, b, length, short, BAND_OP);
+    return;
+  }
+  if (kind == MPI_INT) {
+    APPLY_FUNC(a, b, length, int, BAND_OP);
+    return;
+  }
+  if (kind == MPI_LONG) {
+    APPLY_FUNC(a, b, length, long, BAND_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED_SHORT) {
+    APPLY_FUNC(a, b, length, unsigned short, BAND_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED) {
+    APPLY_FUNC(a, b, length, unsigned int, BAND_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED_LONG) {
+    APPLY_FUNC(a, b, length, unsigned long, BAND_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED_CHAR) {
+    APPLY_FUNC(a, b, length, unsigned char, BAND_OP);
+    return;
+  }
+  if (kind == MPI_BYTE) {
+    APPLY_FUNC(a, b, length, uint8_t, BAND_OP);
+  }
+}
+
+/* Reduction callback registered for MPI_BOR via CREATE_MPI_OP.
+ *
+ * Selects the C element type matching *datatype (integer types and
+ * MPI_BYTE, the latter handled as uint8_t) and expands
+ * APPLY_FUNC(a, b, length, <type>, BOR_OP).  When called through
+ * smpi_op_apply(), a is the input vector and b the in/out vector.
+ * APPLY_FUNC and BOR_OP are defined outside this function.
+ * Any other datatype is silently ignored.
+ */
+static void bor_func(void *a, void *b, int *length,
+                     MPI_Datatype * datatype)
+{
+  const MPI_Datatype kind = *datatype;
+
+  if (kind == MPI_CHAR) {
+    APPLY_FUNC(a, b, length, char, BOR_OP);
+    return;
+  }
+  if (kind == MPI_SHORT) {
+    APPLY_FUNC(a, b, length, short, BOR_OP);
+    return;
+  }
+  if (kind == MPI_INT) {
+    APPLY_FUNC(a, b, length, int, BOR_OP);
+    return;
+  }
+  if (kind == MPI_LONG) {
+    APPLY_FUNC(a, b, length, long, BOR_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED_SHORT) {
+    APPLY_FUNC(a, b, length, unsigned short, BOR_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED) {
+    APPLY_FUNC(a, b, length, unsigned int, BOR_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED_LONG) {
+    APPLY_FUNC(a, b, length, unsigned long, BOR_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED_CHAR) {
+    APPLY_FUNC(a, b, length, unsigned char, BOR_OP);
+    return;
+  }
+  if (kind == MPI_BYTE) {
+    APPLY_FUNC(a, b, length, uint8_t, BOR_OP);
+  }
+}
+
+/* Reduction callback registered for MPI_BXOR via CREATE_MPI_OP.
+ *
+ * Selects the C element type matching *datatype (integer types and
+ * MPI_BYTE, the latter handled as uint8_t) and expands
+ * APPLY_FUNC(a, b, length, <type>, BXOR_OP).  When called through
+ * smpi_op_apply(), a is the input vector and b the in/out vector.
+ * APPLY_FUNC and BXOR_OP are defined outside this function.
+ * Any other datatype is silently ignored.
+ */
+static void bxor_func(void *a, void *b, int *length,
+                      MPI_Datatype * datatype)
+{
+  const MPI_Datatype kind = *datatype;
+
+  if (kind == MPI_CHAR) {
+    APPLY_FUNC(a, b, length, char, BXOR_OP);
+    return;
+  }
+  if (kind == MPI_SHORT) {
+    APPLY_FUNC(a, b, length, short, BXOR_OP);
+    return;
+  }
+  if (kind == MPI_INT) {
+    APPLY_FUNC(a, b, length, int, BXOR_OP);
+    return;
+  }
+  if (kind == MPI_LONG) {
+    APPLY_FUNC(a, b, length, long, BXOR_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED_SHORT) {
+    APPLY_FUNC(a, b, length, unsigned short, BXOR_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED) {
+    APPLY_FUNC(a, b, length, unsigned int, BXOR_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED_LONG) {
+    APPLY_FUNC(a, b, length, unsigned long, BXOR_OP);
+    return;
+  }
+  if (kind == MPI_UNSIGNED_CHAR) {
+    APPLY_FUNC(a, b, length, unsigned char, BXOR_OP);
+    return;
+  }
+  if (kind == MPI_BYTE) {
+    APPLY_FUNC(a, b, length, uint8_t, BXOR_OP);
+  }
+}
+
+/* Reduction callback registered for MPI_MINLOC via CREATE_MPI_OP.
+ *
+ * Selects the pair type matching *datatype and expands
+ * APPLY_FUNC(a, b, length, <pair type>, MINLOC_OP) for it.  The pair types
+ * (float_int, long_int, ...), APPLY_FUNC and MINLOC_OP are declared outside
+ * this function.  When called through smpi_op_apply(), a is the input
+ * vector and b the in/out vector.  Any other datatype is silently ignored.
+ */
+static void minloc_func(void *a, void *b, int *length,
+                        MPI_Datatype * datatype)
+{
+  const MPI_Datatype kind = *datatype;
+
+  if (kind == MPI_FLOAT_INT) {
+    APPLY_FUNC(a, b, length, float_int, MINLOC_OP);
+    return;
+  }
+  if (kind == MPI_LONG_INT) {
+    APPLY_FUNC(a, b, length, long_int, MINLOC_OP);
+    return;
+  }
+  if (kind == MPI_DOUBLE_INT) {
+    APPLY_FUNC(a, b, length, double_int, MINLOC_OP);
+    return;
+  }
+  if (kind == MPI_SHORT_INT) {
+    APPLY_FUNC(a, b, length, short_int, MINLOC_OP);
+    return;
+  }
+  if (kind == MPI_2LONG) {
+    APPLY_FUNC(a, b, length, long_long, MINLOC_OP);
+    return;
+  }
+  if (kind == MPI_2INT) {
+    APPLY_FUNC(a, b, length, int_int, MINLOC_OP);
+    return;
+  }
+  if (kind == MPI_LONG_DOUBLE_INT) {
+    APPLY_FUNC(a, b, length, long_double_int, MINLOC_OP);
+    return;
+  }
+  if (kind == MPI_2FLOAT) {
+    APPLY_FUNC(a, b, length, float_float, MINLOC_OP);
+    return;
+  }
+  if (kind == MPI_2DOUBLE) {
+    APPLY_FUNC(a, b, length, double_double, MINLOC_OP);
+  }
+}
+
+/* Reduction callback registered for MPI_MAXLOC via CREATE_MPI_OP.
+ *
+ * Selects the pair type matching *datatype and expands
+ * APPLY_FUNC(a, b, length, <pair type>, MAXLOC_OP) for it.  The pair types
+ * (float_int, long_int, ...), APPLY_FUNC and MAXLOC_OP are declared outside
+ * this function.  When called through smpi_op_apply(), a is the input
+ * vector and b the in/out vector.  Any other datatype is silently ignored.
+ */
+static void maxloc_func(void *a, void *b, int *length,
+                        MPI_Datatype * datatype)
+{
+  const MPI_Datatype kind = *datatype;
+
+  if (kind == MPI_FLOAT_INT) {
+    APPLY_FUNC(a, b, length, float_int, MAXLOC_OP);
+    return;
+  }
+  if (kind == MPI_LONG_INT) {
+    APPLY_FUNC(a, b, length, long_int, MAXLOC_OP);
+    return;
+  }
+  if (kind == MPI_DOUBLE_INT) {
+    APPLY_FUNC(a, b, length, double_int, MAXLOC_OP);
+    return;
+  }
+  if (kind == MPI_SHORT_INT) {
+    APPLY_FUNC(a, b, length, short_int, MAXLOC_OP);
+    return;
+  }
+  if (kind == MPI_2LONG) {
+    APPLY_FUNC(a, b, length, long_long, MAXLOC_OP);
+    return;
+  }
+  if (kind == MPI_2INT) {
+    APPLY_FUNC(a, b, length, int_int, MAXLOC_OP);
+    return;
+  }
+  if (kind == MPI_LONG_DOUBLE_INT) {
+    APPLY_FUNC(a, b, length, long_double_int, MAXLOC_OP);
+    return;
+  }
+  if (kind == MPI_2FLOAT) {
+    APPLY_FUNC(a, b, length, float_float, MAXLOC_OP);
+    return;
+  }
+  if (kind == MPI_2DOUBLE) {
+    APPLY_FUNC(a, b, length, double_double, MAXLOC_OP);
+  }
+}
+
+/* Reduction callback registered for MPI_REPLACE via CREATE_MPI_OP.
+ *
+ * Overwrites b with the contents of a: copies
+ * (*length) * smpi_datatype_size(*datatype) bytes with memcpy, so the two
+ * buffers must not overlap.
+ */
+static void replace_func(void *a, void *b, int *length,
+                         MPI_Datatype * datatype)
+{
+  const size_t nbytes = *length * smpi_datatype_size(*datatype);
+
+  memcpy(b, a, nbytes);
+}
+
+/* Defines one predefined reduction operator.
+ *
+ * Expands to a file-local s_smpi_mpi_op_t object named mpi_<name> whose
+ * callback is `callback` and whose is_commute flag is TRUE, followed by the
+ * global MPI_Op handle <name> pointing at that object.
+ * The macro parameter is deliberately not called `func`, so that it cannot
+ * be substituted into the `.func` member designator.
+ */
+#define CREATE_MPI_OP(name, callback)                     \
+  static s_smpi_mpi_op_t mpi_##name = {                   \
+    .func = &(callback),                                  \
+    .is_commute = TRUE                                    \
+  };                                                      \
+  MPI_Op name = &mpi_##name;
+
+/* Predefined operators, each bound to its reduction callback. */
+CREATE_MPI_OP(MPI_MAX, max_func);
+CREATE_MPI_OP(MPI_MIN, min_func);
+CREATE_MPI_OP(MPI_SUM, sum_func);
+CREATE_MPI_OP(MPI_PROD, prod_func);
+CREATE_MPI_OP(MPI_LAND, land_func);
+CREATE_MPI_OP(MPI_LOR, lor_func);
+CREATE_MPI_OP(MPI_LXOR, lxor_func);
+CREATE_MPI_OP(MPI_BAND, band_func);
+CREATE_MPI_OP(MPI_BOR, bor_func);
+CREATE_MPI_OP(MPI_BXOR, bxor_func);
+CREATE_MPI_OP(MPI_MAXLOC, maxloc_func);
+CREATE_MPI_OP(MPI_MINLOC, minloc_func);
+CREATE_MPI_OP(MPI_REPLACE, replace_func);
+
+
+/* Allocates a new operator with xbt_new and initialises it.
+ *
+ * function: reduction callback stored in the operator's func field.
+ * commute:  value stored in the operator's is_commute field.
+ * Returns the newly allocated operator; smpi_op_destroy() releases it.
+ */
+MPI_Op smpi_op_new(MPI_User_function * function, int commute)
+{
+  MPI_Op created = xbt_new(s_smpi_mpi_op_t, 1);
+
+  created->is_commute = commute;
+  created->func = function;
+  return created;
+}
+
+/* Returns the is_commute flag of op.
+ * MPI_OP_NULL is reported as commutative (1) without being dereferenced.
+ */
+int smpi_op_is_commute(MPI_Op op)
+{
+  if (op == MPI_OP_NULL) {
+    return 1;
+  }
+  return op->is_commute;
+}
+
+/* Releases an operator by handing it to xbt_free.
+ *
+ * NOTE(review): the predefined operators created by CREATE_MPI_OP point at
+ * static objects, so this presumably must only be called on operators
+ * obtained from smpi_op_new() - confirm that callers filter them out.
+ */
+void smpi_op_destroy(MPI_Op op)
+{
+ xbt_free(op);
+}
+
+/* Runs the reduction callback of op on the given vectors.
+ *
+ * Nothing happens for MPI_OP_NULL.  Otherwise, when
+ * smpi_privatize_global_variables is set, the data segment of the current
+ * process is switched in first; the callback op->func(invec, inoutvec, len,
+ * datatype) is then invoked unless smpi_process_get_replaying() reports
+ * that the process is replaying.
+ */
+void smpi_op_apply(MPI_Op op, void *invec, void *inoutvec, int *len,
+                   MPI_Datatype * datatype)
+{
+  if (op == MPI_OP_NULL) {
+    return;
+  }
+
+  if (smpi_privatize_global_variables) {
+    /* we need to switch here, as the called function may silently touch
+     * global variables */
+    XBT_DEBUG("Applying operation, switch to the right data frame ");
+    smpi_switch_data_segment(smpi_process_index());
+  }
+
+  if (smpi_process_get_replaying()) {
+    return;
+  }
+  op->func(invec, inoutvec, len, datatype);
+}
+
+/* Removes the attribute stored under keyval from a datatype.
+ *
+ * Returns MPI_ERR_ARG when no keyval has been registered yet
+ * (smpi_type_keyvals is NULL), when keyval is unknown, or when the datatype
+ * has no attribute stored under keyval.  If the keyval has a delete callback
+ * other than MPI_NULL_DELETE_FN, it is invoked with the stored value first
+ * and a non-MPI_SUCCESS result is returned as-is without removing anything.
+ * Returns MPI_SUCCESS once the entry has been removed.
+ */
+int smpi_type_attr_delete(MPI_Datatype type, int keyval){
+  /* The keyval registry is created lazily; guard it the same way
+   * smpi_type_attr_put() does instead of handing NULL to the dictionary. */
+  if(!smpi_type_keyvals)
+    return MPI_ERR_ARG;
+  smpi_type_key_elem elem = xbt_dict_get_or_null_ext(smpi_type_keyvals, (const char*)&keyval, sizeof(int));
+  if(!elem)
+    return MPI_ERR_ARG;
+
+  /* Look the attribute up first: the callback must never see an
+   * uninitialized value, and an absent key must not be removed. */
+  void * value = NULL;
+  int flag = 0;
+  if(smpi_type_attr_get(type, keyval, &value, &flag)!=MPI_SUCCESS || !flag)
+    return MPI_ERR_ARG;
+
+  if(elem->delete_fn!=MPI_NULL_DELETE_FN){
+    /* NOTE(review): the last argument is the address of the local flag, not
+     * the extra_state given at keyval creation - confirm this is intended. */
+    int ret = elem->delete_fn(type, keyval, value, &flag);
+    if(ret!=MPI_SUCCESS) return ret;
+  }
+
+  /* Kept as a defensive check; a set flag implies the dictionary exists
+   * unless the callback changed it. */
+  if(type->attributes==NULL)
+    return MPI_ERR_ARG;
+
+  xbt_dict_remove_ext(type->attributes, (const char*)&keyval, sizeof(int));
+  return MPI_SUCCESS;
+}
+
+/* Fetches the attribute stored under keyval on a datatype.
+ *
+ * attr_value is treated as a void** and receives the stored pointer.
+ * *flag is set to 1 when the attribute was found, and to 0 when the datatype
+ * has no attribute dictionary or the lookup raises an exception.
+ * Returns MPI_ERR_ARG when no keyval has been registered yet
+ * (smpi_type_keyvals is NULL) or keyval is unknown; in those cases neither
+ * *flag nor *attr_value is written.  Returns MPI_SUCCESS otherwise.
+ */
+int smpi_type_attr_get(MPI_Datatype type, int keyval, void* attr_value, int* flag){
+  /* The keyval registry is created lazily; guard it the same way
+   * smpi_type_attr_put() does instead of handing NULL to the dictionary. */
+  if(!smpi_type_keyvals)
+    return MPI_ERR_ARG;
+  smpi_type_key_elem elem = xbt_dict_get_or_null_ext(smpi_type_keyvals, (const char*)&keyval, sizeof(int));
+  if(!elem)
+    return MPI_ERR_ARG;
+  xbt_ex_t ex;
+  if(type->attributes==NULL){
+    *flag=0;
+    return MPI_SUCCESS;
+  }
+  /* The throwing lookup is used rather than the *_or_null variant so that a
+   * stored NULL value can be told apart from a missing key. */
+  TRY {
+    *(void**)attr_value = xbt_dict_get_ext(type->attributes, (const char*)&keyval, sizeof(int));
+    *flag=1;
+  }
+  CATCH(ex) {
+    *flag=0;
+    xbt_ex_free(ex);
+  }
+  return MPI_SUCCESS;
+}
+
+/* Stores attr_value under keyval on a datatype.
+ *
+ * The keyval registry and the datatype's attribute dictionary are created on
+ * demand.  Returns MPI_ERR_ARG when keyval is not registered.  If a value is
+ * already stored and the keyval has a delete callback other than
+ * MPI_NULL_DELETE_FN, that callback is run on the old value first; a
+ * non-MPI_SUCCESS result is returned as-is and nothing is stored.
+ * Returns MPI_SUCCESS after the value has been stored.
+ */
+int smpi_type_attr_put(MPI_Datatype type, int keyval, void* attr_value){
+  const char *key = (const char*)&keyval;
+
+  if (smpi_type_keyvals == NULL) {
+    smpi_type_keyvals = xbt_dict_new();
+  }
+
+  smpi_type_key_elem key_info = xbt_dict_get_or_null_ext(smpi_type_keyvals, key, sizeof(int));
+  if (key_info == NULL) {
+    return MPI_ERR_ARG;
+  }
+
+  /* Give the delete callback a chance to release the value being replaced. */
+  int was_set;
+  void *previous;
+  smpi_type_attr_get(type, keyval, &previous, &was_set);
+  if (was_set) {
+    if (key_info->delete_fn != MPI_NULL_DELETE_FN) {
+      int status = key_info->delete_fn(type, keyval, previous, &was_set);
+      if (status != MPI_SUCCESS) {
+        return status;
+      }
+    }
+  }
+
+  if (type->attributes == NULL) {
+    type->attributes = xbt_dict_new();
+  }
+  xbt_dict_set_ext(type->attributes, key, sizeof(int), attr_value, NULL);
+  return MPI_SUCCESS;
+}
+
+/* Registers a new datatype attribute key.
+ *
+ * A zero-initialised key element is allocated, copy_fn and delete_fn are
+ * recorded in it, and it is stored in smpi_type_keyvals (created on demand)
+ * under the current value of type_keyval_id.  That id is written to *keyval
+ * and the counter is then advanced.  extra_state is not used by this
+ * function.  Always returns MPI_SUCCESS.
+ */
+int smpi_type_keyval_create(MPI_Type_copy_attr_function* copy_fn, MPI_Type_delete_attr_function* delete_fn, int* keyval, void* extra_state){
+  if (smpi_type_keyvals == NULL) {
+    smpi_type_keyvals = xbt_dict_new();
+  }
+
+  smpi_type_key_elem entry = (smpi_type_key_elem) xbt_new0(s_smpi_mpi_type_key_elem_t, 1);
+  entry->copy_fn = copy_fn;
+  entry->delete_fn = delete_fn;
+
+  /* The bytes of the integer id itself are the dictionary key. */
+  *keyval = type_keyval_id;
+  xbt_dict_set_ext(smpi_type_keyvals, (const char*)keyval, sizeof(int), (void*)entry, NULL);
+  type_keyval_id += 1;
+
+  return MPI_SUCCESS;
+}
+
+/* Unregisters the attribute key *keyval and frees its key element.
+ *
+ * Returns MPI_ERR_ARG when no keyval has been registered yet
+ * (smpi_type_keyvals is NULL) or *keyval is unknown, MPI_SUCCESS otherwise.
+ * *keyval itself is left unchanged.
+ */
+int smpi_type_keyval_free(int* keyval){
+  /* The keyval registry is created lazily; guard it the same way
+   * smpi_type_attr_put() does instead of handing NULL to the dictionary. */
+  if(!smpi_type_keyvals)
+    return MPI_ERR_ARG;
+  smpi_type_key_elem elem = xbt_dict_get_or_null_ext(smpi_type_keyvals, (const char*)keyval, sizeof(int));
+  if(!elem){
+    return MPI_ERR_ARG;
+  }
+  xbt_dict_remove_ext(smpi_type_keyvals, (const char*)keyval, sizeof(int));
+  xbt_free(elem);
+  return MPI_SUCCESS;
+}
+
+/* Packs incount elements of the given datatype from inbuf into outbuf.
+ *
+ * outcount is the size of outbuf in bytes and *position the byte offset at
+ * which writing starts; on success *position is advanced by
+ * incount * smpi_datatype_size(type).  comm is not used by this function.
+ * Returns MPI_ERR_BUFFER when *position lies outside [0, outcount] or when
+ * the space left after *position is too small, MPI_SUCCESS otherwise.
+ */
+int smpi_mpi_pack(void* inbuf, int incount, MPI_Datatype type, void* outbuf, int outcount, int* position, MPI_Comm comm){
+  size_t size = smpi_datatype_size(type);
+
+  /* Reject an out-of-range offset before doing any unsigned arithmetic: a
+   * negative "outcount - *position" would otherwise be converted to a huge
+   * size_t and slip through the capacity check below. */
+  if (*position < 0 || *position > outcount)
+    return MPI_ERR_BUFFER;
+
+  size_t remaining = (size_t)(outcount - *position);
+  /* A negative incount converts to a very large product and is rejected
+   * here as well. */
+  if (remaining < incount*size)
+    return MPI_ERR_BUFFER;
+
+  smpi_datatype_copy(inbuf, incount, type,
+                     (char*)outbuf + *position, outcount, MPI_CHAR);
+  *position += incount * size;
+  return MPI_SUCCESS;
+}
+
+int smpi_mpi_unpack(void* inbuf, int insize, int* position, void* outbuf, int outcount, MPI_Datatype type, MPI_Comm comm){
+ size_t size = smpi_datatype_size(type);
+ if (outcount*size> insize)
+ return MPI_ERR_BUFFER;
+ smpi_datatype_copy((char*)inbuf + *position, insize, MPI_CHAR,
+ outbuf, outcount, type);
+ *position += outcount * size;
+ return MPI_SUCCESS;