Logo AND Algorithmique Numérique Distribuée

Public GIT Repository
make sure union and struct are closed before exchange; more useful debug
[simgrid.git] / src / gras / DataDesc / ddt_exchange.c
index 579f2ea..05905c3 100644 (file)
@@ -10,9 +10,9 @@
 
 #include "DataDesc/datadesc_private.h"
 
-GRAS_LOG_NEW_DEFAULT_SUBCATEGORY(exchange,DataDesc);
+GRAS_LOG_NEW_DEFAULT_SUBCATEGORY(exchange,datadesc);
 
-static const char *gras_datadesc_cat_names[9] = { 
+const char *gras_datadesc_cat_names[9] = { 
   "undefined", 
   "scalar", "struct", "union", "ref", "array", "ignored",
   "invalid"};
@@ -43,16 +43,18 @@ gras_datadesc_recv_rec(gras_socket_t        *sock,
                       int                   r_arch,
                       char                **r_data,
                       long int              r_lgr,
-                      char                **dst);
+                      char                 *dst,
+                      int                   subsize);
 
 
 static gras_error_t
 gras_dd_send_int(gras_socket_t *sock,int i) {
-  gras_error_t errcode;
 
-  if (!int_type) 
-    TRY(gras_datadesc_by_name("int", &int_type));
-  
+  if (!int_type) {
+    int_type = gras_datadesc_by_name("int");
+     gras_assert(int_type);  
+  }
+   
   DEBUG1("send_int(%d)",i);
   return gras_trp_chunk_send(sock, (char*)&i, int_type->size[GRAS_THISARCH]);
 }
@@ -61,17 +63,19 @@ static gras_error_t
 gras_dd_recv_int(gras_socket_t *sock, int r_arch, int *i) {
   gras_error_t errcode;
 
-  if (!int_type) 
-    TRY(gras_datadesc_by_name("int", &int_type));
+  if (!int_type) {
+     int_type = gras_datadesc_by_name("int");
+     gras_assert(int_type);
+  }
 
   if (int_type->size[GRAS_THISARCH] >= int_type->size[r_arch]) {
     TRY(gras_trp_chunk_recv(sock, (char*)i, int_type->size[r_arch]));
-    TRY(gras_dd_convert_elm(int_type,r_arch, i,i));
+    TRY(gras_dd_convert_elm(int_type,1,r_arch, i,i));
   } else {
     void *ptr = NULL;
     ptr = malloc((size_t)int_type->size[r_arch]);
     TRY(gras_trp_chunk_recv(sock, (char*)ptr, int_type->size[r_arch]));
-    TRY(gras_dd_convert_elm(int_type,r_arch, ptr,i));
+    TRY(gras_dd_convert_elm(int_type,1,r_arch, ptr,i));
     free(ptr);
   }
   DEBUG1("recv_int(%d)",*i);
@@ -119,12 +123,12 @@ gras_dd_alloc_ref(gras_dict_t *refs,
     void *ptr = malloc(sizeof(void *));
     if (!ptr)
       RAISE_MALLOC;
-    //    memcpy(ptr,&l_data, sizeof(void *));
+
     memcpy(ptr,l_ref, sizeof(void *));
 
     DEBUG2("Insert %p under %p",*(void**)ptr, *(void**)r_ref);
-    /* FIXME: Leaking on the ptr. Do I really need to copy it? */
-    TRY(gras_dict_set_ext(refs,(const char *) r_ref, r_len, ptr, NULL));
+
+    TRY(gras_dict_set_ext(refs,(const char *) r_ref, r_len, ptr, free));
   }
   return no_error;
 }
@@ -143,25 +147,62 @@ int gras_datadesc_type_cmp(const gras_datadesc_type_t *d1,
   gras_dd_cat_field_t *field1,*field2;
   gras_datadesc_type_t *field_desc_1,*field_desc_2;
 
+  if (d1 == d2) return 0; /* easy optimization */
 
-  if (!d1 && d2) return 1;
-  if (!d1 && !d2) return 0;
-  if ( d1 && !d2) return -1;
+  if (!d1 && d2) {
+    DEBUG0("ddt_cmp: !d1 && d2 => 1");
+    return 1;
+  }
+  if (!d1 && !d2) {
+    DEBUG0("ddt_cmp: !d1 && !d2 => 0");
+    return 0;
+  }
+  if ( d1 && !d2) {
+    DEBUG0("ddt_cmp: d1 && !d2 => -1");
+    return -1;
+  }
 
-  if      (d1->size          != d2->size     )     
-    return d1->size          >  d2->size         ? 1 : -1;
-  if      (d1->alignment     != d2->alignment)     
-    return d1->alignment     >  d2->alignment    ? 1 : -1;
-  if      (d1->aligned_size  != d2->aligned_size)  
-    return d1->aligned_size  >  d2->aligned_size ? 1 : -1;
+  for (cpt=0; cpt<gras_arch_count; cpt++) {
+    if (d1->size[cpt] != d2->size[cpt]) {
+      DEBUG5("ddt_cmp: %s->size=%d  !=  %s->size=%d (on %s)",
+            d1->name,d1->size[cpt],d2->name,d2->size[cpt],
+            gras_arches[cpt].name);
+      return d1->size[cpt] >  d2->size[cpt] ? 1 : -1;
+    }
 
-  if      (d1->category_code != d2->category_code) 
-    return d1->category_code >  d2->category_code ? 1 : -1;
+    if (d1->alignment[cpt] != d2->alignment[cpt]) {
+      DEBUG5("ddt_cmp: %s->alignment=%d  !=  %s->alignment=%d (on %s)",
+            d1->name,d1->alignment[cpt],d2->name,d2->alignment[cpt],
+            gras_arches[cpt].name);
+      return d1->alignment[cpt] > d2->alignment[cpt] ? 1 : -1;
+    }
 
-  if      (d1->pre          != d2->pre)           
-    return d1->pre          >  d2->pre ? 1 : -1;
-  if      (d1->post         != d2->post)
-    return d1->post          > d2->post ? 1 : -1;
+    if (d1->aligned_size[cpt] != d2->aligned_size[cpt]) {
+      DEBUG5("ddt_cmp: %s->aligned_size=%d  !=  %s->aligned_size=%d (on %s)",
+            d1->name,d1->aligned_size[cpt],d2->name,d2->aligned_size[cpt],
+            gras_arches[cpt].name);
+      return d1->aligned_size[cpt] > d2->aligned_size[cpt] ? 1 : -1;
+    }
+  }
+
+  if (d1->category_code != d2->category_code) {
+    DEBUG4("ddt_cmp: %s->cat=%s  !=  %s->cat=%s",
+          d1->name,gras_datadesc_cat_names[d1->category_code],
+          d2->name,gras_datadesc_cat_names[d2->category_code]);
+    return d1->category_code > d2->category_code ? 1 : -1;
+  }
+
+  if (d1->pre != d2->pre) {
+    DEBUG4("ddt_cmp: %s->pre=%p  !=  %s->pre=%p",
+          d1->name,d1->pre, d2->name,d2->pre);
+    return d1->pre > d2->pre ? 1 : -1;
+  }
+
+  if (d1->post != d2->post) {
+    DEBUG4("ddt_cmp: %s->post=%p  !=  %s->post=%p",
+          d1->name,d1->post, d2->name,d2->post);
+    return d1->post > d2->post ? 1 : -1;
+  }
 
   switch (d1->category_code) {
   case e_gras_datadesc_type_cat_scalar:
@@ -171,19 +212,27 @@ int gras_datadesc_type_cmp(const gras_datadesc_type_t *d1,
     
   case e_gras_datadesc_type_cat_struct:    
     if (gras_dynar_length(d1->category.struct_data.fields) != 
-       gras_dynar_length(d2->category.struct_data.fields))
+       gras_dynar_length(d2->category.struct_data.fields)) {
+      DEBUG4("ddt_cmp: %s (having %d fields) !=  %s (having %d fields)",
+            d1->name, gras_dynar_length(d1->category.struct_data.fields),
+            d2->name, gras_dynar_length(d2->category.struct_data.fields));
+      
       return gras_dynar_length(d1->category.struct_data.fields) >
        gras_dynar_length(d2->category.struct_data.fields) ?
        1 : -1;
-    
+    }
     gras_dynar_foreach(d1->category.struct_data.fields, cpt, field1) {
       
-      gras_dynar_get(d2->category.struct_data.fields, cpt, field2);
+      gras_dynar_get(d2->category.struct_data.fields, cpt, &field2);
       gras_datadesc_by_id(field1->code,&field_desc_1); /* FIXME: errcode ignored */
       gras_datadesc_by_id(field2->code,&field_desc_2);
       ret = gras_datadesc_type_cmp(field_desc_1,field_desc_2);
-      if (ret)
+      if (ret) {
+       DEBUG6("%s->field[%d]=%s != %s->field[%d]=%s",
+              d1->name,cpt,field1->name,              
+              d2->name,cpt,field2->name);
        return ret;
+      }
       
     }
     break;
@@ -282,17 +331,25 @@ gras_datadesc_send_rec(gras_socket_t        *sock,
     gras_dd_cat_field_t  *field;
     char                 *field_data;
 
+   gras_assert1(type->category.struct_data.closed,
+               "Please call gras_datadesc_declare_array_close on %s before sending it",
+               type->name);
     struct_data = type->category.struct_data;
     VERB1(">> Send all fields of the structure %s",type->name);
     gras_dynar_foreach(struct_data.fields, cpt, field) {
       field_data = data;
       field_data += field->offset[GRAS_THISARCH];
       
-      TRY(gras_datadesc_by_id(field->code, &sub_type));
+      errcode=gras_datadesc_by_id(field->code, &sub_type);
+      if (errcode != no_error) 
+       RAISE4(errcode,
+              "Got %s while searching for the sub type %d, #%d of %s",
+              gras_error_name(errcode),field->code,cpt,type->name);
       
       if (field->pre)
        field->pre(state,sub_type,field_data);
       
+      VERB1("Send field %s",field->name);
       TRY(gras_datadesc_send_rec(sock,state,refs,sub_type, field_data));
       
       if (field->post)
@@ -310,6 +367,9 @@ gras_datadesc_send_rec(gras_socket_t        *sock,
     
     union_data = type->category.union_data;
     
+    gras_assert1(union_data.closed,
+               "Please call gras_datadesc_declare_union_close on %s before sending it",
+               type->name);
     /* retrieve the field number */
     field_num = union_data.selector(state, type, data);
     
@@ -356,8 +416,11 @@ gras_datadesc_send_rec(gras_socket_t        *sock,
     }
     
     /* Send the actual value of the pointer for cycle handling */
-    if (!pointer_type)
-      TRY(gras_datadesc_by_name("data pointer", &pointer_type));
+    if (!pointer_type) {
+      pointer_type = gras_datadesc_by_name("data pointer");
+      gras_assert(pointer_type);
+    }
+     
     TRY(gras_trp_chunk_send(sock, (char*)data,
                            pointer_type->size[GRAS_THISARCH]));
     
@@ -402,9 +465,15 @@ gras_datadesc_send_rec(gras_socket_t        *sock,
     /* send the content */
     TRY(gras_datadesc_by_id(array_data.code, &sub_type));
     elm_size = sub_type->aligned_size[GRAS_THISARCH];
-    for (cpt=0; cpt<count; cpt++) {
-      TRY(gras_datadesc_send_rec(sock,state,refs, sub_type, ptr));
-      ptr += elm_size;
+    if (sub_type->category_code == e_gras_datadesc_type_cat_scalar) {
+      VERB1("Array of %d scalars, send it in one shoot",count);
+      TRY(gras_trp_chunk_send(sock, data, 
+                             sub_type->aligned_size[GRAS_THISARCH] * count));
+    } else {
+      for (cpt=0; cpt<count; cpt++) {
+       TRY(gras_datadesc_send_rec(sock,state,refs, sub_type, ptr));
+       ptr += elm_size;
+      }
     }
     break;
   }
@@ -449,6 +518,13 @@ gras_error_t gras_datadesc_send(gras_socket_t *sock,
  * gras_datadesc_recv_rec:
  *
  * Do the data reception job recursively.
+ *
+ * subsize is used only to deal with the vicious case of a reference to a
+ * dynamic array. This size is needed at the reference reception level (to
+ * allocate enough space) and at the array reception level (to fill enough room).
+ *
+ * Having this size passed as an argument of the recursive function is a crude
+ * hack, but I was told that working code is sometimes better than neat code ;)
  */
 gras_error_t
 gras_datadesc_recv_rec(gras_socket_t        *sock, 
@@ -458,30 +534,26 @@ gras_datadesc_recv_rec(gras_socket_t        *sock,
                       int                   r_arch,
                       char                **r_data,
                       long int              r_lgr,
-                      char                **dst) {
+                      char                 *l_data,
+                      int                   subsize) {
 
   gras_error_t          errcode;
-  char                 *l_data = *dst; /* dereference to avoid typo */
   int                   cpt;
   gras_datadesc_type_t *sub_type;
 
-  VERB1("Recv a %s", type->name);
+  VERB2("Recv a %s @%p", type->name, l_data);
+  gras_assert(l_data);
 
   switch (type->category_code) {
   case e_gras_datadesc_type_cat_scalar:
-    if (!l_data) {
-      TRY(gras_dd_alloc_ref(refs,type->size[GRAS_THISARCH],r_data,r_lgr, dst));
-      l_data = *dst;
-    } 
-    
-    if (type->size[GRAS_THISARCH] >= type->size[r_arch]) {
+    if (type->size[GRAS_THISARCH] == type->size[r_arch]) {
       TRY(gras_trp_chunk_recv(sock, (char*)l_data, type->size[r_arch]));
-      TRY(gras_dd_convert_elm(type,r_arch, l_data,l_data));
+      TRY(gras_dd_convert_elm(type,1,r_arch, l_data,l_data));
     } else {
       void *ptr = NULL;
       ptr = malloc((size_t)type->size[r_arch]);
       TRY(gras_trp_chunk_recv(sock, (char*)ptr, type->size[r_arch]));
-      TRY(gras_dd_convert_elm(type,r_arch, ptr,l_data));
+      TRY(gras_dd_convert_elm(type,1,r_arch, ptr,l_data));
       free(ptr);
     }
     break;
@@ -492,11 +564,9 @@ gras_datadesc_recv_rec(gras_socket_t        *sock,
 
     struct_data = type->category.struct_data;
 
-    if (!l_data) {
-      TRY(gras_dd_alloc_ref(refs,type->size[GRAS_THISARCH],r_data,r_lgr, dst));
-      l_data = *dst;
-    } 
-
+    gras_assert1(struct_data.closed,
+               "Please call gras_datadesc_declare_struct_close on %s before receiving it",
+               type->name);
     VERB1(">> Receive all fields of the structure %s",type->name);
     gras_dynar_foreach(struct_data.fields, cpt, field) {
       char                 *field_data = l_data + field->offset[GRAS_THISARCH];
@@ -505,7 +575,7 @@ gras_datadesc_recv_rec(gras_socket_t        *sock,
 
       TRY(gras_datadesc_recv_rec(sock,state,refs, sub_type,
                                 r_arch,NULL,0,
-                                &field_data));
+                                field_data,-1));
     }
     VERB1("<< Received all fields of the structure %s", type->name);
     
@@ -519,11 +589,9 @@ gras_datadesc_recv_rec(gras_socket_t        *sock,
 
     union_data = type->category.union_data;
 
-    if (!l_data) {
-      TRY(gras_dd_alloc_ref(refs,type->size[GRAS_THISARCH],r_data,r_lgr, dst));
-      l_data = *dst;
-    } 
-
+    gras_assert1(union_data.closed,
+               "Please call gras_datadesc_declare_union_close on %s before receiving it",
+               type->name);
     /* retrieve the field number */
     TRY(gras_dd_recv_int(sock, r_arch, &field_num));
     if (field_num < 0)
@@ -540,7 +608,7 @@ gras_datadesc_recv_rec(gras_socket_t        *sock,
     
     TRY(gras_datadesc_recv_rec(sock,state,refs, sub_type,
                               r_arch,NULL,0,
-                              dst));
+                              l_data,-1));
     break;
   }
 
@@ -558,24 +626,22 @@ gras_datadesc_recv_rec(gras_socket_t        *sock,
       TRY(gras_dd_recv_int(sock, r_arch, &ref_code));
 
     /* Get the actual value of the pointer for cycle handling */
-    if (!pointer_type)
-      TRY(gras_datadesc_by_name("data pointer", &pointer_type));
+    if (!pointer_type) {
+      pointer_type = gras_datadesc_by_name("data pointer");
+      gras_assert(pointer_type);
+    }
 
     if (! (r_ref = malloc((size_t)pointer_type->size[r_arch])) )
       RAISE_MALLOC;
     TRY(gras_trp_chunk_recv(sock, (char*)r_ref,
                            pointer_type->size[r_arch]));
 
-    if (!l_data) {
-      TRY(gras_dd_alloc_ref(refs,type->size[GRAS_THISARCH],r_data,r_lgr, dst));
-      l_data = *dst;
-    } 
-
     /* Receive the pointed data only if not already sent */
     if (gras_dd_is_r_null(r_ref, pointer_type->size[r_arch])) {
-      VERB1("Not receiving data remotely referenced at %p since it's NULL",
+      VERB1("Not receiving data remotely referenced @%p since it's NULL",
            *(void **)r_ref);
       *(void**)l_data = NULL;
+      free(r_ref);
       break;
     }
     errcode = gras_dict_get_ext(refs,
@@ -584,28 +650,53 @@ gras_datadesc_recv_rec(gras_socket_t        *sock,
 
 
     if (errcode == mismatch_error) {
+      int subsubcount = -1;
       void *l_referenced=NULL;
-      VERB1("Receiving data remotely referenced at %p", *(void**)r_ref);
 
       TRY(gras_datadesc_by_id(ref_code, &sub_type));
-      //      DEBUG2("l_ref= %p; &l_ref=%p",l_referenced,&l_referenced);
+      
+      VERB2("Receiving a ref to '%s', remotely @%p",
+           sub_type->name, *(void**)r_ref);
+      if (sub_type->category_code == e_gras_datadesc_type_cat_array) {
+       /* Damn. Reference to a dynamic array. Allocating the size for it 
+          is more complicated */
+       gras_dd_cat_array_t array_data = sub_type->category.array_data;
+       gras_datadesc_type_t *subsub_type;
+
+       subsubcount = array_data.fixed_size;
+       if (subsubcount < 0)
+         TRY(gras_dd_recv_int(sock, r_arch, &subsubcount));
+
+       TRY(gras_datadesc_by_id(array_data.code, &subsub_type));
+
+
+       TRY(gras_dd_alloc_ref(refs,
+                             subsub_type->size[GRAS_THISARCH] * subsubcount, 
+                             r_ref,pointer_type->size[r_arch], 
+                             (char**)&l_referenced));
+      } else {
+       TRY(gras_dd_alloc_ref(refs,sub_type->size[GRAS_THISARCH], 
+                             r_ref,pointer_type->size[r_arch], 
+                             (char**)&l_referenced));
+      }
+
       TRY(gras_datadesc_recv_rec(sock,state,refs, sub_type,
                                 r_arch,r_ref,pointer_type->size[r_arch],
-                                (char**)&l_referenced));
+                                (char*)l_referenced, subsubcount));
       *(void**)l_data=l_referenced;
+      VERB3("'%s' remotely referenced at %p locally at %p",
+           sub_type->name, *(void**)r_ref, l_referenced);
       
     } else if (errcode == no_error) {
-      VERB1("NOT receiving data remotely referenced at %p (already done). ",
-           *(void**)r_ref);
-
-      VERB2("l_ref=%p; *l_ref=%p", l_ref,*l_ref);
+      VERB2("NOT receiving data remotely referenced @%p (already done, @%p here)",
+           *(void**)r_ref, *(void**)l_ref);
 
       *(void**)l_data=*l_ref;
 
     } else {
       return errcode;
     }
-    VERB1("*l_data=%p",*(void**)l_data);
+    free(r_ref);
     break;
   }
 
@@ -616,9 +707,11 @@ gras_datadesc_recv_rec(gras_socket_t        *sock,
     long int  elm_size;
 
     array_data = type->category.array_data;
-    /* determine element count locally or from peer */
+    /* determine element count locally, or from caller, or from peer */
     count = array_data.fixed_size;
     if (count <= 0)
+      count = subsize;
+    if (count < 0)
       TRY(gras_dd_recv_int(sock, r_arch, &count));
     if (count < 0)
       RAISE1(mismatch_error,
@@ -626,18 +719,31 @@ gras_datadesc_recv_rec(gras_socket_t        *sock,
 
     /* receive the content */
     TRY(gras_datadesc_by_id(array_data.code, &sub_type));
-    elm_size = sub_type->aligned_size[GRAS_THISARCH];
-    
-    if (!l_data) {
-      TRY(gras_dd_alloc_ref(refs,elm_size*count,r_data,r_lgr, dst));
-      l_data = *dst;
-    } 
-
-    ptr = l_data;
-    for (cpt=0; cpt<count; cpt++) {
-      TRY(gras_datadesc_recv_rec(sock,state,refs, sub_type,
-                                r_arch, NULL, 0, &ptr));
-      ptr += elm_size;
+    if (sub_type->category_code == e_gras_datadesc_type_cat_scalar) {
+      VERB1("Array of %d scalars, get it in one shoot", count);
+      if (sub_type->aligned_size[GRAS_THISARCH] >= 
+         sub_type->aligned_size[r_arch]) {
+       TRY(gras_trp_chunk_recv(sock, (char*)l_data, 
+                               sub_type->aligned_size[r_arch] * count));
+       TRY(gras_dd_convert_elm(sub_type,count,r_arch, l_data,l_data));
+      } else {
+       ptr = malloc((size_t)sub_type->aligned_size[r_arch] * count);
+       TRY(gras_trp_chunk_recv(sock, (char*)ptr, 
+                               sub_type->size[r_arch] * count));
+       TRY(gras_dd_convert_elm(sub_type,count,r_arch, ptr,l_data));
+       free(ptr);
+      }
+    } else {
+      /* not scalar content, get it recursively (may contain pointers) */
+      elm_size = sub_type->aligned_size[GRAS_THISARCH];
+      VERB2("Receive a %d-long array of %s",count, sub_type->name);
+
+      ptr = l_data;
+      for (cpt=0; cpt<count; cpt++) {
+       TRY(gras_datadesc_recv_rec(sock,state,refs, sub_type,
+                                  r_arch, NULL, 0, ptr,-1));
+       ptr += elm_size;
+      }
     }
     break;
   }
@@ -660,7 +766,7 @@ gras_error_t
 gras_datadesc_recv(gras_socket_t *sock, 
                   gras_datadesc_type_t *type, 
                   int r_arch,
-                  void **dst) {
+                  void *dst) {
 
   gras_error_t errcode;
   gras_dd_cbps_t *state = NULL; /* callback persistent state */
@@ -668,14 +774,10 @@ gras_datadesc_recv(gras_socket_t *sock,
 
   TRY(gras_dict_new(&refs));
   TRY(gras_dd_cbps_new(&state));
-  if (!dst)
-    CRITICAL0("Cannot receive data into a NULL pointer!");
-  if (*dst) 
-    VERB0("'*dst' not NULL in datadesc_recv. Data to be copied there without malloc");
 
   errcode = gras_datadesc_recv_rec(sock, state, refs, type, 
                                   r_arch, NULL, 0,
-                                  (char **) dst);
+                                  (char *) dst,-1);
 
   gras_dict_free(&refs);
   gras_dd_cbps_free(&state);