Logo AND Algorithmique Numérique Distribuée

Public GIT Repository
Further investigate the dsend issue, in vain so far
[simgrid.git] / src / simix / smx_network.c
1 /* Copyright (c) 2009, 2010. The SimGrid Team.
2  * All rights reserved.                                                     */
3
4 /* This program is free software; you can redistribute it and/or modify it
5  * under the terms of the license (GNU LGPL) which comes with this package. */
6
7 #include "private.h"
8 #include "xbt/log.h"
9 #include "mc/mc.h"
10 #include "xbt/dict.h"
11
12 XBT_LOG_NEW_DEFAULT_SUBCATEGORY(simix_network, simix,
13                                 "Logging specific to SIMIX (network)");
14
15 static xbt_dict_t rdv_points = NULL;
16 unsigned long int smx_total_comms = 0;
17
18 static void SIMIX_waitany_req_remove_from_actions(smx_req_t req);
19 static void SIMIX_comm_copy_data(smx_action_t comm);
20 static smx_action_t SIMIX_comm_new(e_smx_comm_type_t type);
21 static XBT_INLINE void SIMIX_rdv_push(smx_rdv_t rdv, smx_action_t comm);
22 static XBT_INLINE void SIMIX_rdv_remove(smx_rdv_t rdv, smx_action_t comm);
23 static smx_action_t SIMIX_rdv_get_request(smx_rdv_t rdv, e_smx_comm_type_t type,
24                                           int (*match_fun)(void *, void *), void *);
25 static void SIMIX_rdv_free(void *data);
26
27 void SIMIX_network_init(void)
28 {
29   rdv_points = xbt_dict_new_homogeneous(SIMIX_rdv_free);
30 }
31
32 void SIMIX_network_exit(void)
33 {
34   xbt_dict_free(&rdv_points);
35 }
36
37 /******************************************************************************/
38 /*                           Rendez-Vous Points                               */
39 /******************************************************************************/
40
41 smx_rdv_t SIMIX_rdv_create(const char *name)
42 {
43   /* two processes may have pushed the same rdv_create request at the same time */
44   smx_rdv_t rdv = name ? xbt_dict_get_or_null(rdv_points, name) : NULL;
45
46   if (!rdv) {
47     rdv = xbt_new0(s_smx_rvpoint_t, 1);
48     rdv->name = name ? xbt_strdup(name) : NULL;
49     rdv->comm_fifo = xbt_fifo_new();
50
51     if (rdv->name)
52       xbt_dict_set(rdv_points, rdv->name, rdv, NULL);
53   }
54   return rdv;
55 }
56
57 void SIMIX_rdv_destroy(smx_rdv_t rdv)
58 {
59   if (rdv->name)
60     xbt_dict_remove(rdv_points, rdv->name);
61 }
62
63 void SIMIX_rdv_free(void *data)
64 {
65   smx_rdv_t rdv = (smx_rdv_t) data;
66   xbt_free(rdv->name);
67   xbt_fifo_free(rdv->comm_fifo);
68   xbt_free(rdv);  
69 }
70
71 smx_rdv_t SIMIX_rdv_get_by_name(const char *name)
72 {
73   return xbt_dict_get_or_null(rdv_points, name);
74 }
75
76 int SIMIX_rdv_comm_count_by_host(smx_rdv_t rdv, smx_host_t host)
77 {
78   smx_action_t comm = NULL;
79   xbt_fifo_item_t item = NULL;
80   int count = 0;
81
82   xbt_fifo_foreach(rdv->comm_fifo, item, comm, smx_action_t) {
83     if (comm->comm.src_proc->smx_host == host)
84       count++;
85   }
86
87   return count;
88 }
89
90 smx_action_t SIMIX_rdv_get_head(smx_rdv_t rdv)
91 {
92   return xbt_fifo_get_item_content(xbt_fifo_get_first_item(rdv->comm_fifo));
93 }
94
95 /**
96  *  \brief Push a communication request into a rendez-vous point
97  *  \param rdv The rendez-vous point
98  *  \param comm The communication request
99  */
100 static XBT_INLINE void SIMIX_rdv_push(smx_rdv_t rdv, smx_action_t comm)
101 {
102   xbt_fifo_push(rdv->comm_fifo, comm);
103   comm->comm.rdv = rdv;
104 }
105
106 /**
107  *  \brief Remove a communication request from a rendez-vous point
108  *  \param rdv The rendez-vous point
109  *  \param comm The communication request
110  */
111 static XBT_INLINE void SIMIX_rdv_remove(smx_rdv_t rdv, smx_action_t comm)
112 {
113   xbt_fifo_remove(rdv->comm_fifo, comm);
114   comm->comm.rdv = NULL;
115 }
116
117 /**
118  *  \brief Wrapper to SIMIX_rdv_get_request
119  */
120 smx_action_t SIMIX_comm_get_send_match(smx_rdv_t rdv, int (*match_fun)(void*, void*), void* data) {
121    return SIMIX_rdv_get_request(rdv, SIMIX_COMM_SEND, match_fun, data);
122 }
123
124 /**
125  *  \brief Checks if there is a communication action queued in a rendez-vous matching our needs
126  *  \param type The type of communication we are looking for (comm_send, comm_recv)
127  *  \return The communication action if found, NULL otherwise
128  */
129 smx_action_t SIMIX_rdv_get_request(smx_rdv_t rdv, e_smx_comm_type_t type,
130                                    int (*match_fun)(void *, void *), void *data)
131 {
132   // FIXME rewrite this function by using SIMIX_rdv_has_send/recv_match
133   smx_action_t action;
134   xbt_fifo_item_t item;
135   void* req_data = NULL;
136
137   xbt_fifo_foreach(rdv->comm_fifo, item, action, smx_action_t) {
138     if (action->comm.type == SIMIX_COMM_SEND) {
139       req_data = action->comm.src_data;
140     } else if (action->comm.type == SIMIX_COMM_RECEIVE) {
141       req_data = action->comm.dst_data;
142     }
143     if (action->comm.type == type && (!match_fun || match_fun(data, req_data))) {
144       XBT_DEBUG("Found a matching communication action %p", action);
145       xbt_fifo_remove_item(rdv->comm_fifo, item);
146       xbt_fifo_free_item(item);
147       action->comm.refcount++;
148       action->comm.rdv = NULL;
149       return action;
150     }
151     XBT_DEBUG("Sorry, communication action %p does not match our needs:"
152            " its type is %d but we are looking for a comm of type %d",
153            action, action->comm.type, type);
154   }
155   XBT_DEBUG("No matching communication action found");
156   return NULL;
157 }
158
159 /**
160  *  \brief Checks if there is a send communication action
161  *  queued in a rendez-vous matching our needs.
162  *  \return 1 if found, 0 otherwise
163  */
164 int SIMIX_comm_has_send_match(smx_rdv_t rdv, int (*match_fun)(void*, void*), void* data) {
165
166   smx_action_t action;
167   xbt_fifo_item_t item;
168
169   xbt_fifo_foreach(rdv->comm_fifo, item, action, smx_action_t){
170     if (action->comm.type == SIMIX_COMM_SEND
171         && (!match_fun || match_fun(data, action->comm.src_data))) {
172       XBT_DEBUG("Found a matching communication action %p", action);
173       return 1;
174     }
175   }
176   XBT_DEBUG("No matching communication action found");
177   return 0;
178 }
179
180 /**
181  *  \brief Checks if there is a recv communication action
182  *  queued in a rendez-vous matching our needs.
183  *  \return 1 if found, 0 otherwise
184  */
185 int SIMIX_comm_has_recv_match(smx_rdv_t rdv, int (*match_fun)(void*, void*), void* data) {
186
187   smx_action_t action;
188   xbt_fifo_item_t item;
189
190   xbt_fifo_foreach(rdv->comm_fifo, item, action, smx_action_t) {
191     if (action->comm.type == SIMIX_COMM_RECEIVE
192         && (!match_fun || match_fun(data, action->comm.dst_data))) {
193       XBT_DEBUG("Found a matching communication action %p", action);
194       return 1;
195     }
196   }
197   XBT_DEBUG("No matching communication action found");
198   return 0;
199 }
200
201 /******************************************************************************/
/*                           Communication Actions                            */
203 /******************************************************************************/
204
205 /**
206  *  \brief Creates a new comunicate action
207  *  \param type The type of request (comm_send, comm_recv)
208  *  \return The new comunicate action
209  */
210 smx_action_t SIMIX_comm_new(e_smx_comm_type_t type)
211 {
212   smx_action_t act;
213
214   /* alloc structures */
215   act = xbt_mallocator_get(simix_global->action_mallocator);
216
217   act->type = SIMIX_ACTION_COMMUNICATE;
218   act->state = SIMIX_WAITING;
219
220   /* set communication */
221   act->comm.type = type;
222   act->comm.refcount = 1;
223
224 #ifdef HAVE_LATENCY_BOUND_TRACKING
225   //initialize with unknown value
226   act->latency_limited = -1;
227 #endif
228
229 #ifdef HAVE_TRACING
230   act->category = NULL;
231 #endif
232
233   XBT_DEBUG("Create communicate action %p", act);
234   ++smx_total_comms;
235
236   return act;
237 }
238
239 /**
240  *  \brief Destroy a communicate action
241  *  \param action The communicate action to be destroyed
242  */
243 void SIMIX_comm_destroy(smx_action_t action)
244 {
245   XBT_DEBUG("Destroy action %p (refcount: %d), state: %d",
246       action, action->comm.refcount, action->state);
247
248   if (action->comm.refcount <= 0) {
249         xbt_backtrace_display_current();
250     xbt_die("the refcount of comm %p is already 0 before decreasing it. "
251             "That's a bug!", action);
252   }
253   action->comm.refcount--;
254   if (action->comm.refcount > 0)
255     return;
256   XBT_DEBUG("Really free communication %p; refcount is now %d", action,
257         action->comm.refcount);
258
259 #ifdef HAVE_LATENCY_BOUND_TRACKING
260     action->latency_limited = SIMIX_comm_is_latency_bounded( action ) ;
261 #endif
262
263   xbt_free(action->name);
264   SIMIX_comm_destroy_internal_actions(action);
265
266   if (action->comm.detached && action->state != SIMIX_DONE) {
267     /* the communication has failed and was detached:
268      * we have to free the buffer */
269     action->comm.clean_fun(action->comm.src_buff);
270     action->comm.src_buff = NULL;
271   }
272
273   xbt_mallocator_release(simix_global->action_mallocator, action);
274 }
275
276 void SIMIX_comm_destroy_internal_actions(smx_action_t action)
277 {
278   if (action->comm.surf_comm){
279 #ifdef HAVE_LATENCY_BOUND_TRACKING
280     action->latency_limited = SIMIX_comm_is_latency_bounded(action);
281 #endif
282     action->comm.surf_comm->model_type->action_unref(action->comm.surf_comm);
283     action->comm.surf_comm = NULL;
284   }
285
286   if (action->comm.src_timeout){
287     action->comm.src_timeout->model_type->action_unref(action->comm.src_timeout);
288     action->comm.src_timeout = NULL;
289   }
290
291   if (action->comm.dst_timeout){
292     action->comm.dst_timeout->model_type->action_unref(action->comm.dst_timeout);
293     action->comm.dst_timeout = NULL;
294   }
295 }
296
297 smx_action_t SIMIX_comm_isend(smx_process_t src_proc, smx_rdv_t rdv,
298                               double task_size, double rate,
299                               void *src_buff, size_t src_buff_size,
300                               int (*match_fun)(void *, void *),
301                               void (*clean_fun)(void *), // used to free the action in case of problem after a detached send
302                               void *data,
303                               int detached)
304 {
305   smx_action_t action;
306
307   /* Look for communication request matching our needs.
308      If it is not found then create it and push it into the rendez-vous point */
309   action = SIMIX_rdv_get_request(rdv, SIMIX_COMM_RECEIVE, match_fun, data);
310
311   if (!action) {
312     action = SIMIX_comm_new(SIMIX_COMM_SEND);
313     SIMIX_rdv_push(rdv, action);
314   } else {
315     action->state = SIMIX_READY;
316     action->comm.type = SIMIX_COMM_READY;
317   }
318   xbt_fifo_push(src_proc->comms, action);
319
320   /* if the communication action is detached then decrease the refcount
321    * by one, so it will be eliminated by the receiver's destroy call */
322   if (detached) {
323     action->comm.detached = 1;
324     action->comm.refcount--;
325     action->comm.clean_fun = clean_fun;
326   } else {
327     action->comm.clean_fun = NULL;
328   }
329
330   /* Setup the communication request */
331   action->comm.src_proc = src_proc;
332   action->comm.task_size = task_size;
333   action->comm.rate = rate;
334   action->comm.src_buff = src_buff;
335   action->comm.src_buff_size = src_buff_size;
336   action->comm.src_data = data;
337
338   if (MC_IS_ENABLED) {
339     action->state = SIMIX_RUNNING;
340     return action;
341   }
342
343   SIMIX_comm_start(action);
344   return (detached ? NULL : action);
345 }
346
347 smx_action_t SIMIX_comm_irecv(smx_process_t dst_proc, smx_rdv_t rdv,
348                       void *dst_buff, size_t *dst_buff_size,
349                       int (*match_fun)(void *, void *), void *data)
350 {
351   smx_action_t action;
352
353   /* Look for communication request matching our needs.
354    * If it is not found then create it and push it into the rendez-vous point
355    */
356   action = SIMIX_rdv_get_request(rdv, SIMIX_COMM_SEND, match_fun, data);
357
358   if (!action) {
359     action = SIMIX_comm_new(SIMIX_COMM_RECEIVE);
360     SIMIX_rdv_push(rdv, action);
361   } else {
362     action->state = SIMIX_READY;
363     action->comm.type = SIMIX_COMM_READY;
364   }
365   xbt_fifo_push(dst_proc->comms, action);
366
367   /* Setup communication request */
368   action->comm.dst_proc = dst_proc;
369   action->comm.dst_buff = dst_buff;
370   action->comm.dst_buff_size = dst_buff_size;
371   action->comm.dst_data = data;
372
373   if (MC_IS_ENABLED) {
374     action->state = SIMIX_RUNNING;
375     return action;
376   }
377
378   SIMIX_comm_start(action);
379   return action;
380 }
381
382 void SIMIX_pre_comm_wait(smx_req_t req, smx_action_t action, double timeout, int idx)
383 {
384
385   /* the request may be a wait, a send or a recv */
386   surf_action_t sleep;
387
388   /* Associate this request to the action */
389   xbt_fifo_push(action->request_list, req);
390   req->issuer->waiting_action = action;
391
392   if (MC_IS_ENABLED) {
393     if (idx == 0) {
394       action->state = SIMIX_DONE;
395     } else {
396       /* If we reached this point, the wait request must have a timeout */
397       /* Otherwise it shouldn't be enabled and executed by the MC */
398       if (timeout == -1)
399         THROW_IMPOSSIBLE;
400
401       if (action->comm.src_proc == req->issuer)
402         action->state = SIMIX_SRC_TIMEOUT;
403       else
404         action->state = SIMIX_DST_TIMEOUT;
405     }
406
407     SIMIX_comm_finish(action);
408     return;
409   }
410         XBT_INFO("Comm_wait. state:%d; I'm %s",action->state,
411                         req->issuer == action->comm.src_proc?"sender":"receiver");
412
413   /* If the action has already finish perform the error handling, */
414   /* otherwise set up a waiting timeout on the right side         */
415   if (action->state != SIMIX_WAITING && action->state != SIMIX_RUNNING) {
416     SIMIX_comm_finish(action);
417   } else { /* if (timeout >= 0) { we need a surf sleep action even when there is no timeout, otherwise surf won't tell us when the host fails */
418         XBT_INFO("Not done, we need a sleep action");
419     sleep = surf_workstation_model->extension.workstation.sleep(req->issuer->smx_host->host, timeout);
420     surf_workstation_model->action_data_set(sleep, action);
421
422     if (req->issuer == action->comm.src_proc)
423       action->comm.src_timeout = sleep;
424     else
425       action->comm.dst_timeout = sleep;
426   }
427 }
428
429 void SIMIX_pre_comm_test(smx_req_t req)
430 {
431   smx_action_t action = req->comm_test.comm;
432
433   if(MC_IS_ENABLED){
434     req->comm_test.result = action->comm.src_proc && action->comm.dst_proc;
435     if(req->comm_test.result){
436       action->state = SIMIX_DONE;
437       xbt_fifo_push(action->request_list, req);
438       SIMIX_comm_finish(action);
439     }else{
440       SIMIX_request_answer(req);
441     }
442     return;
443   }
444
445   req->comm_test.result = (action->state != SIMIX_WAITING && action->state != SIMIX_RUNNING);
446   if (req->comm_test.result) {
447     xbt_fifo_push(action->request_list, req);
448     SIMIX_comm_finish(action);
449   } else {
450     SIMIX_request_answer(req);
451   }
452 }
453
454 void SIMIX_pre_comm_testany(smx_req_t req, int idx)
455 {
456   unsigned int cursor;
457   smx_action_t action;
458   xbt_dynar_t actions = req->comm_testany.comms;
459   req->comm_testany.result = -1;
460
461   if (MC_IS_ENABLED){
462     if(idx == -1){
463       SIMIX_request_answer(req);
464     }else{
465       action = xbt_dynar_get_as(actions, idx, smx_action_t);
466       req->comm_testany.result = idx;
467       xbt_fifo_push(action->request_list, req);
468       action->state = SIMIX_DONE;
469       SIMIX_comm_finish(action);
470     }
471     return;
472   }
473
474   xbt_dynar_foreach(req->comm_testany.comms,cursor,action) {
475     if (action->state != SIMIX_WAITING && action->state != SIMIX_RUNNING) {
476       req->comm_testany.result = cursor;
477       xbt_fifo_push(action->request_list, req);
478       SIMIX_comm_finish(action);
479       return;
480     }
481   }
482   SIMIX_request_answer(req);
483 }
484
485 void SIMIX_pre_comm_waitany(smx_req_t req, int idx)
486 {
487   smx_action_t action;
488   unsigned int cursor = 0;
489   xbt_dynar_t actions = req->comm_waitany.comms;
490
491   if (MC_IS_ENABLED){
492     action = xbt_dynar_get_as(actions, idx, smx_action_t);
493     xbt_fifo_push(action->request_list, req);
494     req->comm_waitany.result = idx;
495     action->state = SIMIX_DONE;
496     SIMIX_comm_finish(action);
497     return;
498   }
499
500   xbt_dynar_foreach(actions, cursor, action){
501     /* Associate this request to the action */
502     xbt_fifo_push(action->request_list, req);
503     if (action->state != SIMIX_WAITING && action->state != SIMIX_RUNNING){
504       SIMIX_comm_finish(action);
505       break;
506     }
507   }
508 }
509
510 void SIMIX_waitany_req_remove_from_actions(smx_req_t req)
511 {
512   smx_action_t action;
513   unsigned int cursor = 0;
514   xbt_dynar_t actions = req->comm_waitany.comms;
515
516   xbt_dynar_foreach(actions, cursor, action){
517     xbt_fifo_remove(action->request_list, req);
518   }
519 }
520
521 /**
522  *  \brief Start the simulation of a communication request
523  *  \param action The communication action
524  */
525
526 XBT_INLINE void SIMIX_comm_start(smx_action_t action)
527 {
528   /* If both the sender and the receiver are already there, start the communication */
529   if (action->state == SIMIX_READY) {
530
531     smx_host_t sender = action->comm.src_proc->smx_host;
532     smx_host_t receiver = action->comm.dst_proc->smx_host;
533
534     XBT_DEBUG("Starting communication %p from '%s' to '%s'", action,
535            SIMIX_host_get_name(sender), SIMIX_host_get_name(receiver));
536
537     action->comm.surf_comm = surf_workstation_model->extension.workstation.
538         communicate(sender->host, receiver->host, action->comm.task_size, action->comm.rate);
539
540     surf_workstation_model->action_data_set(action->comm.surf_comm, action);
541
542     action->state = SIMIX_RUNNING;
543
544     /* If a link is failed, detect it immediately */
545     if (surf_workstation_model->action_state_get(action->comm.surf_comm) == SURF_ACTION_FAILED) {
546       XBT_DEBUG("Communication from '%s' to '%s' failed to start because of a link failure",
547           SIMIX_host_get_name(sender), SIMIX_host_get_name(receiver));
548       action->state = SIMIX_LINK_FAILURE;
549       SIMIX_comm_destroy_internal_actions(action);
550     }
551
552     /* If any of the process is suspend, create the action but stop its execution,
553        it will be restarted when the sender process resume */
554     if (SIMIX_process_is_suspended(action->comm.src_proc) ||
555         SIMIX_process_is_suspended(action->comm.dst_proc)) {
556       /* FIXME: check what should happen with the action state */
557       surf_workstation_model->suspend(action->comm.surf_comm);
558     }
559   }
560 }
561
562 /**
563  * \brief Answers the SIMIX requests associated to a communication action.
564  * \param action a finished communication action
565  */
566 void SIMIX_comm_finish(smx_action_t action)
567 {
568   volatile unsigned int destroy_count = 0;
569   smx_req_t req;
570
571   while ((req = xbt_fifo_shift(action->request_list))) {
572
573     /* If a waitany request is waiting for this action to finish, then remove
574        it from the other actions in the waitany list. Afterwards, get the
575        position of the actual action in the waitany request's actions dynar and
576        return it as the result of the call */
577     if (req->call == REQ_COMM_WAITANY) {
578       SIMIX_waitany_req_remove_from_actions(req);
579       if (!MC_IS_ENABLED)
580         req->comm_waitany.result = xbt_dynar_search(req->comm_waitany.comms, &action);
581     }
582
583     /* If the action is still in a rendez-vous point then remove from it */
584     if (action->comm.rdv)
585       SIMIX_rdv_remove(action->comm.rdv, action);
586
587     XBT_DEBUG("SIMIX_comm_finish: action state = %d", action->state);
588
589     /* Check out for errors */
590     switch (action->state) {
591
592       case SIMIX_DONE:
593         XBT_DEBUG("Communication %p complete!", action);
594         SIMIX_comm_copy_data(action);
595         break;
596
597       case SIMIX_SRC_TIMEOUT:
598         TRY {
599           THROWF(timeout_error, 0, "Communication timeouted because of sender");
600         }
601         CATCH(req->issuer->running_ctx->exception) {
602           req->issuer->doexception = 1;
603         }
604         break;
605
606       case SIMIX_DST_TIMEOUT:
607         TRY {
608           THROWF(timeout_error, 0, "Communication timeouted because of receiver");
609         }
610         CATCH(req->issuer->running_ctx->exception) {
611           req->issuer->doexception = 1;
612         }
613         break;
614
615       case SIMIX_SRC_HOST_FAILURE:
616         TRY {
617           if (req->issuer == action->comm.src_proc)
618             THROWF(host_error, 0, "Host failed");
619           else
620             THROWF(network_error, 0, "Remote peer failed");
621         }
622         CATCH(req->issuer->running_ctx->exception) {
623           req->issuer->doexception = 1;
624         }
625         break;
626
627       case SIMIX_DST_HOST_FAILURE:
628         TRY {
629           if (req->issuer == action->comm.dst_proc)
630             THROWF(host_error, 0, "Host failed");
631           else
632             THROWF(network_error, 0, "Remote peer failed");
633         }
634         CATCH(req->issuer->running_ctx->exception) {
635           req->issuer->doexception = 1;
636         }
637         break;
638
639       case SIMIX_LINK_FAILURE:
640         TRY {
641           XBT_INFO("Link failure in action %p between '%s' and '%s': posting an exception to the issuer: %s (%p) detached:%d",
642               action,
643               action->comm.src_proc ? action->comm.src_proc->smx_host->name : NULL,
644               action->comm.dst_proc ? action->comm.dst_proc->smx_host->name : NULL,
645               req->issuer->name, req->issuer,action->comm.detached);
646           if (action->comm.src_proc == req->issuer) {
647                   XBT_INFO("I'm source");
648           } else if (action->comm.dst_proc == req->issuer) {
649                   XBT_INFO("I'm dest");
650           } else {
651                   XBT_INFO("I'm neither source nor dest");
652           }
653           THROWF(network_error, 0, "Link failure");
654         }
655         CATCH(req->issuer->running_ctx->exception) {
656           req->issuer->doexception = 1;
657         }
658         break;
659
660       case SIMIX_CANCELED:
661         TRY {
662           if (req->issuer == action->comm.dst_proc) {
663             THROWF(cancel_error, 0, "Communication canceled by the sender");
664           }
665           else {
666             THROWF(cancel_error, 0, "Communication canceled by the receiver");
667           }
668         }
669         CATCH(req->issuer->running_ctx->exception) {
670           req->issuer->doexception = 1;
671         }
672         break;
673
674       default:
675         xbt_die("Unexpected action state in SIMIX_comm_finish: %d", action->state);
676     }
677
678     /* if there is an exception during a waitany or a testany, indicate the position of the failed communication */
679     if (req->issuer->doexception) {
680       if (req->call == REQ_COMM_WAITANY) {
681         req->issuer->running_ctx->exception.value = xbt_dynar_search(req->comm_waitany.comms, &action);
682       }
683       else if (req->call == REQ_COMM_TESTANY) {
684         req->issuer->running_ctx->exception.value = xbt_dynar_search(req->comm_testany.comms, &action);
685       }
686     }
687
688     req->issuer->waiting_action = NULL;
689     xbt_fifo_remove(req->issuer->comms, action);
690     SIMIX_request_answer(req);
691     destroy_count++;
692   }
693
694   while (destroy_count-- > 0)
695     SIMIX_comm_destroy(action);
696 }
697
698 /**
699  * \brief This function is called when a Surf communication action is finished.
700  * \param action the corresponding Simix communication
701  */
702 void SIMIX_post_comm(smx_action_t action)
703 {
704   /* Update action state */
705   if (action->comm.src_timeout &&
706      surf_workstation_model->action_state_get(action->comm.src_timeout) == SURF_ACTION_DONE)
707      action->state = SIMIX_SRC_TIMEOUT;
708   else if (action->comm.dst_timeout &&
709           surf_workstation_model->action_state_get(action->comm.dst_timeout) == SURF_ACTION_DONE)
710      action->state = SIMIX_DST_TIMEOUT;
711   else if (action->comm.src_timeout &&
712           surf_workstation_model->action_state_get(action->comm.src_timeout) == SURF_ACTION_FAILED)
713      action->state = SIMIX_SRC_HOST_FAILURE;
714   else if (action->comm.dst_timeout &&
715           surf_workstation_model->action_state_get(action->comm.dst_timeout) == SURF_ACTION_FAILED)
716      action->state = SIMIX_DST_HOST_FAILURE;
717   else if (action->comm.surf_comm &&
718           surf_workstation_model->action_state_get(action->comm.surf_comm) == SURF_ACTION_FAILED) {
719           XBT_INFO("Puta madre. Surf says that the link broke");
720      action->state = SIMIX_LINK_FAILURE;
721   } else
722     action->state = SIMIX_DONE;
723
724   XBT_DEBUG("SIMIX_post_comm: comm %p, state %d, src_proc %p, dst_proc %p, detached: %d",
725       action, action->state, action->comm.src_proc, action->comm.dst_proc, action->comm.detached);
726
727   /* destroy the surf actions associated with the Simix communication */
728   SIMIX_comm_destroy_internal_actions(action);
729
730   /* remove the communication action from the list of pending communications
731    * of both processes (if they still exist) */
732   if (action->comm.src_proc) {
733     xbt_fifo_remove(action->comm.src_proc->comms, action);
734   }
735   if (action->comm.dst_proc) {
736     xbt_fifo_remove(action->comm.dst_proc->comms, action);
737   }
738
739   /* if there are requests associated with the action, then answer them */
740   if (xbt_fifo_size(action->request_list)) {
741     SIMIX_comm_finish(action);
742   }
743 }
744
745 void SIMIX_comm_cancel(smx_action_t action)
746 {
747   /* if the action is a waiting state means that it is still in a rdv */
748   /* so remove from it and delete it */
749   if (action->state == SIMIX_WAITING) {
750     SIMIX_rdv_remove(action->comm.rdv, action);
751     action->state = SIMIX_CANCELED;
752   }
753   else if (!MC_IS_ENABLED /* when running the MC there are no surf actions */
754       && (action->state == SIMIX_READY || action->state == SIMIX_RUNNING)) {
755
756     surf_workstation_model->action_cancel(action->comm.surf_comm);
757   }
758 }
759
760 void SIMIX_comm_suspend(smx_action_t action)
761 {
762   /*FIXME: shall we suspend also the timeout actions? */
763   surf_workstation_model->suspend(action->comm.surf_comm);
764 }
765
766 void SIMIX_comm_resume(smx_action_t action)
767 {
768   /*FIXME: check what happen with the timeouts */
769   surf_workstation_model->resume(action->comm.surf_comm);
770 }
771
772
773 /************* Action Getters **************/
774
775 /**
776  *  \brief get the amount remaining from the communication
777  *  \param action The communication
778  */
779 double SIMIX_comm_get_remains(smx_action_t action)
780 {
781   double remains;
782
783   if(!action){
784       return 0;
785   }
786
787   switch (action->state) {
788
789     case SIMIX_RUNNING:
790       remains = surf_workstation_model->get_remains(action->comm.surf_comm);
791       break;
792
793     case SIMIX_WAITING:
794     case SIMIX_READY:
795       remains = 0; /*FIXME: check what should be returned */
796       break;
797
798     default:
799       remains = 0; /*FIXME: is this correct? */
800       break;
801   }
802   return remains;
803 }
804
805 e_smx_state_t SIMIX_comm_get_state(smx_action_t action)
806 {
807   return action->state;
808 }
809
810 /**
811  *  \brief Return the user data associated to the sender of the communication
812  *  \param action The communication
813  *  \return the user data
814  */
815 void* SIMIX_comm_get_src_data(smx_action_t action)
816 {
817   return action->comm.src_data;
818 }
819
820 /**
821  *  \brief Return the user data associated to the receiver of the communication
822  *  \param action The communication
823  *  \return the user data
824  */
825 void* SIMIX_comm_get_dst_data(smx_action_t action)
826 {
827   return action->comm.dst_data;
828 }
829
830 smx_process_t SIMIX_comm_get_src_proc(smx_action_t action)
831 {
832   return action->comm.src_proc;
833 }
834
835 smx_process_t SIMIX_comm_get_dst_proc(smx_action_t action)
836 {
837   return action->comm.dst_proc;
838 }
839
#ifdef HAVE_LATENCY_BOUND_TRACKING
/**
 *  \brief verify if communication is latency bounded
 *  \param action The communication (may be NULL)
 *  \return 0 for a NULL action; otherwise the latency_limited field of the
 *          action, refreshed from surf when the surf communication exists
 */
XBT_INLINE int SIMIX_comm_is_latency_bounded(smx_action_t action)
{
  if (!action)
    return 0;

  /* without a surf communication, report the value stored earlier */
  if (!action->comm.surf_comm)
    return action->latency_limited;

  XBT_DEBUG("Getting latency limited for surf_action (%p)", action->comm.surf_comm);
  action->latency_limited = surf_workstation_model->get_latency_limited(action->comm.surf_comm);
  XBT_DEBUG("Action limited is %d", action->latency_limited);

  return action->latency_limited;
}
#endif
858
859 /******************************************************************************/
860 /*                    SIMIX_comm_copy_data callbacks                       */
861 /******************************************************************************/
862 static void (*SIMIX_comm_copy_data_callback) (smx_action_t, size_t) =
863     &SIMIX_comm_copy_pointer_callback;
864
865 void
866 SIMIX_comm_set_copy_data_callback(void (*callback) (smx_action_t, size_t))
867 {
868   SIMIX_comm_copy_data_callback = callback;
869 }
870
871 void SIMIX_comm_copy_pointer_callback(smx_action_t comm, size_t buff_size)
872 {
873   xbt_assert((buff_size == sizeof(void *)),
874               "Cannot copy %zu bytes: must be sizeof(void*)", buff_size);
875   *(void **) (comm->comm.dst_buff) = comm->comm.src_buff;
876 }
877
878 void SIMIX_comm_copy_buffer_callback(smx_action_t comm, size_t buff_size)
879 {
880   memcpy(comm->comm.dst_buff, comm->comm.src_buff, buff_size);
881 }
882
883 void smpi_comm_copy_data_callback(smx_action_t comm, size_t buff_size)
884 {
885   XBT_INFO("Copy the data over");
886   memcpy(comm->comm.dst_buff, comm->comm.src_buff, buff_size);
887   if (comm->comm.detached) { // if this is a detached send, the source buffer was duplicated by SMPI sender to make the original buffer available to the application ASAP
888           comm->comm.clean_fun(comm->comm.src_buff);
889           comm->comm.src_buff = NULL;
890   }
891 }
892
893 /**
894  *  \brief Copy the communication data from the sender's buffer to the receiver's one
895  *  \param comm The communication
896  */
897 void SIMIX_comm_copy_data(smx_action_t comm)
898 {
899   size_t buff_size = comm->comm.src_buff_size;
900   /* If there is no data to be copy then return */
901   if (!comm->comm.src_buff || !comm->comm.dst_buff || comm->comm.copied == 1)
902     return;
903
904   XBT_DEBUG("Copying comm %p data from %s (%p) -> %s (%p) (%zu bytes)",
905          comm,
906          comm->comm.src_proc->smx_host->name, comm->comm.src_buff,
907          comm->comm.dst_proc->smx_host->name, comm->comm.dst_buff, buff_size);
908
909   /* Copy at most dst_buff_size bytes of the message to receiver's buffer */
910   if (comm->comm.dst_buff_size)
911     buff_size = MIN(buff_size, *(comm->comm.dst_buff_size));
912
913   /* Update the receiver's buffer size to the copied amount */
914   if (comm->comm.dst_buff_size)
915     *comm->comm.dst_buff_size = buff_size;
916
917   if (buff_size > 0)
918     SIMIX_comm_copy_data_callback (comm, buff_size);
919
920   /* Set the copied flag so we copy data only once */
921   /* (this function might be called from both communication ends) */
922   comm->comm.copied = 1;
923 }