Logo AND Algorithmique Numérique Distribuée

Public GIT Repository
30ff57c592fdc9700356fdae31e8ea845155103d
[simgrid.git] / src / simix / smx_process.c
1 /* Copyright (c) 2007-2014. The SimGrid Team.
2  * All rights reserved.                                                     */
3
4 /* This program is free software; you can redistribute it and/or modify it
5  * under the terms of the license (GNU LGPL) which comes with this package. */
6
7 #include "smx_private.h"
8 #include "xbt/sysdep.h"
9 #include "xbt/log.h"
10 #include "xbt/dict.h"
11 #include "mc/mc.h"
12
/* Default log subcategory of this file: "simix_process", child of "simix". */
XBT_LOG_NEW_DEFAULT_SUBCATEGORY(simix_process, simix,
                                "Logging specific to SIMIX (process)");

/* PID counter: each process created in this file takes the current value as
 * its PID, then the counter is incremented. */
unsigned long simix_process_maxpid = 0;
17
18 /**
19  * \brief Returns the current agent.
20  *
21  * This functions returns the currently running SIMIX process.
22  *
23  * \return The SIMIX process
24  */
25 XBT_INLINE smx_process_t SIMIX_process_self(void)
26 {
27   smx_context_t self_context = SIMIX_context_self();
28
29   return self_context ? SIMIX_context_get_process(self_context) : NULL;
30 }
31
32 /**
33  * \brief Returns whether a process has pending asynchronous communications.
34  * \return true if there are asynchronous communications in this process
35  */
36 int SIMIX_process_has_pending_comms(smx_process_t process) {
37
38   return xbt_fifo_size(process->comms) > 0;
39 }
40
41 void simcall_HANDLER_process_cleanup(smx_simcall_t simcall, smx_process_t process) {
42   SIMIX_process_cleanup(process);
43 }
44 /**
45  * \brief Moves a process to the list of processes to destroy.
46  */
47 void SIMIX_process_cleanup(smx_process_t process)
48 {
49   XBT_DEBUG("Cleanup process %s (%p), waiting action %p",
50       process->name, process, process->waiting_action);
51
52   SIMIX_process_on_exit_runall(process);
53
54   /* cancel non-blocking communications */
55   smx_action_t action;
56   while ((action = xbt_fifo_pop(process->comms))) {
57
58     /* make sure no one will finish the comm after this process is destroyed,
59      * because src_proc or dst_proc would be an invalid pointer */
60     SIMIX_comm_cancel(action);
61
62     if (action->comm.src_proc == process) {
63       XBT_DEBUG("Found an unfinished send comm %p (detached = %d), state %d, src = %p, dst = %p",
64           action, action->comm.detached, (int)action->state, action->comm.src_proc, action->comm.dst_proc);
65       action->comm.src_proc = NULL;
66
67       /* I'm not supposed to destroy a detached comm from the sender side, */
68       if (!action->comm.detached)
69         SIMIX_comm_destroy(action);
70       else
71         XBT_DEBUG("Don't destroy it since it's a detached comm");
72
73     }
74     else if (action->comm.dst_proc == process){
75       XBT_DEBUG("Found an unfinished recv comm %p, state %d, src = %p, dst = %p",
76           action, (int)action->state, action->comm.src_proc, action->comm.dst_proc);
77       action->comm.dst_proc = NULL;
78
79       if (action->comm.detached && action->comm.refcount == 1
80           && action->comm.src_proc != NULL) {
81         /* the comm will be freed right now, remove it from the sender */
82         xbt_fifo_remove(action->comm.src_proc->comms, action);
83       }
84       SIMIX_comm_destroy(action);
85     }
86     else {
87       xbt_die("Communication action %p is in my list but I'm not the sender "
88           "or the receiver", action);
89     }
90   }
91
92   xbt_swag_remove(process, simix_global->process_list);
93   xbt_swag_remove(process, SIMIX_host_priv(process->smx_host)->process_list);
94   xbt_swag_insert(process, simix_global->process_to_destroy);
95   process->context->iwannadie = 0;
96 }
97
98 /**
99  * Garbage collection
100  *
101  * Should be called some time to time to free the memory allocated for processes
102  * that have finished (or killed).
103  */
104 void SIMIX_process_empty_trash(void)
105 {
106   smx_process_t process = NULL;
107
108   while ((process = xbt_swag_extract(simix_global->process_to_destroy))) {
109     SIMIX_context_free(process->context);
110
111     /* Free the exception allocated at creation time */
112     free(process->running_ctx);
113     xbt_dict_free(&process->properties);
114
115     xbt_fifo_free(process->comms);
116
117     xbt_dynar_free(&process->on_exit);
118
119     xbt_free(process->name);
120     xbt_free(process);
121   }
122 }
123
124 /**
125  * \brief Creates and runs the maestro process
126  */
127 void SIMIX_create_maestro_process()
128 {
129   smx_process_t maestro = NULL;
130
131   /* Create maestro process and intilialize it */
132   maestro = xbt_new0(s_smx_process_t, 1);
133   maestro->pid = simix_process_maxpid++;
134   maestro->ppid = -1;
135   maestro->name = (char *) "";
136   maestro->running_ctx = xbt_new(xbt_running_ctx_t, 1);
137   XBT_RUNNING_CTX_INITIALIZE(maestro->running_ctx);
138   maestro->context = SIMIX_context_new(NULL, 0, NULL, NULL, maestro);
139   maestro->simcall.issuer = maestro;
140   simix_global->maestro_process = maestro;
141   return;
142 }
143 /**
144  * \brief Stops a process.
145  *
146  * Stops the process, execute all the registered on_exit functions,
147  * register it to the list of the process to restart if needed
148  * and stops its context.
149  */
150 void SIMIX_process_stop(smx_process_t arg) {
151   /* execute the on_exit functions */
152   SIMIX_process_on_exit_runall(arg);
153   /* Add the process to the list of process to restart, only if
154    * the host is down
155    */
156   if (arg->auto_restart && !SIMIX_host_get_state(arg->smx_host)) {
157     SIMIX_host_add_auto_restart_process(arg->smx_host,arg->name,arg->code, arg->data,
158                                         sg_host_name(arg->smx_host),
159                                         arg->kill_time,
160                                         arg->argc,arg->argv,arg->properties,
161                                         arg->auto_restart);
162   }
163   XBT_DEBUG("Process %s (%s) is dead",arg->name,sg_host_name(arg->smx_host));
164   /* stop the context */
165   SIMIX_context_stop(arg->context);
166 }
167
168 /**
169  * \brief Same as SIMIX_process_create() but with only one argument (used by timers).
170  * This function frees the argument.
171  * \return the process created
172  */
173 smx_process_t SIMIX_process_create_from_wrapper(smx_process_arg_t args) {
174
175   smx_process_t process;
176   simix_global->create_process_function(&process,
177                                         args->name,
178                                         args->code,
179                                         args->data,
180                                         args->hostname,
181                                         args->kill_time,
182                                         args->argc,
183                                         args->argv,
184                                         args->properties,
185                                         args->auto_restart,
186                                         NULL);
187   xbt_free(args);
188   return process;
189 }
190
191
192 void simcall_HANDLER_process_create(smx_simcall_t simcall,
193                           smx_process_t *process,
194                           const char *name,
195                           xbt_main_func_t code,
196                           void *data,
197                           const char *hostname,
198                           double kill_time,
199                           int argc, char **argv,
200                           xbt_dict_t properties,
201                           int auto_restart){
202   SIMIX_process_create(process, name, code, data, hostname,
203                        kill_time, argc, argv, properties, auto_restart,
204                        simcall->issuer);
205 }
206 /**
207  * \brief Internal function to create a process.
208  *
209  * This function actually creates the process.
210  * It may be called when a SIMCALL_PROCESS_CREATE simcall occurs,
211  * or directly for SIMIX internal purposes. The sure thing is that it's called from maestro context.
212  *
213  * \return the process created
214  */
215 void SIMIX_process_create(smx_process_t *process,
216                           const char *name,
217                           xbt_main_func_t code,
218                           void *data,
219                           const char *hostname,
220                           double kill_time,
221                           int argc, char **argv,
222                           xbt_dict_t properties,
223                           int auto_restart,
224                           smx_process_t parent_process)
225 {
226   *process = NULL;
227   smx_host_t host = SIMIX_host_get_by_name(hostname);
228
229   XBT_DEBUG("Start process %s on host '%s'", name, hostname);
230
231   if (!SIMIX_host_get_state(host)) {
232     int i;
233     XBT_WARN("Cannot launch process '%s' on failed host '%s'", name,
234           hostname);
235     for (i = 0; i < argc; i++)
236       xbt_free(argv[i]);
237     xbt_free(argv);
238   }
239   else {
240     *process = xbt_new0(s_smx_process_t, 1);
241
242     xbt_assert(((code != NULL) && (host != NULL)), "Invalid parameters");
243     /* Process data */
244     (*process)->pid = simix_process_maxpid++;
245     (*process)->name = xbt_strdup(name);
246     (*process)->smx_host = host;
247     (*process)->data = data;
248     (*process)->comms = xbt_fifo_new();
249     (*process)->simcall.issuer = *process;
250
251      if (parent_process) {
252        (*process)->ppid = SIMIX_process_get_PID(parent_process);
253      } else {
254        (*process)->ppid = -1;
255      }
256
257     /* Process data for auto-restart */
258     (*process)->auto_restart = auto_restart;
259     (*process)->code = code;
260     (*process)->argc = argc;
261     (*process)->argv = argv;
262     (*process)->kill_time = kill_time;
263
264
265     XBT_VERB("Create context %s", (*process)->name);
266     (*process)->context = SIMIX_context_new(code, argc, argv,
267       simix_global->cleanup_process_function, *process);
268
269     (*process)->running_ctx = xbt_new(xbt_running_ctx_t, 1);
270     XBT_RUNNING_CTX_INITIALIZE((*process)->running_ctx);
271
272     if(MC_is_active()){
273       MC_ignore_heap((*process)->running_ctx, sizeof(*(*process)->running_ctx));
274     }
275
276     /* Add properties */
277     (*process)->properties = properties;
278
279     /* Add the process to it's host process list */
280     xbt_swag_insert(*process, SIMIX_host_priv(host)->process_list);
281
282     XBT_DEBUG("Start context '%s'", (*process)->name);
283
284     /* Now insert it in the global process list and in the process to run list */
285     xbt_swag_insert(*process, simix_global->process_list);
286     XBT_DEBUG("Inserting %s(%s) in the to_run list", (*process)->name, sg_host_name(host));
287     xbt_dynar_push_as(simix_global->process_to_run, smx_process_t, *process);
288
289     if (kill_time > SIMIX_get_clock() && simix_global->kill_process_function) {
290       XBT_DEBUG("Process %s(%s) will be kill at time %f", (*process)->name,
291           sg_host_name((*process)->smx_host), kill_time);
292       SIMIX_timer_set(kill_time, simix_global->kill_process_function, *process);
293     }
294   }
295 }
296
297 /**
298  * \brief Executes the processes from simix_global->process_to_run.
299  *
300  * The processes of simix_global->process_to_run are run (in parallel if
301  * possible).  On exit, simix_global->process_to_run is empty, and
302  * simix_global->process_that_ran contains the list of processes that just ran.
303  * The two lists are swapped so, be careful when using them before and after a
304  * call to this function.
305  */
306 void SIMIX_process_runall(void)
307 {
308   SIMIX_context_runall();
309
310   xbt_dynar_t tmp = simix_global->process_that_ran;
311   simix_global->process_that_ran = simix_global->process_to_run;
312   simix_global->process_to_run = tmp;
313   xbt_dynar_reset(simix_global->process_to_run);
314 }
315
316 void simcall_HANDLER_process_kill(smx_simcall_t simcall, smx_process_t process) {
317   SIMIX_process_kill(process, simcall->issuer);
318 }
319 /**
320  * \brief Internal function to kill a SIMIX process.
321  *
322  * This function may be called when a SIMCALL_PROCESS_KILL simcall occurs,
323  * or directly for SIMIX internal purposes.
324  *
325  * \param process poor victim
326  * \param issuer the process which has sent the PROCESS_KILL. Important to not schedule twice the same process.
327  */
328 void SIMIX_process_kill(smx_process_t process, smx_process_t issuer) {
329
330   XBT_DEBUG("Killing process %s on %s", process->name, sg_host_name(process->smx_host));
331
332   process->context->iwannadie = 1;
333   process->blocked = 0;
334   process->suspended = 0;
335   process->doexception = 0;
336
337   /* destroy the blocking action if any */
338   if (process->waiting_action) {
339
340     switch (process->waiting_action->type) {
341
342     case SIMIX_ACTION_EXECUTE:
343     case SIMIX_ACTION_PARALLEL_EXECUTE:
344       SIMIX_host_execution_destroy(process->waiting_action);
345       break;
346
347     case SIMIX_ACTION_COMMUNICATE:
348       xbt_fifo_remove(process->comms, process->waiting_action);
349       SIMIX_comm_cancel(process->waiting_action);
350       SIMIX_comm_destroy(process->waiting_action);
351       break;
352
353     case SIMIX_ACTION_SLEEP:
354       SIMIX_process_sleep_destroy(process->waiting_action);
355       break;
356
357     case SIMIX_ACTION_JOIN:
358       SIMIX_process_sleep_destroy(process->waiting_action);
359       break;
360
361     case SIMIX_ACTION_SYNCHRO:
362       SIMIX_synchro_stop_waiting(process, &process->simcall);
363       SIMIX_synchro_destroy(process->waiting_action);
364       break;
365
366     case SIMIX_ACTION_IO:
367       SIMIX_io_destroy(process->waiting_action);
368       break;
369
370     }
371   }
372   if(!xbt_dynar_member(simix_global->process_to_run, &(process)) && process != issuer) {
373     xbt_dynar_push_as(simix_global->process_to_run, smx_process_t, process);
374   }
375
376 }
377
378 /** @brief Ask another process to raise the given exception
379  *
380  * @param cat category of exception
381  * @param value value associated to the exception
382  * @param msg string information associated to the exception
383  */
384 void SIMIX_process_throw(smx_process_t process, xbt_errcat_t cat, int value, const char *msg) {
385   SMX_EXCEPTION(process, cat, value, msg);
386
387   if (process->suspended)
388     SIMIX_process_resume(process,SIMIX_process_self());
389
390   /* cancel the blocking action if any */
391   if (process->waiting_action) {
392
393     switch (process->waiting_action->type) {
394
395     case SIMIX_ACTION_EXECUTE:
396     case SIMIX_ACTION_PARALLEL_EXECUTE:
397       SIMIX_host_execution_cancel(process->waiting_action);
398       break;
399
400     case SIMIX_ACTION_COMMUNICATE:
401       xbt_fifo_remove(process->comms, process->waiting_action);
402       SIMIX_comm_cancel(process->waiting_action);
403       break;
404
405     case SIMIX_ACTION_SLEEP:
406       SIMIX_process_sleep_destroy(process->waiting_action);
407       break;
408
409     case SIMIX_ACTION_JOIN:
410       SIMIX_process_sleep_destroy(process->waiting_action);
411       break;
412
413     case SIMIX_ACTION_SYNCHRO:
414       SIMIX_synchro_stop_waiting(process, &process->simcall);
415       break;
416
417     case SIMIX_ACTION_IO:
418       SIMIX_io_destroy(process->waiting_action);
419       break;
420
421     }
422   }
423   process->waiting_action = NULL;
424
425   if (!xbt_dynar_member(simix_global->process_to_run, &(process)) && process != SIMIX_process_self())
426     xbt_dynar_push_as(simix_global->process_to_run, smx_process_t, process);
427 }
428
429 void simcall_HANDLER_process_killall(smx_simcall_t simcall, int reset_pid) {
430   SIMIX_process_killall(simcall->issuer, reset_pid);
431 }
432 /**
433  * \brief Kills all running processes.
434  * \param issuer this one will not be killed
435  */
436 void SIMIX_process_killall(smx_process_t issuer, int reset_pid)
437 {
438   smx_process_t p = NULL;
439
440   while ((p = xbt_swag_extract(simix_global->process_list))) {
441     if (p != issuer) {
442       SIMIX_process_kill(p,issuer);
443     }
444   }
445
446   if (reset_pid > 0)
447     simix_process_maxpid = reset_pid;
448
449   SIMIX_context_runall();
450
451   SIMIX_process_empty_trash();
452 }
453
454 void simcall_HANDLER_process_change_host(smx_simcall_t simcall, smx_process_t process,
455                                    smx_host_t dest)
456 {
457   process->new_host = dest;
458 }
459 void SIMIX_process_change_host(smx_process_t process,
460              smx_host_t dest)
461 {
462   xbt_assert((process != NULL), "Invalid parameters");
463   xbt_swag_remove(process, SIMIX_host_priv(process->smx_host)->process_list);
464   process->smx_host = dest;
465   xbt_swag_insert(process, SIMIX_host_priv(dest)->process_list);
466 }
467
468
469 void simcall_HANDLER_process_suspend(smx_simcall_t simcall, smx_process_t process)
470 {
471   smx_action_t action_suspend =
472       SIMIX_process_suspend(process, simcall->issuer);
473
474   if (process != simcall->issuer) {
475     SIMIX_simcall_answer(simcall);
476   } else {
477     xbt_fifo_push(action_suspend->simcalls, simcall);
478     process->waiting_action = action_suspend;
479     SIMIX_host_execution_suspend(process->waiting_action);
480   }
481   /* If we are suspending ourselves, then just do not finish the simcall now */
482 }
483
484 smx_action_t SIMIX_process_suspend(smx_process_t process, smx_process_t issuer)
485 {
486   xbt_assert((process != NULL), "Invalid parameters");
487
488   if (process->suspended) {
489     XBT_DEBUG("Process '%s' is already suspended", process->name);
490     return NULL;
491   }
492
493   process->suspended = 1;
494
495   /* If we are suspending another process, and it is waiting on an action,
496      suspend its action. */
497   if (process != issuer) {
498
499     if (process->waiting_action) {
500
501       switch (process->waiting_action->type) {
502
503         case SIMIX_ACTION_EXECUTE:
504         case SIMIX_ACTION_PARALLEL_EXECUTE:
505           SIMIX_host_execution_suspend(process->waiting_action);
506           break;
507
508         case SIMIX_ACTION_COMMUNICATE:
509           SIMIX_comm_suspend(process->waiting_action);
510           break;
511
512         case SIMIX_ACTION_SLEEP:
513           SIMIX_process_sleep_suspend(process->waiting_action);
514           break;
515
516         case SIMIX_ACTION_SYNCHRO:
517           /* Suspension is delayed to when the process is rescheduled. */
518           break;
519
520         default:
521           xbt_die("Internal error in SIMIX_process_suspend: unexpected action type %d",
522               (int)process->waiting_action->type);
523       }
524       return NULL;
525     } else {
526       /* Suspension is delayed to when the process is rescheduled. */
527       return NULL;
528     }
529   } else {
530     /* FIXME: computation size is zero. Is it okay that bound is zero ? */
531     return SIMIX_host_execute("suspend", process->smx_host, 0.0, 1.0, 0.0, 0);
532   }
533 }
534
535 void simcall_HANDLER_process_resume(smx_simcall_t simcall, smx_process_t process){
536   SIMIX_process_resume(process, simcall->issuer);
537 }
538
539 void SIMIX_process_resume(smx_process_t process, smx_process_t issuer)
540 {
541   XBT_IN("process = %p, issuer = %p", process, issuer);
542
543   if(process->context->iwannadie) {
544     XBT_VERB("Ignoring request to suspend a process that is currently dying.");
545     return;
546   }
547
548   if(!process->suspended) return;
549   process->suspended = 0;
550
551   /* If we are resuming another process, resume the action it was waiting for
552      if any. Otherwise add it to the list of process to run in the next round. */
553   if (process != issuer) {
554
555     if (process->waiting_action) {
556
557       switch (process->waiting_action->type) {
558
559         case SIMIX_ACTION_EXECUTE:
560         case SIMIX_ACTION_PARALLEL_EXECUTE:
561           SIMIX_host_execution_resume(process->waiting_action);
562           break;
563
564         case SIMIX_ACTION_COMMUNICATE:
565           SIMIX_comm_resume(process->waiting_action);
566           break;
567
568         case SIMIX_ACTION_SLEEP:
569           SIMIX_process_sleep_resume(process->waiting_action);
570           break;
571
572         case SIMIX_ACTION_SYNCHRO:
573           /* I cannot resume it now. This is delayed to when the process is rescheduled at
574            * the end of the synchro. */
575           break;
576
577         default:
578           xbt_die("Internal error in SIMIX_process_resume: unexpected action type %d",
579               (int)process->waiting_action->type);
580       }
581     }
582   } else XBT_WARN("Strange. Process %p is trying to resume himself.", issuer);
583
584   XBT_OUT();
585 }
586
587 int SIMIX_process_get_maxpid(void) {
588   return simix_process_maxpid;
589 }
590
591 int simcall_HANDLER_process_count(smx_simcall_t simcall){
592   return SIMIX_process_count();
593 }
594 int SIMIX_process_count(void)
595 {
596   return xbt_swag_size(simix_global->process_list);
597 }
598
599 int simcall_HANDLER_process_get_PID(smx_simcall_t simcall, smx_process_t self){
600    return SIMIX_process_get_PID(self);
601 }
602
603 int SIMIX_process_get_PID(smx_process_t self){
604   if (self == NULL)
605     return 0;
606   else
607     return self->pid;
608 }
609
610 int simcall_HANDLER_process_get_PPID(smx_simcall_t simcall, smx_process_t self){
611   return SIMIX_process_get_PPID(self);
612 }
613
614 int SIMIX_process_get_PPID(smx_process_t self){
615   if (self == NULL)
616     return 0;
617   else
618     return self->ppid;
619 }
620
621 void* simcall_HANDLER_process_self_get_data(smx_simcall_t simcall, smx_process_t self){
622   return SIMIX_process_self_get_data(self);
623 }
624
625 void* SIMIX_process_self_get_data(smx_process_t self)
626 {
627   xbt_assert(self == SIMIX_process_self(), "This is not the current process");
628
629   if (!self) {
630     return NULL;
631   }
632   return SIMIX_process_get_data(self);
633 }
634
635 void simcall_HANDLER_process_set_data(smx_simcall_t simcall, smx_process_t process,
636                                 void *data){
637   SIMIX_process_set_data(process, data);
638 }
639 void SIMIX_process_self_set_data(smx_process_t self, void *data)
640 {
641   xbt_assert(self == SIMIX_process_self(), "This is not the current process");
642
643   SIMIX_process_set_data(self, data);
644 }
645
646 void* simcall_HANDLER_process_get_data(smx_simcall_t simcall, smx_process_t process){
647   return SIMIX_process_get_data(process);
648 }
649 void* SIMIX_process_get_data(smx_process_t process)
650 {
651   return process->data;
652 }
653
654 void SIMIX_process_set_data(smx_process_t process, void *data)
655 {
656   process->data = data;
657 }
658
659 smx_host_t simcall_HANDLER_process_get_host(smx_simcall_t simcall, smx_process_t process){
660   return SIMIX_process_get_host(process);
661 }
662 smx_host_t SIMIX_process_get_host(smx_process_t process)
663 {
664   return process->smx_host;
665 }
666
667 /* needs to be public and without simcall because it is called
668    by exceptions and logging events */
669 const char* SIMIX_process_self_get_name(void) {
670
671   smx_process_t process = SIMIX_process_self();
672   if (process == NULL || process == simix_global->maestro_process)
673     return "";
674
675   return SIMIX_process_get_name(process);
676 }
677
678 const char* simcall_HANDLER_process_get_name(smx_simcall_t simcall, smx_process_t process) {
679   return SIMIX_process_get_name(process);
680 }
681 const char* SIMIX_process_get_name(smx_process_t process)
682 {
683   return process->name;
684 }
685
686 smx_process_t SIMIX_process_get_by_name(const char* name)
687 {
688   smx_process_t proc;
689
690   xbt_swag_foreach(proc, simix_global->process_list)
691   {
692     if(!strcmp(name, proc->name))
693       return proc;
694   }
695   return NULL;
696 }
697
698 int simcall_HANDLER_process_is_suspended(smx_simcall_t simcall, smx_process_t process){
699   return SIMIX_process_is_suspended(process);
700 }
701 int SIMIX_process_is_suspended(smx_process_t process)
702 {
703   return process->suspended;
704 }
705
706 xbt_dict_t simcall_HANDLER_process_get_properties(smx_simcall_t simcall, smx_process_t process){
707   return SIMIX_process_get_properties(process);
708 }
709 xbt_dict_t SIMIX_process_get_properties(smx_process_t process)
710 {
711   return process->properties;
712 }
713
714 void simcall_HANDLER_process_join(smx_simcall_t simcall, smx_process_t process, double timeout)
715 {
716   smx_action_t action = SIMIX_process_join(simcall->issuer, process, timeout);
717   xbt_fifo_push(action->simcalls, simcall);
718   simcall->issuer->waiting_action = action;
719 }
720
721 static int SIMIX_process_join_finish(smx_process_exit_status_t status, smx_action_t action){
722   if (action->sleep.surf_sleep) {
723     surf_action_cancel(action->sleep.surf_sleep);
724
725     smx_simcall_t simcall;
726     while ((simcall = xbt_fifo_shift(action->simcalls))) {
727       simcall_process_sleep__set__result(simcall, SIMIX_DONE);
728       simcall->issuer->waiting_action = NULL;
729       if (simcall->issuer->suspended) {
730         XBT_DEBUG("Wait! This process is suspended and can't wake up now.");
731         simcall->issuer->suspended = 0;
732         simcall_HANDLER_process_suspend(simcall, simcall->issuer);
733       } else {
734         SIMIX_simcall_answer(simcall);
735       }
736     }
737     surf_action_unref(action->sleep.surf_sleep);
738     action->sleep.surf_sleep = NULL;
739   }
740   xbt_mallocator_release(simix_global->action_mallocator, action);
741   return 0;
742 }
743
744 smx_action_t SIMIX_process_join(smx_process_t issuer, smx_process_t process, double timeout)
745 {
746   smx_action_t res = SIMIX_process_sleep(issuer, timeout);
747   res->type = SIMIX_ACTION_JOIN;
748   SIMIX_process_on_exit(process, (int_f_pvoid_pvoid_t)SIMIX_process_join_finish, res);
749   return res;
750 }
751
752 void simcall_HANDLER_process_sleep(smx_simcall_t simcall, double duration)
753 {
754   if (MC_is_active()) {
755     MC_process_clock_add(simcall->issuer, duration);
756     simcall_process_sleep__set__result(simcall, SIMIX_DONE);
757     SIMIX_simcall_answer(simcall);
758     return;
759   }
760   smx_action_t action = SIMIX_process_sleep(simcall->issuer, duration);
761   xbt_fifo_push(action->simcalls, simcall);
762   simcall->issuer->waiting_action = action;
763 }
764
765 smx_action_t SIMIX_process_sleep(smx_process_t process, double duration)
766 {
767   smx_action_t action;
768   smx_host_t host = process->smx_host;
769
770   /* check if the host is active */
771   if (surf_resource_get_state(surf_workstation_resource_priv(host)) != SURF_RESOURCE_ON) {
772     THROWF(host_error, 0, "Host %s failed, you cannot call this function",
773            sg_host_name(host));
774   }
775
776   action = xbt_mallocator_get(simix_global->action_mallocator);
777   action->type = SIMIX_ACTION_SLEEP;
778   action->name = NULL;
779 #ifdef HAVE_TRACING
780   action->category = NULL;
781 #endif
782
783   action->sleep.host = host;
784   action->sleep.surf_sleep =
785       surf_workstation_sleep(host, duration);
786
787   surf_action_set_data(action->sleep.surf_sleep, action);
788   XBT_DEBUG("Create sleep action %p", action);
789
790   return action;
791 }
792
793 void SIMIX_post_process_sleep(smx_action_t action)
794 {
795   smx_simcall_t simcall;
796   e_smx_state_t state;
797   xbt_assert(action->type == SIMIX_ACTION_SLEEP || action->type == SIMIX_ACTION_JOIN);
798
799   while ((simcall = xbt_fifo_shift(action->simcalls))) {
800
801     switch(surf_action_get_state(action->sleep.surf_sleep)){
802       case SURF_ACTION_FAILED:
803         simcall->issuer->context->iwannadie = 1;
804         //SMX_EXCEPTION(simcall->issuer, host_error, 0, "Host failed");
805         state = SIMIX_SRC_HOST_FAILURE;
806         break;
807
808       case SURF_ACTION_DONE:
809         state = SIMIX_DONE;
810         break;
811
812       default:
813         THROW_IMPOSSIBLE;
814         break;
815     }
816     if (surf_resource_get_state(surf_workstation_resource_priv(simcall->issuer->smx_host)) != SURF_RESOURCE_ON) {
817       simcall->issuer->context->iwannadie = 1;
818     }
819     simcall_process_sleep__set__result(simcall, state);
820     simcall->issuer->waiting_action = NULL;
821     if (simcall->issuer->suspended) {
822       XBT_DEBUG("Wait! This process is suspended and can't wake up now.");
823       simcall->issuer->suspended = 0;
824       simcall_HANDLER_process_suspend(simcall, simcall->issuer);
825     } else {
826       SIMIX_simcall_answer(simcall);
827     }
828   }
829
830   SIMIX_process_sleep_destroy(action);
831 }
832
833 void SIMIX_process_sleep_destroy(smx_action_t action)
834 {
835   XBT_DEBUG("Destroy action %p", action);
836   xbt_assert(action->type == SIMIX_ACTION_SLEEP || action->type == SIMIX_ACTION_JOIN);
837
838   if (action->sleep.surf_sleep) {
839     surf_action_unref(action->sleep.surf_sleep);
840     action->sleep.surf_sleep = NULL;
841   }
842   if (action->type == SIMIX_ACTION_SLEEP)
843     xbt_mallocator_release(simix_global->action_mallocator, action);
844 }
845
846 void SIMIX_process_sleep_suspend(smx_action_t action)
847 {
848   xbt_assert(action->type == SIMIX_ACTION_SLEEP);
849   surf_action_suspend(action->sleep.surf_sleep);
850 }
851
852 void SIMIX_process_sleep_resume(smx_action_t action)
853 {
854   XBT_DEBUG("Action state is %d on process_sleep_resume.", action->state);
855   xbt_assert(action->type == SIMIX_ACTION_SLEEP);
856   surf_action_resume(action->sleep.surf_sleep);
857 }
858
859 /**
860  * \brief Calling this function makes the process to yield.
861  *
862  * Only the current process can call this function, giving back the control to
863  * maestro.
864  *
865  * \param self the current process
866  */
867 void SIMIX_process_yield(smx_process_t self)
868 {
869   XBT_DEBUG("Yield process '%s'", self->name);
870
871   /* Go into sleep and return control to maestro */
872   SIMIX_context_suspend(self->context);
873
874   /* Ok, maestro returned control to us */
875   XBT_DEBUG("Control returned to me: '%s'", self->name);
876
877   if (self->new_host) {
878     SIMIX_process_change_host(self, self->new_host);
879     self->new_host = NULL;
880   }
881
882   if (self->context->iwannadie){
883     XBT_DEBUG("I wanna die!");
884     SIMIX_process_stop(self);
885   }
886
887   if (self->suspended) {
888     XBT_DEBUG("Hey! I'm suspended.");
889     xbt_assert(!self->doexception, "Gasp! This exception may be lost by subsequent calls.");
890     self->suspended = 0;
891     SIMIX_process_suspend(self, self);
892   }
893
894   if (self->doexception) {
895     XBT_DEBUG("Wait, maestro left me an exception");
896     self->doexception = 0;
897     SMX_THROW();
898   }
899
900 }
901
902 /* callback: context fetching */
903 xbt_running_ctx_t *SIMIX_process_get_running_context(void)
904 {
905   return SIMIX_process_self()->running_ctx;
906 }
907
908 /* callback: termination */
909 void SIMIX_process_exception_terminate(xbt_ex_t * e)
910 {
911   xbt_ex_display(e);
912   xbt_abort();
913 }
914
915 smx_context_t SIMIX_process_get_context(smx_process_t p) {
916   return p->context;
917 }
918
919 void SIMIX_process_set_context(smx_process_t p,smx_context_t c) {
920   p->context = c;
921 }
922
923 /**
924  * \brief Returns the list of processes to run.
925  */
926 xbt_dynar_t SIMIX_process_get_runnable(void)
927 {
928   return simix_global->process_to_run;
929 }
930
931 /**
932  * \brief Returns the process from PID.
933  */
934 smx_process_t SIMIX_process_from_PID(int PID)
935 {
936   smx_process_t proc;
937   xbt_swag_foreach(proc, simix_global->process_list)
938   {
939    if(proc->pid == PID)
940    return proc;
941   }
942   return NULL;
943 }
944
945 /** @brief returns a dynar containg all currently existing processes */
946 xbt_dynar_t SIMIX_processes_as_dynar(void) {
947   smx_process_t proc;
948   xbt_dynar_t res = xbt_dynar_new(sizeof(smx_process_t),NULL);
949   xbt_swag_foreach(proc, simix_global->process_list) {
950     xbt_dynar_push(res,&proc);
951   }
952   return res;
953 }
954
955
956 void SIMIX_process_on_exit_runall(smx_process_t process) {
957   s_smx_process_exit_fun_t exit_fun;
958   smx_process_exit_status_t exit_status = (process->context->iwannadie) ?
959                                          SMX_EXIT_FAILURE : SMX_EXIT_SUCCESS;
960   while (!xbt_dynar_is_empty(process->on_exit)) {
961     exit_fun = xbt_dynar_pop_as(process->on_exit,s_smx_process_exit_fun_t);
962     (exit_fun.fun)((void*)exit_status, exit_fun.arg);
963   }
964 }
965
966 void simcall_HANDLER_process_on_exit(smx_simcall_t simcall, smx_process_t process,
967                                int_f_pvoid_pvoid_t fun, void *data) {
968   SIMIX_process_on_exit(process, fun, data);
969 }
970
971 void SIMIX_process_on_exit(smx_process_t process, int_f_pvoid_pvoid_t fun, void *data) {
972   xbt_assert(process, "current process not found: are you in maestro context ?");
973
974   if (!process->on_exit) {
975     process->on_exit = xbt_dynar_new(sizeof(s_smx_process_exit_fun_t), NULL);
976   }
977
978   s_smx_process_exit_fun_t exit_fun = {fun, data};
979
980   xbt_dynar_push_as(process->on_exit,s_smx_process_exit_fun_t,exit_fun);
981 }
982
983 void simcall_HANDLER_process_auto_restart_set(smx_simcall_t simcall, smx_process_t process,
984                                         int auto_restart) {
985   SIMIX_process_auto_restart_set(process, auto_restart);
986 }
987 /**
988  * \brief Sets the auto-restart status of the process.
989  * If set to 1, the process will be automatically restarted when its host
990  * comes back.
991  */
992 void SIMIX_process_auto_restart_set(smx_process_t process, int auto_restart) {
993   process->auto_restart = auto_restart;
994 }
995
996 smx_process_t simcall_HANDLER_process_restart(smx_simcall_t simcall, smx_process_t process) {
997   return SIMIX_process_restart(process, simcall->issuer);
998 }
999 /**
1000  * \brief Restart a process.
1001  * Restart a process, starting it again from the beginning.
1002  */
1003 smx_process_t SIMIX_process_restart(smx_process_t process, smx_process_t issuer) {
1004   XBT_DEBUG("Restarting process %s on %s", process->name, sg_host_name(process->smx_host));
1005   //retrieve the arguments of the old process
1006   //FIXME: Factorise this with SIMIX_host_add_auto_restart_process ?
1007   s_smx_process_arg_t arg;
1008   arg.code = process->code;
1009   arg.hostname = sg_host_name(process->smx_host);
1010   arg.kill_time = process->kill_time;
1011   arg.argc = process->argc;
1012   arg.data = process->data;
1013   int i;
1014   arg.argv = xbt_new(char*,process->argc + 1);
1015   for (i = 0; i < arg.argc; i++) {
1016     arg.argv[i] = xbt_strdup(process->argv[i]);
1017   }
1018   arg.argv[process->argc] = NULL;
1019   arg.properties = NULL;
1020   arg.auto_restart = process->auto_restart;
1021   //kill the old process
1022   SIMIX_process_kill(process,issuer);
1023   //start the new process
1024   smx_process_t new_process;
1025   if (simix_global->create_process_function) {
1026     simix_global->create_process_function(&new_process,
1027                                           arg.argv[0],
1028                                           arg.code,
1029                                           arg.data,
1030                                           arg.hostname,
1031                                           arg.kill_time,
1032                                           arg.argc,
1033                                           arg.argv,
1034                                           arg.properties,
1035                                           arg.auto_restart,
1036                                           NULL);
1037   } else {
1038     simcall_process_create(&new_process,
1039                            arg.argv[0],
1040                            arg.code,
1041                            arg.data,
1042                            arg.hostname,
1043                            arg.kill_time,
1044                            arg.argc,
1045                            arg.argv,
1046                            arg.properties,
1047                            arg.auto_restart);
1048
1049   }
1050   return new_process;
1051 }