Logo AND Algorithmique Numérique Distribuée

Public GIT Repository
don't destroy detached comm from the sender side during process cleanup
[simgrid.git] / src / simix / smx_process.c
1 /* Copyright (c) 2007-2014. The SimGrid Team.
2  * All rights reserved.                                                     */
3
4 /* This program is free software; you can redistribute it and/or modify it
5  * under the terms of the license (GNU LGPL) which comes with this package. */
6
7 #include "smx_private.h"
8 #include "xbt/sysdep.h"
9 #include "xbt/log.h"
10 #include "xbt/dict.h"
11 #include "mc/mc.h"
12
13 XBT_LOG_NEW_DEFAULT_SUBCATEGORY(simix_process, simix,
14                                 "Logging specific to SIMIX (process)");
15
/** Next PID to hand out: read and incremented each time a process (maestro
 *  included) is created, and overwritten by SIMIX_process_killall() when a
 *  positive reset value is given. */
unsigned long simix_process_maxpid = 0UL;
17
18 /**
19  * \brief Returns the current agent.
20  *
21  * This functions returns the currently running SIMIX process.
22  *
23  * \return The SIMIX process
24  */
25 XBT_INLINE smx_process_t SIMIX_process_self(void)
26 {
27   smx_context_t self_context = SIMIX_context_self();
28
29   return self_context ? SIMIX_context_get_process(self_context) : NULL;
30 }
31
32 /**
33  * \brief Returns whether a process has pending asynchronous communications.
34  * \return true if there are asynchronous communications in this process
35  */
36 int SIMIX_process_has_pending_comms(smx_process_t process) {
37
38   return xbt_fifo_size(process->comms) > 0;
39 }
40
41 void SIMIX_pre_process_cleanup(smx_simcall_t simcall, smx_process_t process) {
42   SIMIX_process_cleanup(process);
43 }
44 /**
45  * \brief Moves a process to the list of processes to destroy.
46  */
47 void SIMIX_process_cleanup(smx_process_t process)
48 {
49   XBT_DEBUG("Cleanup process %s (%p), waiting action %p",
50       process->name, process, process->waiting_action);
51
52   SIMIX_process_on_exit_runall(process);
53
54   /* cancel non-blocking communications */
55   smx_action_t action;
56   while ((action = xbt_fifo_pop(process->comms))) {
57
58     /* make sure no one will finish the comm after this process is destroyed,
59      * because src_proc or dst_proc would be an invalid pointer */
60     SIMIX_comm_cancel(action);
61
62     if (action->comm.src_proc == process) {
63       XBT_DEBUG("Found an unfinished send comm %p (detached = %d), state %d, src = %p, dst = %p",
64           action, action->comm.detached, (int)action->state, action->comm.src_proc, action->comm.dst_proc);
65       action->comm.src_proc = NULL;
66
67       /* I'm not supposed to destroy a detached comm from the sender side, */
68       if (!action->comm.detached)
69         SIMIX_comm_destroy(action);
70       else
71         XBT_DEBUG("Don't destroy it since it's a detached comm");
72       
73     }
74     else if (action->comm.dst_proc == process){
75       XBT_DEBUG("Found an unfinished recv comm %p, state %d, src = %p, dst = %p",
76           action, (int)action->state, action->comm.src_proc, action->comm.dst_proc);
77       action->comm.dst_proc = NULL;
78
79       if (action->comm.detached && action->comm.refcount == 1
80           && action->comm.src_proc != NULL) {
81         /* the comm will be freed right now, remove it from the sender */
82         xbt_fifo_remove(action->comm.src_proc->comms, action);
83       }
84       SIMIX_comm_destroy(action);
85     }
86     else {
87       xbt_die("Communication action %p is in my list but I'm not the sender "
88           "or the receiver", action);
89     }
90   }
91
92   xbt_swag_remove(process, simix_global->process_list);
93   xbt_swag_remove(process, SIMIX_host_priv(process->smx_host)->process_list);
94   xbt_swag_insert(process, simix_global->process_to_destroy);
95   process->context->iwannadie = 0;
96 }
97
98 /**
99  * Garbage collection
100  *
101  * Should be called some time to time to free the memory allocated for processes
102  * that have finished (or killed).
103  */
104 void SIMIX_process_empty_trash(void)
105 {
106   smx_process_t process = NULL;
107
108   while ((process = xbt_swag_extract(simix_global->process_to_destroy))) {
109     SIMIX_context_free(process->context);
110
111     /* Free the exception allocated at creation time */
112     free(process->running_ctx);
113     xbt_dict_free(&process->properties);
114
115     xbt_fifo_free(process->comms);
116
117     xbt_dynar_free(&process->on_exit);
118
119     xbt_free(process->name);
120     xbt_free(process);
121   }
122 }
123
124 /**
125  * \brief Creates and runs the maestro process
126  */
127 void SIMIX_create_maestro_process()
128 {
129   smx_process_t maestro = NULL;
130
131   /* Create maestro process and intilialize it */
132   maestro = xbt_new0(s_smx_process_t, 1);
133   maestro->pid = simix_process_maxpid++;
134   maestro->ppid = -1;
135   maestro->name = (char *) "";
136   maestro->running_ctx = xbt_new(xbt_running_ctx_t, 1);
137   XBT_RUNNING_CTX_INITIALIZE(maestro->running_ctx);
138   maestro->context = SIMIX_context_new(NULL, 0, NULL, NULL, maestro);
139   maestro->simcall.issuer = maestro;
140   simix_global->maestro_process = maestro;
141   return;
142 }
143 /**
144  * \brief Stops a process.
145  *
146  * Stops the process, execute all the registered on_exit functions,
147  * register it to the list of the process to restart if needed
148  * and stops its context.
149  */
150 void SIMIX_process_stop(smx_process_t arg) {
151   /* execute the on_exit functions */
152   SIMIX_process_on_exit_runall(arg);
153   /* Add the process to the list of process to restart, only if
154    * the host is down
155    */
156   if (arg->auto_restart && !SIMIX_host_get_state(arg->smx_host)) {
157     SIMIX_host_add_auto_restart_process(arg->smx_host,arg->name,arg->code, arg->data,
158                                         sg_host_name(arg->smx_host),
159                                         arg->kill_time,
160                                         arg->argc,arg->argv,arg->properties,
161                                         arg->auto_restart);
162   }
163   XBT_DEBUG("Process %s (%s) is dead",arg->name,sg_host_name(arg->smx_host));
164   /* stop the context */
165   SIMIX_context_stop(arg->context);
166 }
167
168 /**
169  * \brief Same as SIMIX_process_create() but with only one argument (used by timers).
170  * This function frees the argument.
171  * \return the process created
172  */
173 smx_process_t SIMIX_process_create_from_wrapper(smx_process_arg_t args) {
174
175   smx_process_t process;
176   simix_global->create_process_function(&process,
177                                         args->name,
178                                         args->code,
179                                         args->data,
180                                         args->hostname,
181                                         args->kill_time,
182                                         args->argc,
183                                         args->argv,
184                                         args->properties,
185                                         args->auto_restart,
186                                         NULL);
187   xbt_free(args);
188   return process;
189 }
190
191
192 void SIMIX_pre_process_create(smx_simcall_t simcall,
193                           smx_process_t *process,
194                           const char *name,
195                           xbt_main_func_t code,
196                           void *data,
197                           const char *hostname,
198                           double kill_time,
199                           int argc, char **argv,
200                           xbt_dict_t properties,
201                           int auto_restart){
202   SIMIX_process_create(process, name, code, data, hostname,
203                        kill_time, argc, argv, properties, auto_restart,
204                        simcall->issuer);
205 }
206 /**
207  * \brief Internal function to create a process.
208  *
209  * This function actually creates the process.
210  * It may be called when a SIMCALL_PROCESS_CREATE simcall occurs,
211  * or directly for SIMIX internal purposes. The sure thing is that it's called from maestro context.
212  *
213  * \return the process created
214  */
215 void SIMIX_process_create(smx_process_t *process,
216                           const char *name,
217                           xbt_main_func_t code,
218                           void *data,
219                           const char *hostname,
220                           double kill_time,
221                           int argc, char **argv,
222                           xbt_dict_t properties,
223                           int auto_restart,
224                           smx_process_t parent_process)
225 {
226   *process = NULL;
227   smx_host_t host = SIMIX_host_get_by_name(hostname);
228
229   XBT_DEBUG("Start process %s on host '%s'", name, hostname);
230
231   if (!SIMIX_host_get_state(host)) {
232     int i;
233     XBT_WARN("Cannot launch process '%s' on failed host '%s'", name,
234           hostname);
235     for (i = 0; i < argc; i++)
236       xbt_free(argv[i]);
237     xbt_free(argv);
238   }
239   else {
240     *process = xbt_new0(s_smx_process_t, 1);
241
242     xbt_assert(((code != NULL) && (host != NULL)), "Invalid parameters");
243     /* Process data */
244     (*process)->pid = simix_process_maxpid++;
245     (*process)->name = xbt_strdup(name);
246     (*process)->smx_host = host;
247     (*process)->data = data;
248     (*process)->comms = xbt_fifo_new();
249     (*process)->simcall.issuer = *process;
250
251      if (parent_process) {
252        (*process)->ppid = SIMIX_process_get_PID(parent_process);
253      } else {
254        (*process)->ppid = -1;
255      }
256
257     /* Process data for auto-restart */
258     (*process)->auto_restart = auto_restart;
259     (*process)->code = code;
260     (*process)->argc = argc;
261     (*process)->argv = argv;
262     (*process)->kill_time = kill_time;
263
264
265     XBT_VERB("Create context %s", (*process)->name);
266     (*process)->context = SIMIX_context_new(code, argc, argv,
267       simix_global->cleanup_process_function, *process);
268
269     (*process)->running_ctx = xbt_new(xbt_running_ctx_t, 1);
270     XBT_RUNNING_CTX_INITIALIZE((*process)->running_ctx);
271
272     if(MC_is_active()){
273       MC_ignore_heap((*process)->running_ctx, sizeof(*(*process)->running_ctx));
274     }
275
276     /* Add properties */
277     (*process)->properties = properties;
278
279     /* Add the process to it's host process list */
280     xbt_swag_insert(*process, SIMIX_host_priv(host)->process_list);
281
282     XBT_DEBUG("Start context '%s'", (*process)->name);
283
284     /* Now insert it in the global process list and in the process to run list */
285     xbt_swag_insert(*process, simix_global->process_list);
286     XBT_DEBUG("Inserting %s(%s) in the to_run list", (*process)->name, sg_host_name(host));
287     xbt_dynar_push_as(simix_global->process_to_run, smx_process_t, *process);
288
289     if (kill_time > SIMIX_get_clock() && simix_global->kill_process_function) {
290       XBT_DEBUG("Process %s(%s) will be kill at time %f", (*process)->name,
291           sg_host_name((*process)->smx_host), kill_time);
292       SIMIX_timer_set(kill_time, simix_global->kill_process_function, *process);
293     }
294   }
295 }
296
297 /**
298  * \brief Executes the processes from simix_global->process_to_run.
299  *
300  * The processes of simix_global->process_to_run are run (in parallel if
301  * possible).  On exit, simix_global->process_to_run is empty, and
302  * simix_global->process_that_ran contains the list of processes that just ran.
303  * The two lists are swapped so, be careful when using them before and after a
304  * call to this function.
305  */
306 void SIMIX_process_runall(void)
307 {
308   SIMIX_context_runall();
309
310   xbt_dynar_t tmp = simix_global->process_that_ran;
311   simix_global->process_that_ran = simix_global->process_to_run;
312   simix_global->process_to_run = tmp;
313   xbt_dynar_reset(simix_global->process_to_run);
314 }
315
316 void SIMIX_pre_process_kill(smx_simcall_t simcall, smx_process_t process) {
317   SIMIX_process_kill(process, simcall->issuer);
318 }
319 /**
320  * \brief Internal function to kill a SIMIX process.
321  *
322  * This function may be called when a SIMCALL_PROCESS_KILL simcall occurs,
323  * or directly for SIMIX internal purposes.
324  *
325  * \param process poor victim
326  * \param issuer the process which has sent the PROCESS_KILL. Important to not schedule twice the same process.
327  */
328 void SIMIX_process_kill(smx_process_t process, smx_process_t issuer) {
329
330   XBT_DEBUG("Killing process %s on %s", process->name, sg_host_name(process->smx_host));
331
332   process->context->iwannadie = 1;
333   process->blocked = 0;
334   process->suspended = 0;
335   /* FIXME: set doexception to 0 also? */
336
337   /* destroy the blocking action if any */
338   if (process->waiting_action) {
339
340     switch (process->waiting_action->type) {
341
342     case SIMIX_ACTION_EXECUTE:
343     case SIMIX_ACTION_PARALLEL_EXECUTE:
344       SIMIX_host_execution_destroy(process->waiting_action);
345       break;
346
347     case SIMIX_ACTION_COMMUNICATE:
348       xbt_fifo_remove(process->comms, process->waiting_action);
349       SIMIX_comm_cancel(process->waiting_action);
350       SIMIX_comm_destroy(process->waiting_action);
351       break;
352
353     case SIMIX_ACTION_SLEEP:
354       SIMIX_process_sleep_destroy(process->waiting_action);
355       break;
356
357     case SIMIX_ACTION_JOIN:
358       SIMIX_process_sleep_destroy(process->waiting_action);
359       break;
360
361     case SIMIX_ACTION_SYNCHRO:
362       SIMIX_synchro_stop_waiting(process, &process->simcall);
363       SIMIX_synchro_destroy(process->waiting_action);
364       break;
365
366     case SIMIX_ACTION_IO:
367       SIMIX_io_destroy(process->waiting_action);
368       break;
369
370       /* **************************************/
371       /* TUTORIAL: New API                    */
372     case SIMIX_ACTION_NEW_API:
373       SIMIX_new_api_destroy(process->waiting_action);
374       break;
375       /* **************************************/
376
377     }
378   }
379   if(!xbt_dynar_member(simix_global->process_to_run, &(process)) && process != issuer) {
380     xbt_dynar_push_as(simix_global->process_to_run, smx_process_t, process);
381   }
382
383 }
384
385 void SIMIX_pre_process_killall(smx_simcall_t simcall, int reset_pid) {
386   SIMIX_process_killall(simcall->issuer, reset_pid);
387 }
388 /**
389  * \brief Kills all running processes.
390  * \param issuer this one will not be killed
391  */
392 void SIMIX_process_killall(smx_process_t issuer, int reset_pid)
393 {
394   smx_process_t p = NULL;
395
396   while ((p = xbt_swag_extract(simix_global->process_list))) {
397     if (p != issuer) {
398       SIMIX_process_kill(p,issuer);
399     }
400   }
401
402   if (reset_pid > 0)
403     simix_process_maxpid = reset_pid;
404
405   SIMIX_context_runall();
406
407   SIMIX_process_empty_trash();
408 }
409
410 void SIMIX_pre_process_change_host(smx_simcall_t simcall, smx_process_t process,
411                                    smx_host_t dest)
412 {
413   process->new_host = dest;
414 }
415 void SIMIX_process_change_host(smx_process_t process,
416              smx_host_t dest)
417 {
418   xbt_assert((process != NULL), "Invalid parameters");
419   xbt_swag_remove(process, SIMIX_host_priv(process->smx_host)->process_list);
420   process->smx_host = dest;
421   xbt_swag_insert(process, SIMIX_host_priv(dest)->process_list);
422 }
423
424
425 void SIMIX_pre_process_suspend(smx_simcall_t simcall, smx_process_t process)
426 {
427   smx_action_t action_suspend =
428       SIMIX_process_suspend(process, simcall->issuer);
429
430   if (process != simcall->issuer) {
431     SIMIX_simcall_answer(simcall);
432   } else {
433     xbt_fifo_push(action_suspend->simcalls, simcall);
434     process->waiting_action = action_suspend;
435     SIMIX_host_execution_suspend(process->waiting_action);
436   }
437   /* If we are suspending ourselves, then just do not finish the simcall now */
438 }
439
440 smx_action_t SIMIX_process_suspend(smx_process_t process, smx_process_t issuer)
441 {
442   xbt_assert((process != NULL), "Invalid parameters");
443
444   if (process->suspended) {
445     XBT_DEBUG("Process '%s' is already suspended", process->name);
446     return NULL;
447   }
448
449   process->suspended = 1;
450
451   /* If we are suspending another process, and it is waiting on an action,
452      suspend its action. */
453   if (process != issuer) {
454
455     if (process->waiting_action) {
456
457       switch (process->waiting_action->type) {
458
459         case SIMIX_ACTION_EXECUTE:
460         case SIMIX_ACTION_PARALLEL_EXECUTE:
461           SIMIX_host_execution_suspend(process->waiting_action);
462           break;
463
464         case SIMIX_ACTION_COMMUNICATE:
465           SIMIX_comm_suspend(process->waiting_action);
466           break;
467
468         case SIMIX_ACTION_SLEEP:
469           SIMIX_process_sleep_suspend(process->waiting_action);
470           break;
471
472         case SIMIX_ACTION_SYNCHRO:
473           /* Suspension is delayed to when the process is rescheduled. */
474           break;
475
476         default:
477           xbt_die("Internal error in SIMIX_process_suspend: unexpected action type %d",
478               (int)process->waiting_action->type);
479       }
480       return NULL;
481     } else {
482       /* Suspension is delayed to when the process is rescheduled. */
483       return NULL;
484     }
485   } else {
486     /* FIXME: computation size is zero. Is it okay that bound is zero ? */
487     return SIMIX_host_execute("suspend", process->smx_host, 0.0, 1.0, 0.0, 0);
488   }
489 }
490
491 void SIMIX_pre_process_resume(smx_simcall_t simcall, smx_process_t process){
492   SIMIX_process_resume(process, simcall->issuer);
493 }
494
495 void SIMIX_process_resume(smx_process_t process, smx_process_t issuer)
496 {
497   xbt_assert((process != NULL), "Invalid parameters");
498
499   XBT_IN("process = %p, issuer = %p", process, issuer);
500
501   if(process->context->iwannadie) {
502     XBT_VERB("Ignoring request to suspend a process that is currently dying.");
503     return;
504   }
505
506   if(!process->suspended) return;
507   process->suspended = 0;
508
509   /* If we are resuming another process, resume the action it was waiting for
510      if any. Otherwise add it to the list of process to run in the next round. */
511   if (process != issuer) {
512
513     if (process->waiting_action) {
514
515       switch (process->waiting_action->type) {
516
517         case SIMIX_ACTION_EXECUTE:
518         case SIMIX_ACTION_PARALLEL_EXECUTE:
519           SIMIX_host_execution_resume(process->waiting_action);
520           break;
521
522         case SIMIX_ACTION_COMMUNICATE:
523           SIMIX_comm_resume(process->waiting_action);
524           break;
525
526         case SIMIX_ACTION_SLEEP:
527           SIMIX_process_sleep_resume(process->waiting_action);
528           break;
529
530         case SIMIX_ACTION_SYNCHRO:
531           /* I cannot resume it now. This is delayed to when the process is rescheduled at
532            * the end of the synchro. */
533           break;
534
535         default:
536           xbt_die("Internal error in SIMIX_process_resume: unexpected action type %d",
537               (int)process->waiting_action->type);
538       }
539     }
540   } else XBT_WARN("Strange. Process %p is trying to resume himself.", issuer);
541
542   XBT_OUT();
543 }
544
545 int SIMIX_process_get_maxpid(void) {
546   return simix_process_maxpid;
547 }
548
549 int SIMIX_pre_process_count(smx_simcall_t simcall){
550   return SIMIX_process_count();
551 }
552 int SIMIX_process_count(void)
553 {
554   return xbt_swag_size(simix_global->process_list);
555 }
556
557 int SIMIX_pre_process_get_PID(smx_simcall_t simcall, smx_process_t self){
558    return SIMIX_process_get_PID(self);
559 }
560
561 int SIMIX_process_get_PID(smx_process_t self){
562   if (self == NULL)
563     return 0;
564   else
565     return self->pid;
566 }
567
568 int SIMIX_pre_process_get_PPID(smx_simcall_t simcall, smx_process_t self){
569   return SIMIX_process_get_PPID(self);
570 }
571
572 int SIMIX_process_get_PPID(smx_process_t self){
573   if (self == NULL)
574     return 0;
575   else
576     return self->ppid;
577 }
578
579 void* SIMIX_pre_process_self_get_data(smx_simcall_t simcall, smx_process_t self){
580   return SIMIX_process_self_get_data(self);
581 }
582
583 void* SIMIX_process_self_get_data(smx_process_t self)
584 {
585   xbt_assert(self == SIMIX_process_self(), "This is not the current process");
586
587   if (!self) {
588     return NULL;
589   }
590   return SIMIX_process_get_data(self);
591 }
592
593 void SIMIX_pre_process_set_data(smx_simcall_t simcall, smx_process_t process,
594                                 void *data){
595   SIMIX_process_set_data(process, data);
596 }
597 void SIMIX_process_self_set_data(smx_process_t self, void *data)
598 {
599   xbt_assert(self == SIMIX_process_self(), "This is not the current process");
600
601   SIMIX_process_set_data(self, data);
602 }
603
604 void* SIMIX_pre_process_get_data(smx_simcall_t simcall, smx_process_t process){
605   return SIMIX_process_get_data(process);
606 }
607 void* SIMIX_process_get_data(smx_process_t process)
608 {
609   return process->data;
610 }
611
612 void SIMIX_process_set_data(smx_process_t process, void *data)
613 {
614   process->data = data;
615 }
616
617 smx_host_t SIMIX_pre_process_get_host(smx_simcall_t simcall, smx_process_t process){
618   return SIMIX_process_get_host(process);
619 }
620 smx_host_t SIMIX_process_get_host(smx_process_t process)
621 {
622   return process->smx_host;
623 }
624
625 /* needs to be public and without simcall because it is called
626    by exceptions and logging events */
627 const char* SIMIX_process_self_get_name(void) {
628
629   smx_process_t process = SIMIX_process_self();
630   if (process == NULL || process == simix_global->maestro_process)
631     return "";
632
633   return SIMIX_process_get_name(process);
634 }
635
636 const char* SIMIX_pre_process_get_name(smx_simcall_t simcall, smx_process_t process) {
637   return SIMIX_process_get_name(process);
638 }
639 const char* SIMIX_process_get_name(smx_process_t process)
640 {
641   return process->name;
642 }
643
644 smx_process_t SIMIX_process_get_by_name(const char* name)
645 {
646   smx_process_t proc;
647
648   xbt_swag_foreach(proc, simix_global->process_list)
649   {
650     if(!strcmp(name, proc->name))
651       return proc;
652   }
653   return NULL;
654 }
655
656 int SIMIX_pre_process_is_suspended(smx_simcall_t simcall, smx_process_t process){
657   return SIMIX_process_is_suspended(process);
658 }
659 int SIMIX_process_is_suspended(smx_process_t process)
660 {
661   return process->suspended;
662 }
663
664 xbt_dict_t SIMIX_pre_process_get_properties(smx_simcall_t simcall, smx_process_t process){
665   return SIMIX_process_get_properties(process);
666 }
667 xbt_dict_t SIMIX_process_get_properties(smx_process_t process)
668 {
669   return process->properties;
670 }
671
672 void SIMIX_pre_process_join(smx_simcall_t simcall, smx_process_t process, double timeout)
673 {
674   smx_action_t action = SIMIX_process_join(simcall->issuer, process, timeout);
675   xbt_fifo_push(action->simcalls, simcall);
676   simcall->issuer->waiting_action = action;
677 }
678
679 static int SIMIX_process_join_finish(smx_process_exit_status_t status, smx_action_t action){
680   if (action->sleep.surf_sleep) {
681     surf_action_cancel(action->sleep.surf_sleep);
682
683     smx_simcall_t simcall;
684     while ((simcall = xbt_fifo_shift(action->simcalls))) {
685       simcall_process_sleep__set__result(simcall, SIMIX_DONE);
686       simcall->issuer->waiting_action = NULL;
687       if (simcall->issuer->suspended) {
688         XBT_DEBUG("Wait! This process is suspended and can't wake up now.");
689         simcall->issuer->suspended = 0;
690         SIMIX_pre_process_suspend(simcall, simcall->issuer);
691       } else {
692         SIMIX_simcall_answer(simcall);
693       }
694     }
695     surf_action_unref(action->sleep.surf_sleep);
696     action->sleep.surf_sleep = NULL;
697   }
698   xbt_mallocator_release(simix_global->action_mallocator, action);
699   return 0;
700 }
701
702 smx_action_t SIMIX_process_join(smx_process_t issuer, smx_process_t process, double timeout)
703 {
704   smx_action_t res = SIMIX_process_sleep(issuer, timeout);
705   res->type = SIMIX_ACTION_JOIN;
706   SIMIX_process_on_exit(process, (int_f_pvoid_pvoid_t)SIMIX_process_join_finish, res);
707   return res;
708 }
709
710 void SIMIX_pre_process_sleep(smx_simcall_t simcall, double duration)
711 {
712   if (MC_is_active()) {
713     MC_process_clock_add(simcall->issuer, duration);
714     simcall_process_sleep__set__result(simcall, SIMIX_DONE);
715     SIMIX_simcall_answer(simcall);
716     return;
717   }
718   smx_action_t action = SIMIX_process_sleep(simcall->issuer, duration);
719   xbt_fifo_push(action->simcalls, simcall);
720   simcall->issuer->waiting_action = action;
721 }
722
723 smx_action_t SIMIX_process_sleep(smx_process_t process, double duration)
724 {
725   smx_action_t action;
726   smx_host_t host = process->smx_host;
727
728   /* check if the host is active */
729   if (surf_resource_get_state(surf_workstation_resource_priv(host)) != SURF_RESOURCE_ON) {
730     THROWF(host_error, 0, "Host %s failed, you cannot call this function",
731            sg_host_name(host));
732   }
733
734   action = xbt_mallocator_get(simix_global->action_mallocator);
735   action->type = SIMIX_ACTION_SLEEP;
736   action->name = NULL;
737 #ifdef HAVE_TRACING
738   action->category = NULL;
739 #endif
740
741   action->sleep.host = host;
742   action->sleep.surf_sleep =
743       surf_workstation_sleep(host, duration);
744
745   surf_action_set_data(action->sleep.surf_sleep, action);
746   XBT_DEBUG("Create sleep action %p", action);
747
748   return action;
749 }
750
751 void SIMIX_post_process_sleep(smx_action_t action)
752 {
753   smx_simcall_t simcall;
754   e_smx_state_t state;
755   xbt_assert(action->type == SIMIX_ACTION_SLEEP || action->type == SIMIX_ACTION_JOIN);
756
757   while ((simcall = xbt_fifo_shift(action->simcalls))) {
758
759     switch(surf_action_get_state(action->sleep.surf_sleep)){
760       case SURF_ACTION_FAILED:
761         simcall->issuer->context->iwannadie = 1;
762         //SMX_EXCEPTION(simcall->issuer, host_error, 0, "Host failed");
763         state = SIMIX_SRC_HOST_FAILURE;
764         break;
765
766       case SURF_ACTION_DONE:
767         state = SIMIX_DONE;
768         break;
769
770       default:
771         THROW_IMPOSSIBLE;
772         break;
773     }
774     if (surf_resource_get_state(surf_workstation_resource_priv(simcall->issuer->smx_host)) != SURF_RESOURCE_ON) {
775       simcall->issuer->context->iwannadie = 1;
776     }
777     simcall_process_sleep__set__result(simcall, state);
778     simcall->issuer->waiting_action = NULL;
779     if (simcall->issuer->suspended) {
780       XBT_DEBUG("Wait! This process is suspended and can't wake up now.");
781       simcall->issuer->suspended = 0;
782       SIMIX_pre_process_suspend(simcall, simcall->issuer);
783     } else {
784       SIMIX_simcall_answer(simcall);
785     }
786   }
787
788   SIMIX_process_sleep_destroy(action);
789 }
790
791 void SIMIX_process_sleep_destroy(smx_action_t action)
792 {
793   XBT_DEBUG("Destroy action %p", action);
794   xbt_assert(action->type == SIMIX_ACTION_SLEEP || action->type == SIMIX_ACTION_JOIN);
795
796   if (action->sleep.surf_sleep) {
797     surf_action_unref(action->sleep.surf_sleep);
798     action->sleep.surf_sleep = NULL;
799   }
800   if (action->type == SIMIX_ACTION_SLEEP)
801     xbt_mallocator_release(simix_global->action_mallocator, action);
802 }
803
804 void SIMIX_process_sleep_suspend(smx_action_t action)
805 {
806   xbt_assert(action->type == SIMIX_ACTION_SLEEP);
807   surf_action_suspend(action->sleep.surf_sleep);
808 }
809
810 void SIMIX_process_sleep_resume(smx_action_t action)
811 {
812   XBT_DEBUG("Action state is %d on process_sleep_resume.", action->state);
813   xbt_assert(action->type == SIMIX_ACTION_SLEEP);
814   surf_action_resume(action->sleep.surf_sleep);
815 }
816
817 /**
818  * \brief Calling this function makes the process to yield.
819  *
820  * Only the current process can call this function, giving back the control to
821  * maestro.
822  *
823  * \param self the current process
824  */
825 void SIMIX_process_yield(smx_process_t self)
826 {
827   XBT_DEBUG("Yield process '%s'", self->name);
828
829   /* Go into sleep and return control to maestro */
830   SIMIX_context_suspend(self->context);
831
832   /* Ok, maestro returned control to us */
833   XBT_DEBUG("Control returned to me: '%s'", self->name);
834
835   if (self->new_host) {
836     SIMIX_process_change_host(self, self->new_host);
837     self->new_host = NULL;
838   }
839
840   if (self->context->iwannadie){
841     XBT_DEBUG("I wanna die!");
842     SIMIX_process_stop(self);
843   }
844
845   if (self->suspended) {
846     XBT_DEBUG("Hey! I'm suspended.");
847     xbt_assert(!self->doexception, "Gloups! This exception may be lost by subsequent calls.");
848     self->suspended = 0;
849     SIMIX_process_suspend(self, self);
850   }
851
852   if (self->doexception) {
853     XBT_DEBUG("Wait, maestro left me an exception");
854     self->doexception = 0;
855     SMX_THROW();
856   }
857
858 }
859
860 /* callback: context fetching */
861 xbt_running_ctx_t *SIMIX_process_get_running_context(void)
862 {
863   return SIMIX_process_self()->running_ctx;
864 }
865
866 /* callback: termination */
867 void SIMIX_process_exception_terminate(xbt_ex_t * e)
868 {
869   xbt_ex_display(e);
870   xbt_abort();
871 }
872
873 smx_context_t SIMIX_process_get_context(smx_process_t p) {
874   return p->context;
875 }
876
877 void SIMIX_process_set_context(smx_process_t p,smx_context_t c) {
878   p->context = c;
879 }
880
881 /**
882  * \brief Returns the list of processes to run.
883  */
884 xbt_dynar_t SIMIX_process_get_runnable(void)
885 {
886   return simix_global->process_to_run;
887 }
888
889 /**
890  * \brief Returns the process from PID.
891  */
892 smx_process_t SIMIX_process_from_PID(int PID)
893 {
894   smx_process_t proc;
895   xbt_swag_foreach(proc, simix_global->process_list)
896   {
897    if(proc->pid == PID)
898    return proc;
899   }
900   return NULL;
901 }
902
903 /** @brief returns a dynar containg all currently existing processes */
904 xbt_dynar_t SIMIX_processes_as_dynar(void) {
905   smx_process_t proc;
906   xbt_dynar_t res = xbt_dynar_new(sizeof(smx_process_t),NULL);
907   xbt_swag_foreach(proc, simix_global->process_list) {
908     xbt_dynar_push(res,&proc);
909   }
910   return res;
911 }
912
913
914 void SIMIX_process_on_exit_runall(smx_process_t process) {
915   s_smx_process_exit_fun_t exit_fun;
916   smx_process_exit_status_t exit_status = (process->context->iwannadie) ?
917                                          SMX_EXIT_FAILURE : SMX_EXIT_SUCCESS;
918   while (!xbt_dynar_is_empty(process->on_exit)) {
919     exit_fun = xbt_dynar_pop_as(process->on_exit,s_smx_process_exit_fun_t);
920     (exit_fun.fun)((void*)exit_status, exit_fun.arg);
921   }
922 }
923
924 void SIMIX_pre_process_on_exit(smx_simcall_t simcall, smx_process_t process,
925                                int_f_pvoid_pvoid_t fun, void *data) {
926   SIMIX_process_on_exit(process, fun, data);
927 }
928
929 void SIMIX_process_on_exit(smx_process_t process, int_f_pvoid_pvoid_t fun, void *data) {
930   xbt_assert(process, "current process not found: are you in maestro context ?");
931
932   if (!process->on_exit) {
933     process->on_exit = xbt_dynar_new(sizeof(s_smx_process_exit_fun_t), NULL);
934   }
935
936   s_smx_process_exit_fun_t exit_fun = {fun, data};
937
938   xbt_dynar_push_as(process->on_exit,s_smx_process_exit_fun_t,exit_fun);
939 }
940
941 void SIMIX_pre_process_auto_restart_set(smx_simcall_t simcall, smx_process_t process,
942                                         int auto_restart) {
943   SIMIX_process_auto_restart_set(process, auto_restart);
944 }
945 /**
946  * \brief Sets the auto-restart status of the process.
947  * If set to 1, the process will be automatically restarted when its host
948  * comes back.
949  */
950 void SIMIX_process_auto_restart_set(smx_process_t process, int auto_restart) {
951   process->auto_restart = auto_restart;
952 }
953
954 smx_process_t SIMIX_pre_process_restart(smx_simcall_t simcall, smx_process_t process) {
955   return SIMIX_process_restart(process, simcall->issuer);
956 }
957 /**
958  * \brief Restart a process.
959  * Restart a process, starting it again from the beginning.
960  */
961 smx_process_t SIMIX_process_restart(smx_process_t process, smx_process_t issuer) {
962   XBT_DEBUG("Restarting process %s on %s", process->name, sg_host_name(process->smx_host));
963   //retrieve the arguments of the old process
964   //FIXME: Factorise this with SIMIX_host_add_auto_restart_process ?
965   s_smx_process_arg_t arg;
966   arg.code = process->code;
967   arg.hostname = sg_host_name(process->smx_host);
968   arg.kill_time = process->kill_time;
969   arg.argc = process->argc;
970   arg.data = process->data;
971   int i;
972   arg.argv = xbt_new(char*,process->argc + 1);
973   for (i = 0; i < arg.argc; i++) {
974     arg.argv[i] = xbt_strdup(process->argv[i]);
975   }
976   arg.argv[process->argc] = NULL;
977   arg.properties = NULL;
978   arg.auto_restart = process->auto_restart;
979   //kill the old process
980   SIMIX_process_kill(process,issuer);
981   //start the new process
982   smx_process_t new_process;
983   if (simix_global->create_process_function) {
984     simix_global->create_process_function(&new_process,
985                                           arg.argv[0],
986                                           arg.code,
987                                           arg.data,
988                                           arg.hostname,
989                                           arg.kill_time,
990                                           arg.argc,
991                                           arg.argv,
992                                           arg.properties,
993                                           arg.auto_restart,
994                                           NULL);
995   } else {
996     simcall_process_create(&new_process,
997                            arg.argv[0],
998                            arg.code,
999                            arg.data,
1000                            arg.hostname,
1001                            arg.kill_time,
1002                            arg.argc,
1003                            arg.argv,
1004                            arg.properties,
1005                            arg.auto_restart);
1006
1007   }
1008   return new_process;
1009 }