1 /* Copyright (c) 2007-2012. The SimGrid Team.
2 * All rights reserved. */
4 /* This program is free software; you can redistribute it and/or modify it
5 * under the terms of the license (GNU LGPL) which comes with this package. */
7 #include "smx_private.h"
8 #include "xbt/sysdep.h"
13 XBT_LOG_NEW_DEFAULT_SUBCATEGORY(simix_vm, simix,
14 "Logging specific to SIMIX (hosts)");
16 static void SIMIX_execution_finish(smx_action_t action);
/* SIMIX_vm_create: allocates a zero-filled private host structure, gives it
 * an empty process list, stores it in host_lib under `name` at
 * SIMIX_HOST_LEVEL, calls the create() hook of the surf VM workstation model
 * and returns the host_lib element found for `name` (or NULL).
 * NOTE(review): this listing skips some source lines (see the embedded line
 * numbers); neither the opening brace nor a declaration of `proc` is visible.
 * NOTE(review): no visible statement uses `phys_host`, create() is called
 * without arguments, and the header text below documents a `data` parameter
 * that the signature does not have -- confirm against the real file. */
19 * \brief Internal function to create a SIMIX host.
20 * \param name name of the host to create
21 * \param data some user data (may be NULL)
23 smx_host_t SIMIX_vm_create(const char *name, smx_host_t phys_host)
26 smx_host_priv_t smx_host = xbt_new0(s_smx_host_priv_t, 1);
29 // TODO check why we do not have any VM here and why we have the host_proc_hookup ?
32 smx_host->data = NULL;
33 smx_host->process_list =
34 xbt_swag_new(xbt_swag_offset(proc, host_proc_hookup));
36 /* Update global variables */
37 xbt_lib_set(host_lib,name,SIMIX_HOST_LEVEL,smx_host);
39 /* Create surf associated resource */
40 surf_vm_workstation_model->extension.vm_workstation.create();
41 return xbt_lib_get_elm_or_null(host_lib, name);
/* SIMIX_vm_host_destroy: tears down the private host structure passed as `h`.
 * Visible steps: a call on host_lib, the destroy() hook of the surf VM
 * workstation model, a NULL check on `host`, then -- if the process list is
 * not empty -- a message listing every remaining process name is built,
 * SIMIX_display_process_status() is called and arg_error is thrown. Otherwise
 * the auto-restart dynar and the process list are freed.
 * NOTE(review): this listing skips some source lines (declarations of `msg`
 * and `tmp`, closing braces, whatever follows "Clean host structure").
 * NOTE(review): `xbt_lib_(` looks like a truncated function name, and `name`
 * and `smx_host` are not declared in any visible line -- confirm.
 * NOTE(review): the NULL assertion on `host` comes after the first uses of
 * the argument's data; it probably belongs at the top. */
45 * \brief Internal function to destroy a SIMIX host.
47 * \param h the host to destroy (a smx_host_t)
49 void SIMIX_vm_host_destroy(void *h)
51 smx_host_priv_t host = (smx_host_priv_t) h;
54 xbt_lib_(host_lib,name,SIMIX_HOST_LEVEL,smx_host);
56 /* jump to vm_ws_destroy() */
57 surf_vm_workstation_model->extension.vm_workstation.destroy(name);
59 xbt_assert((host != NULL), "Invalid parameters");
61 /* Clean Simulator data */
62 if (xbt_swag_size(host->process_list) != 0) {
64 bprintf("Shutting down host, but it's not empty:");
66 smx_process_t process = NULL;
68 xbt_swag_foreach(process, host->process_list) {
/* each pass builds a new message with this process name appended */
69 tmp = bprintf("%s\n\t%s", msg, process->name);
73 SIMIX_display_process_status();
74 THROWF(arg_error, 0, "%s", msg);
76 xbt_dynar_free(&host->auto_restart_processes);
77 xbt_swag_free(host->process_list);
79 /* Clean host structure */
85 // * \brief Returns a dict of all hosts.
87 // * \return List of all hosts (as a #xbt_dict_t)
89 //xbt_dict_t SIMIX_host_get_dict(void)
91 // xbt_dict_t host_dict = xbt_dict_new_homogeneous(NULL);
92 // xbt_lib_cursor_t cursor = NULL;
94 // void **host = NULL;
96 // xbt_lib_foreach(host_lib, cursor, name, host){
97 // if(host[SIMIX_HOST_LEVEL])
98 // xbt_dict_set(host_dict,name,host[SIMIX_HOST_LEVEL], NULL);
102 smx_host_t SIMIX_pre_vm_create(smx_simcall_t simcall, const char *name, smx_host_t phys_host){
103 return SIMIX_vm_create(name, phys_host);
106 smx_host_t SIMIX_host_get_by_name(const char *name){
107 xbt_assert(((simix_global != NULL)
108 && (host_lib != NULL)),
109 "Environment not set yet");
111 return xbt_lib_get_elm_or_null(host_lib, name);
114 smx_host_t SIMIX_host_self(void)
116 smx_process_t process = SIMIX_process_self();
117 return (process == NULL) ? NULL : SIMIX_process_get_host(process);
120 const char* SIMIX_pre_host_self_get_name(smx_simcall_t simcall){
121 return SIMIX_host_self_get_name();
/* SIMIX_host_self_get_name: returns SIMIX_host_get_name() of the current host,
 * except when there is no current host or the caller is the maestro process.
 * NOTE(review): the statement guarded by the `if` sits on a line this listing
 * skips, so the value returned in that special case is not visible here. */
123 /* needs to be public and without simcall because it is called
124 by exceptions and logging events */
125 const char* SIMIX_host_self_get_name(void)
127 smx_host_t host = SIMIX_host_self();
128 if (host == NULL || SIMIX_process_self() == simix_global->maestro_process)
131 return SIMIX_host_get_name(host);
134 const char* SIMIX_pre_host_get_name(smx_simcall_t simcall, smx_host_t host){
135 return SIMIX_host_get_name(host);
137 const char* SIMIX_host_get_name(smx_host_t host){
138 xbt_assert((host != NULL), "Invalid parameters");
140 return sg_host_name(host);
143 xbt_dict_t SIMIX_pre_host_get_properties(smx_simcall_t simcall, smx_host_t host){
144 return SIMIX_host_get_properties(host);
146 xbt_dict_t SIMIX_host_get_properties(smx_host_t host){
147 xbt_assert((host != NULL), "Invalid parameters (simix host is NULL)");
149 return surf_workstation_model->extension.workstation.get_properties(host);
152 double SIMIX_pre_host_get_speed(smx_simcall_t simcall, smx_host_t host){
153 return SIMIX_host_get_speed(host);
155 double SIMIX_host_get_speed(smx_host_t host){
156 xbt_assert((host != NULL), "Invalid parameters (simix host is NULL)");
158 return surf_workstation_model->extension.workstation.
159 get_speed(host, 1.0);
162 double SIMIX_pre_host_get_available_speed(smx_simcall_t simcall, smx_host_t host){
163 return SIMIX_host_get_available_speed(host);
165 double SIMIX_host_get_available_speed(smx_host_t host){
166 xbt_assert((host != NULL), "Invalid parameters (simix host is NULL)");
168 return surf_workstation_model->extension.workstation.
169 get_available_speed(host);
172 int SIMIX_pre_host_get_state(smx_simcall_t simcall, smx_host_t host){
173 return SIMIX_host_get_state(host);
/* SIMIX_host_get_state: asserts that `host` is non-NULL, then returns a value
 * obtained through the workstation extension of the surf workstation model.
 * NOTE(review): the return expression continues on a line this listing skips
 * (presumably the get_state(host) call) -- confirm against the real file. */
175 int SIMIX_host_get_state(smx_host_t host){
176 xbt_assert((host != NULL), "Invalid parameters (simix host is NULL)");
178 return surf_workstation_model->extension.workstation.
182 void* SIMIX_pre_host_self_get_data(smx_simcall_t simcall){
183 return SIMIX_host_self_get_data();
/**
 * \brief Returns the data attached to the host of the calling process.
 * \return SIMIX_host_get_data() applied to SIMIX_host_self()
 */
void* SIMIX_host_self_get_data(void)
{
  return SIMIX_host_get_data(SIMIX_host_self());
}
/**
 * \brief Attaches data to the host of the calling process.
 * \param data passed to SIMIX_host_set_data() together with SIMIX_host_self()
 */
void SIMIX_host_self_set_data(void *data)
{
  SIMIX_host_set_data(SIMIX_host_self(), data);
}
197 void* SIMIX_pre_host_get_data(smx_simcall_t simcall,smx_host_t host){
198 return SIMIX_host_get_data(host);
200 void* SIMIX_host_get_data(smx_host_t host){
201 xbt_assert((host != NULL), "Invalid parameters (simix host is NULL)");
203 return SIMIX_host_priv(host)->data;
/* _SIMIX_host_free_process_arg: this is the function handed to xbt_dynar_new()
 * when SIMIX_host_add_auto_restart_process() creates the auto-restart list.
 * `data` is dereferenced once to obtain the stored smx_process_arg_t.
 * NOTE(review): the statements that act on `arg` sit on lines this listing
 * skips, so what exactly gets released is not visible here. */
205 void _SIMIX_host_free_process_arg(void *);
206 void _SIMIX_host_free_process_arg(void *data)
208 smx_process_arg_t arg = *(void**)data;
/* SIMIX_host_add_auto_restart_process: records the description of a process
 * in the host's auto_restart_processes dynar, creating the dynar on first
 * use. Visible behavior: `name` and every argv entry are duplicated with
 * xbt_strdup (argv gets a trailing NULL), while `hostname` and `properties`
 * are stored as the pointers received. If the host state is SURF_RESOURCE_OFF
 * and the host is not yet in watched_hosts_lib, it is added there.
 * NOTE(review): this listing skips some source lines; the parameters `name`,
 * `kill_time`, `auto_restart` and the declaration of `i` are used below but
 * not visible in the signature/body shown here.
 * NOTE(review): `hostname` is not copied, unlike `name`; verify that callers
 * keep that string alive for as long as the entry exists. */
213 * \brief Add a process to the list of the processes that the host will restart when it comes back
214 * This function add a process to the list of the processes that will be restarted when the host comes
215 * back. It is expected that this function is called when the host is down.
216 * The processes will only be restarted once, meaning that you will have to register the process
217 * again to restart the process again.
219 void SIMIX_host_add_auto_restart_process(smx_host_t host,
221 xbt_main_func_t code,
223 const char *hostname,
225 int argc, char **argv,
226 xbt_dict_t properties,
/* create the list lazily, with the element destructor defined above */
229 if (!SIMIX_host_priv(host)->auto_restart_processes) {
230 SIMIX_host_priv(host)->auto_restart_processes = xbt_dynar_new(sizeof(smx_process_arg_t),_SIMIX_host_free_process_arg);
232 smx_process_arg_t arg = xbt_new(s_smx_process_arg_t,1);
233 arg->name = xbt_strdup(name);
236 arg->hostname = hostname;
237 arg->kill_time = kill_time;
/* one extra slot for the terminating NULL */
240 arg->argv = xbt_new(char*,argc + 1);
243 for (i = 0; i < argc; i++) {
244 arg->argv[i] = xbt_strdup(argv[i]);
246 arg->argv[argc] = NULL;
248 arg->properties = properties;
249 arg->auto_restart = auto_restart;
251 if( SIMIX_host_get_state(host) == SURF_RESOURCE_OFF
252 && !xbt_dict_get_or_null(watched_hosts_lib,sg_host_name(host))){
253 xbt_dict_set(watched_hosts_lib,sg_host_name(host),host,NULL);
254 XBT_DEBUG("Have push host %s to watched_hosts_lib because state == SURF_RESOURCE_OFF",sg_host_name(host));
256 xbt_dynar_push_as(SIMIX_host_priv(host)->auto_restart_processes,smx_process_arg_t,arg);
/* SIMIX_host_restart_processes: walks the host's auto_restart_processes dynar
 * and, for each entry, creates a process either through
 * simix_global->create_process_function (when that pointer is set) or through
 * simcall_process_create(). The dynar is reset afterwards.
 * NOTE(review): this listing skips the lines carrying the remaining call
 * arguments, the declaration of `cpt` and the branch structure between the
 * two calls (presumably an `else`) -- confirm against the real file. */
259 * \brief Restart the list of processes that have been registered to the host
261 void SIMIX_host_restart_processes(smx_host_t host)
264 smx_process_arg_t arg;
265 xbt_dynar_foreach(SIMIX_host_priv(host)->auto_restart_processes,cpt,arg) {
267 smx_process_t process;
269 XBT_DEBUG("Restarting Process %s(%s) right now", arg->argv[0], arg->hostname);
270 if (simix_global->create_process_function) {
271 simix_global->create_process_function(&process,
283 simcall_process_create(&process,
296 xbt_dynar_reset(SIMIX_host_priv(host)->auto_restart_processes);
/* SIMIX_host_autorestart: calls the simix_global->autorestart callback with
 * `host` when that callback is set; the xbt_die() below reports a missing
 * callback.
 * NOTE(review): one source line between the call and xbt_die() is skipped in
 * this listing (presumably `else`); without it xbt_die() would always run. */
299 void SIMIX_host_autorestart(smx_host_t host)
301 if(simix_global->autorestart)
302 simix_global->autorestart(host);
304 xbt_die("No function for simix_global->autorestart");
307 void SIMIX_pre_host_set_data(smx_simcall_t simcall, smx_host_t host, void *data) {
308 SIMIX_host_set_data(host, data);
310 void SIMIX_host_set_data(smx_host_t host, void *data){
311 xbt_assert((host != NULL), "Invalid parameters");
312 xbt_assert((SIMIX_host_priv(host)->data == NULL), "Data already set");
314 SIMIX_host_priv(host)->data = data;
317 smx_action_t SIMIX_pre_host_execute(smx_simcall_t simcall,const char *name,
318 smx_host_t host, double computation_amount, double priority){
319 return SIMIX_host_execute(name, host, computation_amount, priority);
/* SIMIX_host_execute: takes an action from simix_global->action_mallocator,
 * fills it in as a running SIMIX_ACTION_EXECUTE on `host` with a copy of
 * `name`, and -- unless the model checker is active -- starts the matching
 * surf execution, links it back to the action and applies `priority`.
 * NOTE(review): this listing skips some source lines: the end of the
 * execute(...) call, the closing braces and the return statement are not
 * visible, nor is anything that may surround the `category` assignment. */
321 smx_action_t SIMIX_host_execute(const char *name,
322 smx_host_t host, double computation_amount, double priority){
324 /* alloc structures and initialize */
325 smx_action_t action = xbt_mallocator_get(simix_global->action_mallocator);
326 action->type = SIMIX_ACTION_EXECUTE;
327 action->name = xbt_strdup(name);
328 action->state = SIMIX_RUNNING;
329 action->execution.host = host;
332 action->category = NULL;
335 /* set surf's action */
336 if (!MC_is_active()) {
337 action->execution.surf_exec =
338 surf_workstation_model->extension.workstation.execute(host,
340 surf_workstation_model->action_data_set(action->execution.surf_exec, action);
341 surf_workstation_model->set_priority(action->execution.surf_exec, priority);
344 XBT_DEBUG("Create execute action %p", action);
349 smx_action_t SIMIX_pre_host_parallel_execute(smx_simcall_t simcall, const char *name,
350 int host_nb, smx_host_t *host_list,
351 double *computation_amount, double *communication_amount,
352 double amount, double rate){
353 return SIMIX_host_parallel_execute(name, host_nb, host_list, computation_amount,
354 communication_amount, amount, rate);
/* SIMIX_host_parallel_execute: takes an action from
 * simix_global->action_mallocator, fills it in as a running
 * SIMIX_ACTION_PARALLEL_EXECUTE (no single host recorded), copies the host
 * list into a freshly allocated void* array and -- unless the model checker
 * is active -- hands that array to surf's execute_parallel_task() and links
 * the surf action back to this action.
 * NOTE(review): this listing skips some source lines: the declaration of `i`,
 * the closing braces and the return statement are not visible.
 * NOTE(review): `amount` is not used by any visible statement, and
 * workstation_list is allocated even when MC_is_active() skips the only
 * visible consumer -- check who owns/frees it in that case. */
356 smx_action_t SIMIX_host_parallel_execute(const char *name,
357 int host_nb, smx_host_t *host_list,
358 double *computation_amount, double *communication_amount,
359 double amount, double rate){
361 void **workstation_list = NULL;
364 /* alloc structures and initialize */
365 smx_action_t action = xbt_mallocator_get(simix_global->action_mallocator);
366 action->type = SIMIX_ACTION_PARALLEL_EXECUTE;
367 action->name = xbt_strdup(name);
368 action->state = SIMIX_RUNNING;
369 action->execution.host = NULL; /* FIXME: do we need the list of hosts? */
372 action->category = NULL;
375 /* build the array of hosts that is passed to surf */
376 workstation_list = xbt_new0(void *, host_nb);
377 for (i = 0; i < host_nb; i++)
378 workstation_list[i] = host_list[i];
380 /* set surf's action */
381 if (!MC_is_active()) {
382 action->execution.surf_exec =
383 surf_workstation_model->extension.workstation.
384 execute_parallel_task(host_nb, workstation_list, computation_amount,
385 communication_amount, rate);
387 surf_workstation_model->action_data_set(action->execution.surf_exec, action);
389 XBT_DEBUG("Create parallel execute action %p", action);
394 void SIMIX_pre_host_execution_destroy(smx_simcall_t simcall, smx_action_t action){
395 SIMIX_host_execution_destroy(action);
397 void SIMIX_host_execution_destroy(smx_action_t action){
398 XBT_DEBUG("Destroy action %p", action);
400 if (action->execution.surf_exec) {
401 surf_workstation_model->action_unref(action->execution.surf_exec);
402 action->execution.surf_exec = NULL;
404 xbt_free(action->name);
405 xbt_mallocator_release(simix_global->action_mallocator, action);
408 void SIMIX_pre_host_execution_cancel(smx_simcall_t simcall, smx_action_t action){
409 SIMIX_host_execution_cancel(action);
411 void SIMIX_host_execution_cancel(smx_action_t action){
412 XBT_DEBUG("Cancel action %p", action);
414 if (action->execution.surf_exec)
415 surf_workstation_model->action_cancel(action->execution.surf_exec);
418 double SIMIX_pre_host_execution_get_remains(smx_simcall_t simcall, smx_action_t action){
419 return SIMIX_host_execution_get_remains(action);
/* SIMIX_host_execution_get_remains: while the action is in state
 * SIMIX_RUNNING, `result` receives what the surf workstation model's
 * get_remains() reports for the underlying surf action.
 * NOTE(review): the declaration (and initial value) of `result` and the
 * return statement sit on lines this listing skips, so the value returned
 * for a non-running action is not visible here. */
421 double SIMIX_host_execution_get_remains(smx_action_t action){
424 if (action->state == SIMIX_RUNNING)
425 result = surf_workstation_model->get_remains(action->execution.surf_exec);
430 e_smx_state_t SIMIX_pre_host_execution_get_state(smx_simcall_t simcall, smx_action_t action){
431 return SIMIX_host_execution_get_state(action);
433 e_smx_state_t SIMIX_host_execution_get_state(smx_action_t action){
434 return action->state;
437 void SIMIX_pre_host_execution_set_priority(smx_simcall_t simcall, smx_action_t action,
439 return SIMIX_host_execution_set_priority(action, priority);
441 void SIMIX_host_execution_set_priority(smx_action_t action, double priority){
442 if(action->execution.surf_exec)
443 surf_workstation_model->set_priority(action->execution.surf_exec, priority);
/* SIMIX_pre_host_execution_wait: queues `simcall` on the action's simcall
 * fifo and records the action as what the issuer is waiting for. When the
 * model checker is active the action is marked SIMIX_DONE and finished right
 * away; otherwise it is finished only if it is no longer SIMIX_RUNNING.
 * NOTE(review): the lines closing the MC_is_active() branch are skipped in
 * this listing. SIMIX_execution_finish() ends by destroying the action, so
 * that branch has to leave the function (presumably a `return;`) before the
 * state test further down touches the action again -- confirm. */
446 void SIMIX_pre_host_execution_wait(smx_simcall_t simcall, smx_action_t action){
448 XBT_DEBUG("Wait for execution of action %p, state %d", action, (int)action->state);
450 /* Associate this simcall to the action */
451 xbt_fifo_push(action->simcalls, simcall);
452 simcall->issuer->waiting_action = action;
454 /* set surf's action */
455 if (MC_is_active()) {
456 action->state = SIMIX_DONE;
457 SIMIX_execution_finish(action);
461 /* If the action is already finished then perform the error handling */
462 if (action->state != SIMIX_RUNNING)
463 SIMIX_execution_finish(action);
466 void SIMIX_host_execution_suspend(smx_action_t action)
468 if(action->execution.surf_exec)
469 surf_workstation_model->suspend(action->execution.surf_exec);
472 void SIMIX_host_execution_resume(smx_action_t action)
474 if(action->execution.surf_exec)
475 surf_workstation_model->resume(action->execution.surf_exec);
/* SIMIX_execution_finish: answers every simcall queued on the action. For
 * each one it switches on the action state (success is only logged, a host
 * failure sets the issuer's iwannadie flag, a cancellation raises
 * cancel_error on the issuer, anything else is a fatal internal error), then
 * also sets iwannadie if the issuer's host is not SURF_RESOURCE_ON, clears
 * the issuer's waiting_action, stores the action state as the simcall result
 * and answers the simcall. Finally the action is destroyed.
 * NOTE(review): this listing skips the `case` labels, `break`s and closing
 * braces; the state-to-branch mapping above is inferred from the log
 * messages -- confirm against the real file. */
478 void SIMIX_execution_finish(smx_action_t action)
480 xbt_fifo_item_t item;
481 smx_simcall_t simcall;
483 xbt_fifo_foreach(action->simcalls, item, simcall, smx_simcall_t) {
485 switch (action->state) {
488 /* do nothing, action done */
489 XBT_DEBUG("SIMIX_execution_finished: execution successful");
493 XBT_DEBUG("SIMIX_execution_finished: host '%s' failed", sg_host_name(simcall->issuer->smx_host));
494 simcall->issuer->context->iwannadie = 1;
495 //SMX_EXCEPTION(simcall->issuer, host_error, 0, "Host failed");
499 XBT_DEBUG("SIMIX_execution_finished: execution canceled");
500 SMX_EXCEPTION(simcall->issuer, cancel_error, 0, "Canceled");
504 xbt_die("Internal error in SIMIX_execution_finish: unexpected action state %d",
507 /* check if the host is down */
508 if (surf_workstation_model->extension.
509 workstation.get_state(simcall->issuer->smx_host) != SURF_RESOURCE_ON) {
510 simcall->issuer->context->iwannadie = 1;
513 simcall->issuer->waiting_action = NULL;
514 simcall_host_execution_wait__set__result(simcall, action->state);
515 SIMIX_simcall_answer(simcall);
518 /* We no longer need it */
519 SIMIX_host_execution_destroy(action);
/* SIMIX_post_host_execute: derives the final state of an execution action.
 * A SIMIX_ACTION_EXECUTE whose host is SURF_RESOURCE_OFF becomes SIMIX_FAILED;
 * otherwise an action that surf reports as SURF_ACTION_FAILED becomes
 * SIMIX_CANCELED; SIMIX_DONE is assigned further down. The reference on the
 * surf action is then dropped and, if simcalls are queued on the action,
 * SIMIX_execution_finish() is called.
 * NOTE(review): this listing skips some source lines, including the end of
 * one comment and the line(s) between the CANCELED and DONE assignments
 * (presumably `} else {`) -- confirm against the real file. */
522 void SIMIX_post_host_execute(smx_action_t action)
524 if (action->type == SIMIX_ACTION_EXECUTE && /* FIXME: handle resource failure
525 * for parallel tasks too */
526 surf_workstation_model->extension.workstation.get_state(action->execution.host) == SURF_RESOURCE_OFF) {
527 /* If the host running the action failed, notice it so that the asking
528 * process can be killed if it runs on that host itself */
529 action->state = SIMIX_FAILED;
530 } else if (surf_workstation_model->action_state_get(action->execution.surf_exec) == SURF_ACTION_FAILED) {
531 /* If the host running the action didn't fail, then the action was
533 action->state = SIMIX_CANCELED;
535 action->state = SIMIX_DONE;
538 if (action->execution.surf_exec) {
539 surf_workstation_model->action_unref(action->execution.surf_exec);
540 action->execution.surf_exec = NULL;
543 /* If there are simcalls associated with the action, then answer them */
544 if (xbt_fifo_size(action->simcalls)) {
545 SIMIX_execution_finish(action);
551 void SIMIX_pre_set_category(smx_simcall_t simcall, smx_action_t action,
552 const char *category){
553 SIMIX_set_category(action, category);
555 void SIMIX_set_category(smx_action_t action, const char *category)
557 if (action->state != SIMIX_RUNNING) return;
558 if (action->type == SIMIX_ACTION_EXECUTE){
559 surf_workstation_model->set_category(action->execution.surf_exec, category);
560 }else if (action->type == SIMIX_ACTION_COMMUNICATE){
561 surf_workstation_model->set_category(action->comm.surf_comm, category);