1 /* Copyright (c) 2007-2012. The SimGrid Team.
2 * All rights reserved. */
4 /* This program is free software; you can redistribute it and/or modify it
5 * under the terms of the license (GNU LGPL) which comes with this package. */
7 #include "smx_private.h"
8 #include "xbt/sysdep.h"
/* Declares the default logging category of this file, "simix_host", as a
 * sub-category of "simix"; the XBT_DEBUG calls below log through it. */
13 XBT_LOG_NEW_DEFAULT_SUBCATEGORY(simix_host, simix,
14 "Logging specific to SIMIX (hosts)");
/* Forward declaration: SIMIX_execution_finish() is called by
 * SIMIX_pre_host_execution_wait() before its definition appears.
 * The `static` here gives the later definition internal linkage. */
16 static void SIMIX_execution_finish(smx_action_t action);
19 * \brief Internal function to create a SIMIX host.
20 * \param name name of the host to create
21 * \param workstation the SURF workstation to encapsulate
22 * \param data some user data (may be NULL)
/* Allocates an s_smx_host_t with xbt_new0, stores a private copy of `name`
 * (xbt_strdup) together with the caller's `data` pointer and the SURF
 * `workstation` handle, creates the host's process swag, and registers the
 * host in host_lib under its name at SIMIX_HOST_LEVEL.
 * NOTE(review): the declaration of `proc` (used only by xbt_swag_offset) and
 * the return statement are not visible in this excerpt. */
24 smx_host_t SIMIX_host_create(const char *name,
25 void *workstation, void *data)
27 smx_host_t smx_host = xbt_new0(s_smx_host_t, 1);
31 smx_host->name = xbt_strdup(name);
32 smx_host->data = data;
33 smx_host->host = workstation;
/* The swag links processes through their host_proc_hookup field. */
34 smx_host->process_list =
35 xbt_swag_new(xbt_swag_offset(proc, host_proc_hookup));
37 /* Update global variables */
38 xbt_lib_set(host_lib,smx_host->name,SIMIX_HOST_LEVEL,smx_host);
44 * \brief Internal function to destroy a SIMIX host.
46 * \param h the host to destroy (a smx_host_t)
/* Destroys a SIMIX host passed as an untyped pointer (cast to smx_host_t).
 * If the host's process list is not empty, an error message listing every
 * remaining process name is built, the process status is displayed and an
 * arg_error exception is thrown. Otherwise the auto-restart dynar and the
 * process swag are freed.
 * NOTE(review): the declarations of `msg` and `tmp`, the rest of the loop
 * body and the final clean-up of the host structure are not visible in this
 * excerpt. */
48 void SIMIX_host_destroy(void *h)
50 smx_host_t host = (smx_host_t) h;
52 xbt_assert((host != NULL), "Invalid parameters");
54 /* Clean Simulator data */
55 if (xbt_swag_size(host->process_list) != 0) {
57 bprintf("Shutting down host %s, but it's not empty:", host->name);
59 smx_process_t process = NULL;
/* Append one "\n\t<process name>" entry per process still attached. */
61 xbt_swag_foreach(process, host->process_list) {
62 tmp = bprintf("%s\n\t%s", msg, process->name);
66 SIMIX_display_process_status();
67 THROWF(arg_error, 0, "%s", msg);
/* NOTE(review): auto_restart_processes is only allocated on the first call
 * to SIMIX_host_add_auto_restart_process(); this assumes xbt_dynar_free()
 * accepts a pointer to a NULL dynar -- confirm. */
69 xbt_dynar_free(&host->auto_restart_processes);
70 xbt_swag_free(host->process_list);
72 /* Clean host structure */
80 * \brief Returns a dict of all hosts.
82 * \return List of all hosts (as a #xbt_dict_t)
/* Builds a new dict from host_lib: every entry whose SIMIX_HOST_LEVEL slot
 * is non-NULL is inserted under the entry's name.
 * NOTE(review): the NULL passed to xbt_dict_new_homogeneous() and as last
 * argument of xbt_dict_set() is presumably the free function, i.e. the dict
 * would not own the hosts -- confirm against the xbt_dict API.
 * The declarations of `name` and `host` and the return statement are not
 * visible in this excerpt. */
84 xbt_dict_t SIMIX_host_get_dict(void)
86 xbt_dict_t host_dict = xbt_dict_new_homogeneous(NULL);
87 xbt_lib_cursor_t cursor = NULL;
91 xbt_lib_foreach(host_lib, cursor, name, host){
/* `host` is indexed per level; skip entries without a SIMIX-level object. */
92 if(host[SIMIX_HOST_LEVEL])
93 xbt_dict_set(host_dict,name,host[SIMIX_HOST_LEVEL], NULL);
98 smx_host_t SIMIX_host_get_by_name(const char *name)
100 xbt_assert(((simix_global != NULL)
101 && (host_lib != NULL)),
102 "Environment not set yet");
104 return xbt_lib_get_or_null(host_lib, name, SIMIX_HOST_LEVEL);
107 smx_host_t SIMIX_host_self(void)
109 smx_process_t process = SIMIX_process_self();
110 return (process == NULL) ? NULL : SIMIX_process_get_host(process);
113 /* needs to be public and without simcall because it is called
114 by exceptions and logging events */
/* Returns the name of the calling process's host via SIMIX_host_get_name().
 * A separate branch handles the cases where there is no current host or the
 * caller is the maestro process.
 * NOTE(review): the statement executed by that branch is not visible in
 * this excerpt. */
115 const char* SIMIX_host_self_get_name(void)
117 smx_host_t host = SIMIX_host_self();
118 if (host == NULL || SIMIX_process_self() == simix_global->maestro_process)
121 return SIMIX_host_get_name(host);
/* Accessor for a host's name; asserts that `host` is not NULL.
 * NOTE(review): the return statement is not visible in this excerpt. */
124 const char* SIMIX_host_get_name(smx_host_t host)
126 xbt_assert((host != NULL), "Invalid parameters");
131 xbt_dict_t SIMIX_host_get_properties(smx_host_t host)
133 xbt_assert((host != NULL), "Invalid parameters (simix host is NULL)");
135 return surf_workstation_model->extension.workstation.get_properties(host->host);
138 double SIMIX_host_get_speed(smx_host_t host)
140 xbt_assert((host != NULL), "Invalid parameters (simix host is NULL)");
142 return surf_workstation_model->extension.workstation.
143 get_speed(host->host, 1.0);
146 double SIMIX_host_get_available_speed(smx_host_t host)
148 xbt_assert((host != NULL), "Invalid parameters (simix host is NULL)");
150 return surf_workstation_model->extension.workstation.
151 get_available_speed(host->host);
154 int SIMIX_host_get_state(smx_host_t host)
156 xbt_assert((host != NULL), "Invalid parameters (simix host is NULL)");
158 return surf_workstation_model->extension.workstation.
159 get_state(host->host);
162 void* SIMIX_host_self_get_data(void)
164 return SIMIX_host_get_data(SIMIX_host_self());
167 void SIMIX_host_self_set_data(void *data)
169 SIMIX_host_set_data(SIMIX_host_self(), data);
/* Accessor for a host's user data; asserts that `host` is not NULL.
 * NOTE(review): the return statement is not visible in this excerpt. */
172 void* SIMIX_host_get_data(smx_host_t host)
174 xbt_assert((host != NULL), "Invalid parameters (simix host is NULL)");
/* Element destructor registered with the auto_restart_processes dynar in
 * SIMIX_host_add_auto_restart_process(). `data` is dereferenced once to
 * obtain the stored smx_process_arg_t, whose argv strings are then freed.
 * NOTE(review): the declaration of `i` and any further frees (name, argv
 * array, the argument structure itself) are not visible in this excerpt.
 * NOTE(review): identifiers starting with an underscore followed by an
 * uppercase letter are reserved for the implementation in C; a rename would
 * have to cover every user of this symbol. */
178 void _SIMIX_host_free_process_arg(void *);
179 void _SIMIX_host_free_process_arg(void *data)
181 smx_process_arg_t arg = *(void**)data;
184 for (i = 0; i < arg->argc; i++) {
185 xbt_free(arg->argv[i]);
191 * \brief Add a process to the list of the processes that the host will restart when it comes back
192 * This function adds a process to the list of the processes that will be restarted when the host comes
193 * back. It is expected that this function is called when the host is down.
194 * The processes will only be restarted once, meaning that you will have to register the process
195 * again to restart the process again.
/* Records the description of a process in host->auto_restart_processes so
 * that SIMIX_host_restart_processes() can re-create it later.
 * The process name and every argv string are duplicated with xbt_strdup;
 * `hostname` and `properties` are stored as the caller's pointers.
 * NOTE(review): those two borrowed pointers must therefore stay valid until
 * the entry is consumed or freed -- confirm with the callers.
 * NOTE(review): several parameter lines and statements (including the
 * declaration of `i`) are not visible in this excerpt. */
197 void SIMIX_host_add_auto_restart_process(smx_host_t host,
199 xbt_main_func_t code,
201 const char *hostname,
203 int argc, char **argv,
204 xbt_dict_t properties,
/* The dynar is created lazily on first registration; it stores
 * smx_process_arg_t elements and frees them with
 * _SIMIX_host_free_process_arg. */
207 if (!host->auto_restart_processes) {
208 host->auto_restart_processes = xbt_dynar_new(sizeof(smx_process_arg_t),_SIMIX_host_free_process_arg);
210 smx_process_arg_t arg = xbt_new(s_smx_process_arg_t,1);
212 arg->name = xbt_strdup(name);
215 arg->hostname = hostname;
216 arg->kill_time = kill_time;
/* One slot more than argc is allocated; only the first argc slots are
 * filled by the loop below. */
218 arg->argv = xbt_new(char*,argc + 1);
221 for (i = 0; i < argc; i++) {
222 arg->argv[i] = xbt_strdup(argv[i]);
225 arg->properties = properties;
226 arg->auto_restart = auto_restart;
/* A host that is currently OFF and not yet present in watched_hosts_lib is
 * added to it under its name. */
228 if( SIMIX_host_get_state(host) == SURF_RESOURCE_OFF
229 && !xbt_dict_get_or_null(watched_hosts_lib,host->name)){
230 xbt_dict_set(watched_hosts_lib,host->name,host,NULL);
231 XBT_DEBUG("Have push host %s to watched_hosts_lib because state == SURF_RESOURCE_OFF",host->name);
233 xbt_dynar_push_as(host->auto_restart_processes,smx_process_arg_t,arg);
236 * \brief Restart the list of processes that have been registered to the host
/* Walks host->auto_restart_processes and re-creates each registered process,
 * through simix_global->create_process_function when one is installed;
 * simcall_process_create() is the other creation call (presumably the
 * fallback branch). The dynar is emptied afterwards.
 * NOTE(review): the argument lists of both creation calls, the `else`
 * between them and the declaration of `cpt` are not visible in this excerpt.
 * NOTE(review): auto_restart_processes is only allocated by
 * SIMIX_host_add_auto_restart_process(); for a host that never registered a
 * process it is presumably still NULL, yet xbt_dynar_reset() is called
 * unconditionally -- confirm it tolerates NULL, or return early. */
238 void SIMIX_host_restart_processes(smx_host_t host)
241 smx_process_arg_t arg;
242 xbt_dynar_foreach(host->auto_restart_processes,cpt,arg) {
244 smx_process_t process;
/* The message reads argv[0] and the hostname pointer stored at registration. */
246 XBT_DEBUG("Restarting Process %s(%s) right now", arg->argv[0], arg->hostname);
247 if (simix_global->create_process_function) {
248 simix_global->create_process_function(&process,
260 simcall_process_create(&process,
273 xbt_dynar_reset(host->auto_restart_processes);
276 void SIMIX_host_autorestart(smx_host_t host)
278 if(simix_global->autorestart)
279 simix_global->autorestart(host);
281 xbt_die("No function for simix_global->autorestart");
/* Attaches user data to a host. Asserts that `host` is not NULL and that no
 * data is attached yet (host->data must still be NULL).
 * NOTE(review): the assignment itself is not visible in this excerpt. */
284 void SIMIX_host_set_data(smx_host_t host, void *data)
286 xbt_assert((host != NULL), "Invalid parameters");
287 xbt_assert((host->data == NULL), "Data already set");
/* Creates an execution action on `host`: an action is taken from the action
 * mallocator, typed SIMIX_ACTION_EXECUTE, given a copy of `name` and put in
 * state SIMIX_RUNNING. Unless the model checker is enabled, the matching
 * SURF execution is created, the SIMIX action is attached to it as its data
 * and its priority is set.
 * NOTE(review): the remaining parameters, the arguments of execute() after
 * host->host and the return statement are not visible in this excerpt.
 * NOTE(review): when MC_IS_ENABLED, surf_exec is not assigned here; the
 * accessors that test it for NULL presumably rely on the mallocator handing
 * out actions with surf_exec cleared -- confirm. */
292 smx_action_t SIMIX_host_execute(const char *name, smx_host_t host,
293 double computation_amount,
296 /* alloc structures and initialize */
297 smx_action_t action = xbt_mallocator_get(simix_global->action_mallocator);
298 action->type = SIMIX_ACTION_EXECUTE;
299 action->name = xbt_strdup(name);
300 action->state = SIMIX_RUNNING;
301 action->execution.host = host;
304 action->category = NULL;
307 /* set surf's action */
308 if (!MC_IS_ENABLED) {
309 action->execution.surf_exec =
310 surf_workstation_model->extension.workstation.execute(host->host,
312 surf_workstation_model->action_data_set(action->execution.surf_exec, action);
313 surf_workstation_model->set_priority(action->execution.surf_exec, priority);
316 XBT_DEBUG("Create execute action %p", action);
/* Creates a parallel execution action spanning `host_nb` hosts: an action is
 * taken from the action mallocator, typed SIMIX_ACTION_PARALLEL_EXECUTE,
 * given a copy of `name` and put in state SIMIX_RUNNING. The SURF
 * workstation handle of every host is collected into a freshly allocated
 * array and, unless the model checker is enabled, passed to
 * execute_parallel_task() with the computation/communication amounts and
 * `rate`; the SIMIX action is then attached to the SURF action as its data.
 * NOTE(review): `amount` is not used in the visible lines.
 * NOTE(review): workstation_list is allocated unconditionally but only
 * handed to SURF when MC is disabled; under MC it looks leaked. Whether SURF
 * takes ownership of the array in the other case cannot be told from here --
 * confirm before adding a free.
 * NOTE(review): the declaration of `i` and the return statement are not
 * visible in this excerpt. */
321 smx_action_t SIMIX_host_parallel_execute( const char *name,
322 int host_nb, smx_host_t *host_list,
323 double *computation_amount, double *communication_amount,
324 double amount, double rate)
326 void **workstation_list = NULL;
329 /* alloc structures and initialize */
330 smx_action_t action = xbt_mallocator_get(simix_global->action_mallocator);
331 action->type = SIMIX_ACTION_PARALLEL_EXECUTE;
332 action->name = xbt_strdup(name);
333 action->state = SIMIX_RUNNING;
334 action->execution.host = NULL; /* FIXME: do we need the list of hosts? */
337 action->category = NULL;
340 /* collect the SURF workstation handle of every participating host */
341 workstation_list = xbt_new0(void *, host_nb);
342 for (i = 0; i < host_nb; i++)
343 workstation_list[i] = host_list[i]->host;
345 /* set surf's action */
346 if (!MC_IS_ENABLED) {
347 action->execution.surf_exec =
348 surf_workstation_model->extension.workstation.
349 execute_parallel_task(host_nb, workstation_list, computation_amount,
350 communication_amount, rate);
352 surf_workstation_model->action_data_set(action->execution.surf_exec, action);
354 XBT_DEBUG("Create parallel execute action %p", action);
/* Releases an execution action: drops the reference held on the SURF action
 * (if any), remembering the result of action_unref() in `destroyed` and
 * clearing the pointer, then frees the action's name and gives the action
 * back to the action mallocator.
 * NOTE(review): the declaration of `destroyed` and whether the final
 * free/release is conditional on it are not visible in this excerpt. */
359 void SIMIX_host_execution_destroy(smx_action_t action)
362 XBT_DEBUG("Destroy action %p", action);
365 if (action->execution.surf_exec) {
366 destroyed = surf_workstation_model->action_unref(action->execution.surf_exec);
367 action->execution.surf_exec = NULL;
371 xbt_free(action->name);
372 xbt_mallocator_release(simix_global->action_mallocator, action);
376 void SIMIX_host_execution_cancel(smx_action_t action)
378 XBT_DEBUG("Cancel action %p", action);
380 if (action->execution.surf_exec)
381 surf_workstation_model->action_cancel(action->execution.surf_exec);
/* Returns the remaining amount of an execution: when the action is in state
 * SIMIX_RUNNING, `result` is taken from the workstation model's
 * get_remains() on the SURF action.
 * NOTE(review): the declaration/initial value of `result` and the return
 * statement are not visible in this excerpt.
 * NOTE(review): unlike its sibling accessors, this function guards on the
 * state rather than on surf_exec being non-NULL. SIMIX_host_execute() leaves
 * a RUNNING action without assigning surf_exec when MC_IS_ENABLED, so a NULL
 * SURF action could reach get_remains() -- confirm whether that path is
 * reachable. */
384 double SIMIX_host_execution_get_remains(smx_action_t action)
388 if (action->state == SIMIX_RUNNING)
389 result = surf_workstation_model->get_remains(action->execution.surf_exec);
394 e_smx_state_t SIMIX_host_execution_get_state(smx_action_t action)
396 return action->state;
399 void SIMIX_host_execution_set_priority(smx_action_t action, double priority)
401 if(action->execution.surf_exec)
402 surf_workstation_model->set_priority(action->execution.surf_exec, priority);
/* Handler of the "wait for execution" simcall: reads the execution action
 * from the simcall, appends the simcall to the action's simcall fifo and
 * records the action as the one the issuer is waiting for. If the action is
 * no longer SIMIX_RUNNING, SIMIX_execution_finish() is called right away.
 * NOTE(review): the two statements that force the state to SIMIX_DONE and
 * finish the action are guarded by lines that are not visible in this
 * excerpt (presumably a model-checker-only shortcut with an early return) --
 * confirm against the complete file. */
405 void SIMIX_pre_host_execution_wait(smx_simcall_t simcall)
407 smx_action_t action = simcall->host_execution_wait.execution;
409 XBT_DEBUG("Wait for execution of action %p, state %d", action, (int)action->state);
411 /* Associate this simcall to the action */
412 xbt_fifo_push(action->simcalls, simcall);
413 simcall->issuer->waiting_action = action;
415 /* set surf's action */
417 action->state = SIMIX_DONE;
418 SIMIX_execution_finish(action);
422 /* If the action is already finished then perform the error handling */
423 if (action->state != SIMIX_RUNNING)
424 SIMIX_execution_finish(action);
427 void SIMIX_host_execution_suspend(smx_action_t action)
429 if(action->execution.surf_exec)
430 surf_workstation_model->suspend(action->execution.surf_exec);
433 void SIMIX_host_execution_resume(smx_action_t action)
435 if(action->execution.surf_exec)
436 surf_workstation_model->resume(action->execution.surf_exec);
/* Completes an execution action: every simcall queued on the action is
 * handled according to the action's state and then answered, after which the
 * action is destroyed.
 * Per-state handling visible here: a debug message on success; on host
 * failure the issuer's context is flagged with iwannadie; on cancellation a
 * cancel_error exception is raised for the issuer; any other state is an
 * internal error (xbt_die).
 * NOTE(review): the case labels, the break statements and the argument of
 * xbt_die() are not visible in this excerpt. */
439 void SIMIX_execution_finish(smx_action_t action)
441 xbt_fifo_item_t item;
442 smx_simcall_t simcall;
444 xbt_fifo_foreach(action->simcalls, item, simcall, smx_simcall_t) {
446 switch (action->state) {
449 /* do nothing, action done */
450 XBT_DEBUG("SIMIX_execution_finished: execution successful");
454 XBT_DEBUG("SIMIX_execution_finished: host '%s' failed", simcall->issuer->smx_host->name);
455 simcall->issuer->context->iwannadie = 1;
456 //SMX_EXCEPTION(simcall->issuer, host_error, 0, "Host failed");
460 XBT_DEBUG("SIMIX_execution_finished: execution canceled");
461 SMX_EXCEPTION(simcall->issuer, cancel_error, 0, "Canceled");
465 xbt_die("Internal error in SIMIX_execution_finish: unexpected action state %d",
/* Independently of the action's state, an issuer whose own host is not ON is
 * flagged with iwannadie as well. */
468 /* check if the host is down */
469 if (surf_workstation_model->extension.
470 workstation.get_state(simcall->issuer->smx_host->host) != SURF_RESOURCE_ON) {
471 simcall->issuer->context->iwannadie = 1;
/* Detach the issuer from the action, report the final state as the
 * simcall's result and answer the simcall. */
474 simcall->issuer->waiting_action = NULL;
475 simcall->host_execution_wait.result = action->state;
476 SIMIX_simcall_answer(simcall);
479 /* We no longer need it */
480 SIMIX_host_execution_destroy(action);
483 void SIMIX_post_host_execute(smx_action_t action)
485 if (action->type == SIMIX_ACTION_EXECUTE && /* FIMXE: handle resource failure
486 * for parallel tasks too */
487 surf_workstation_model->extension.workstation.get_state(action->execution.host->host) == SURF_RESOURCE_OFF) {
488 /* If the host running the action failed, notice it so that the asking
489 * process can be killed if it runs on that host itself */
490 action->state = SIMIX_FAILED;
491 } else if (surf_workstation_model->action_state_get(action->execution.surf_exec) == SURF_ACTION_FAILED) {
492 /* If the host running the action didn't fail, then the action was
494 action->state = SIMIX_CANCELED;
496 action->state = SIMIX_DONE;
499 if (action->execution.surf_exec) {
500 surf_workstation_model->action_unref(action->execution.surf_exec);
501 action->execution.surf_exec = NULL;
504 /* If there are simcalls associated with the action, then answer them */
505 if (xbt_fifo_size(action->simcalls)) {
506 SIMIX_execution_finish(action);
512 void SIMIX_set_category(smx_action_t action, const char *category)
514 if (action->state != SIMIX_RUNNING) return;
515 if (action->type == SIMIX_ACTION_EXECUTE){
516 surf_workstation_model->set_category(action->execution.surf_exec, category);
517 }else if (action->type == SIMIX_ACTION_COMMUNICATE){
518 surf_workstation_model->set_category(action->comm.surf_comm, category);