X-Git-Url: http://info.iut-bm.univ-fcomte.fr/pub/gitweb/simgrid.git/blobdiff_plain/be25aefab9c2c610e764c6b3ddd0df1c2c9a4797..dba3d7f060245c8df8f6dbb627f5ecf65ddc2ea7:/src/msg/msg_mailbox.c diff --git a/src/msg/msg_mailbox.c b/src/msg/msg_mailbox.c index 3e26bd59af..5de723af44 100644 --- a/src/msg/msg_mailbox.c +++ b/src/msg/msg_mailbox.c @@ -1,150 +1,62 @@ +/* Mailboxes in MSG */ + +/* Copyright (c) 2008, 2009, 2010. The SimGrid Team. + * All rights reserved. */ + +/* This program is free software; you can redistribute it and/or modify it + * under the terms of the license (GNU LGPL) which comes with this package. */ + #include "mailbox.h" #include "msg/private.h" - XBT_LOG_NEW_DEFAULT_SUBCATEGORY(msg_mailbox, msg, "Logging specific to MSG (mailbox)"); -static xbt_dict_t msg_mailboxes = NULL; - -void MSG_mailbox_mod_init(void) -{ - msg_mailboxes = xbt_dict_new(); -} - -void MSG_mailbox_mod_exit(void) -{ - xbt_dict_free(&msg_mailboxes); -} - -msg_mailbox_t MSG_mailbox_create(const char *alias) -{ - msg_mailbox_t mailbox = xbt_new0(s_msg_mailbox_t, 1); - - mailbox->tasks = xbt_fifo_new(); - mailbox->cond = NULL; - mailbox->alias = alias ? xbt_strdup(alias) : NULL; - mailbox->hostname = NULL; - - return mailbox; -} - msg_mailbox_t MSG_mailbox_new(const char *alias) { - msg_mailbox_t mailbox = MSG_mailbox_create(alias); - - /* add the mbox in the dictionary */ - xbt_dict_set(msg_mailboxes, alias, mailbox, MSG_mailbox_free); - - return mailbox; + return SIMIX_req_rdv_create(alias); } void MSG_mailbox_free(void *mailbox) { - msg_mailbox_t _mailbox = (msg_mailbox_t) mailbox; - - if (_mailbox->hostname) - free(_mailbox->hostname); - - xbt_fifo_free(_mailbox->tasks); - free(_mailbox->alias); - - free(_mailbox); -} - -smx_cond_t MSG_mailbox_get_cond(msg_mailbox_t mailbox) -{ - return mailbox->cond; -} - -void MSG_mailbox_remove(msg_mailbox_t mailbox, m_task_t task) -{ - xbt_fifo_remove(mailbox->tasks, task); + SIMIX_req_rdv_destroy((msg_mailbox_t)mailbox); } int MSG_mailbox_is_empty(msg_mailbox_t mailbox) { - return (NULL == xbt_fifo_get_first_item(mailbox->tasks)); -} - -m_task_t MSG_mailbox_pop_head(msg_mailbox_t mailbox) -{ - return (m_task_t) xbt_fifo_shift(mailbox->tasks); + return (NULL == SIMIX_req_rdv_get_head(mailbox)); } m_task_t MSG_mailbox_get_head(msg_mailbox_t mailbox) { - xbt_fifo_item_t item; + smx_action_t comm = SIMIX_req_rdv_get_head(mailbox); - if (!(item = xbt_fifo_get_first_item(mailbox->tasks))) + if (!comm) return NULL; - return (m_task_t) xbt_fifo_get_item_content(item); -} - - -m_task_t MSG_mailbox_get_first_host_task(msg_mailbox_t mailbox, m_host_t host) -{ - m_task_t task = NULL; - xbt_fifo_item_t item = NULL; - - xbt_fifo_foreach(mailbox->tasks, item, task, m_task_t) - if (task->simdata->source == host) { - xbt_fifo_remove_item(mailbox->tasks, item); - return task; - } - - return NULL; + return (m_task_t) SIMIX_req_comm_get_src_data(comm); } int -MSG_mailbox_get_count_host_waiting_tasks(msg_mailbox_t mailbox, m_host_t host) -{ - m_task_t task = NULL; - xbt_fifo_item_t item = NULL; - int count = 0; - - xbt_fifo_foreach(mailbox->tasks, item, task, m_task_t) { - if (task->simdata->source == host) - count++; - } - - return count; -} - -void MSG_mailbox_set_cond(msg_mailbox_t mailbox, smx_cond_t cond) -{ - mailbox->cond = cond; -} - -const char *MSG_mailbox_get_alias(msg_mailbox_t mailbox) -{ - return mailbox->alias; -} - -const char *MSG_mailbox_get_hostname(msg_mailbox_t mailbox) -{ - return mailbox->hostname; -} - -void MSG_mailbox_set_hostname(msg_mailbox_t mailbox, const char *hostname) +MSG_mailbox_get_count_host_waiting_tasks(msg_mailbox_t mailbox, + m_host_t host) { - mailbox->hostname = xbt_strdup(hostname); + return SIMIX_req_rdv_comm_count_by_host(mailbox, + host->simdata->smx_host); } msg_mailbox_t MSG_mailbox_get_by_alias(const char *alias) { - msg_mailbox_t mailbox = xbt_dict_get_or_null(msg_mailboxes, alias); + msg_mailbox_t mailbox = SIMIX_req_rdv_get_by_name(alias); - if (!mailbox) { + if (!mailbox) mailbox = MSG_mailbox_new(alias); - MSG_mailbox_set_hostname(mailbox, MSG_host_self()->name); - } return mailbox; } -msg_mailbox_t MSG_mailbox_get_by_channel(m_host_t host, m_channel_t channel) +msg_mailbox_t MSG_mailbox_get_by_channel(m_host_t host, + m_channel_t channel) { xbt_assert0((host != NULL), "Invalid host"); xbt_assert1((channel >= 0) @@ -158,283 +70,133 @@ MSG_error_t MSG_mailbox_get_task_ext(msg_mailbox_t mailbox, m_task_t * task, m_host_t host, double timeout) { - m_process_t process = MSG_process_self(); - m_task_t t = NULL; - m_host_t h = NULL; - simdata_task_t t_simdata = NULL; - simdata_host_t h_simdata = NULL; - double start_time = SIMIX_get_clock(); - - smx_cond_t cond = NULL; //conditional wait if the task isn't on the channel yet + xbt_ex_t e; + MSG_error_t ret = MSG_OK; + smx_action_t comm = NULL; +#ifdef HAVE_TRACING + double start_time = 0; +#endif + /* We no longer support getting a task from a specific host */ + if (host) + THROW_UNIMPLEMENTED; CHECK_HOST(); +#ifdef HAVE_TRACING + TRACE_msg_task_get_start(); + start_time = MSG_get_clock(); +#endif /* Sanity check */ xbt_assert0(task, "Null pointer for the task storage"); if (*task) CRITICAL0 - ("MSG_task_get() was asked to write in a non empty task struct."); - - /* Get the task */ - h = MSG_host_self(); - h_simdata = h->simdata; - - SIMIX_mutex_lock(h_simdata->mutex); //FIXME: lock the mailbox instead - - if (MSG_mailbox_get_cond(mailbox)) { - CRITICAL1 - ("A process is already blocked on the channel %s (meaning that someone is already doing a get on this)", - MSG_mailbox_get_alias(mailbox)); - SIMIX_cond_display_info(MSG_mailbox_get_cond(mailbox)); - xbt_die("Go fix your code!"); + ("MSG_task_get() was asked to write in a non empty task struct."); + + /* Try to receive it by calling SIMIX network layer */ + TRY { + comm = SIMIX_req_comm_irecv(mailbox, task, NULL, NULL, NULL); + SIMIX_req_comm_wait(comm, timeout); + (*task)->simdata->comm = comm; + SIMIX_req_comm_destroy(comm); + DEBUG2("Got task %s from %p",(*task)->name,mailbox); + (*task)->simdata->isused=0; } - - while (1) { - /* if the mailbox is not empty (has a task) */ - if (!MSG_mailbox_is_empty(mailbox)) { - if (!host) { - /* pop the head of the mailbox */ - t = MSG_mailbox_pop_head(mailbox); - break; - } else { - /* get the first task of the host */ - if ((t = MSG_mailbox_get_first_host_task(mailbox, host))) - break; - } - } - - if ((timeout > 0) && (SIMIX_get_clock() - start_time >= timeout)) { // Timeout already elapsed - SIMIX_mutex_unlock(h_simdata->mutex); - MSG_mailbox_set_cond(mailbox, NULL); - SIMIX_cond_destroy(cond); - MSG_RETURN(MSG_TRANSFER_FAILURE); - } - - if (!cond) { - cond = SIMIX_cond_init(); - MSG_mailbox_set_cond(mailbox, cond); - } - - if (timeout > 0) - SIMIX_cond_wait_timeout(cond, h_simdata->mutex, timeout - start_time); - else - SIMIX_cond_wait(MSG_mailbox_get_cond(mailbox), h_simdata->mutex); - - if (SIMIX_host_get_state(h_simdata->smx_host) == 0) { - SIMIX_mutex_unlock(h_simdata->mutex); - MSG_mailbox_set_cond(mailbox, NULL); - SIMIX_cond_destroy(cond); - MSG_RETURN(MSG_HOST_FAILURE); - } - } - - - DEBUG1("OK, got a task (%s)", t->name); - /* clean conditional */ - if (cond) { - MSG_mailbox_set_cond(mailbox, NULL); - SIMIX_cond_destroy(cond); - } - - SIMIX_mutex_unlock(h_simdata->mutex); - - t_simdata = t->simdata; - t_simdata->receiver = process; - *task = t; - - SIMIX_mutex_lock(t_simdata->mutex); - - /* Transfer */ - /* create SIMIX action to the communication */ - t_simdata->comm = - SIMIX_action_communicate(t_simdata->sender->simdata->m_host-> - simdata->smx_host, - process->simdata->m_host->simdata->smx_host, - t->name, t_simdata->message_size, - t_simdata->rate); - - SIMIX_action_use(t_simdata->comm); - - /* if the process is suspend, create the action but stop its execution, it will be restart when the sender process resume */ - if (MSG_process_is_suspended(t_simdata->sender)) { - DEBUG1("Process sender (%s) suspended", t_simdata->sender->name); - SIMIX_action_set_priority(t_simdata->comm, 0); - } - SIMIX_register_action_to_condition(t_simdata->comm, t_simdata->cond); - // breaking point if asynchrounous - process->simdata->waiting_task = t; - - while (1) { - SIMIX_cond_wait(t_simdata->cond, t_simdata->mutex); - - if (SIMIX_action_get_state(t_simdata->comm) != SURF_ACTION_RUNNING) + CATCH(e) { + switch (e.category) { + case host_error: + ret = MSG_HOST_FAILURE; break; - if (!SIMIX_host_get_state(h_simdata->smx_host)) + case network_error: + ret = MSG_TRANSFER_FAILURE; break; - if (!SIMIX_host_get_state(process->simdata->m_host->simdata->smx_host)) + case timeout_error: + ret = MSG_TIMEOUT; break; + default: + xbt_backtrace_display(&e); + xbt_die(bprintf("Unhandled SIMIX network exception: %s", e.msg)); + } + xbt_ex_free(e); } - SIMIX_unregister_action_to_condition(t_simdata->comm, t_simdata->cond); - process->simdata->waiting_task = NULL; - - /* for this process, don't need to change in get function */ - SIMIX_mutex_unlock(t_simdata->mutex); - - if (SIMIX_action_get_state(t_simdata->comm) == SURF_ACTION_DONE) { - if (SIMIX_action_destroy(t_simdata->comm)) - t_simdata->comm = NULL; - MSG_RETURN(MSG_OK); - } else if (SIMIX_host_get_state(h_simdata->smx_host) == 0) { - if (SIMIX_action_destroy(t_simdata->comm)) - t_simdata->comm = NULL; - MSG_RETURN(MSG_HOST_FAILURE); - } else { - if (SIMIX_action_destroy(t_simdata->comm)) - t_simdata->comm = NULL; - MSG_RETURN(MSG_TRANSFER_FAILURE); + if (ret != MSG_HOST_FAILURE && + ret != MSG_TRANSFER_FAILURE && ret != MSG_TIMEOUT) { +#ifdef HAVE_TRACING + TRACE_msg_task_get_end(start_time, *task); +#endif } + MSG_RETURN(ret); } MSG_error_t MSG_mailbox_put_with_timeout(msg_mailbox_t mailbox, m_task_t task, double timeout) { - m_process_t process = MSG_process_self(); - const char *hostname; + xbt_ex_t e; + MSG_error_t ret = MSG_OK; simdata_task_t t_simdata = NULL; - m_host_t local_host = NULL; - m_host_t remote_host = NULL; - smx_cond_t cond = NULL; - + m_process_t process = MSG_process_self(); + smx_action_t comm; +#ifdef HAVE_TRACING + int call_end = 0; +#endif CHECK_HOST(); +#ifdef HAVE_TRACING + call_end = TRACE_msg_task_put_start(task); //must be after CHECK_HOST() +#endif + + + /* Prepare the task to send */ t_simdata = task->simdata; t_simdata->sender = process; - t_simdata->source = MSG_process_get_host(process); + t_simdata->source = MSG_host_self(); - xbt_assert0(t_simdata->refcount == 1, + xbt_assert0(t_simdata->isused == 0, "This task is still being used somewhere else. You cannot send it now. Go fix your code!"); - t_simdata->comm = NULL; - - t_simdata->refcount++; - local_host = ((simdata_process_t) process->simdata)->m_host; + t_simdata->isused=1; msg_global->sent_msg++; - /* get the host name containing the mailbox */ - hostname = MSG_mailbox_get_hostname(mailbox); - - remote_host = MSG_get_host_by_name(hostname); - - if (!remote_host) - THROW1(not_found_error, 0, "Host %s not fount", hostname); - - - DEBUG4("Trying to send a task (%g kB) from %s to %s on the channel %s", - t_simdata->message_size / 1000, local_host->name, - remote_host->name, MSG_mailbox_get_alias(mailbox)); - - SIMIX_mutex_lock(remote_host->simdata->mutex); /* FIXME: lock the mailbox instead */ - - /* put the task in the mailbox */ - xbt_fifo_push(mailbox->tasks, task); - - if ((cond = MSG_mailbox_get_cond(mailbox))) { - DEBUG0("Somebody is listening. Let's wake him up!"); - SIMIX_cond_signal(cond); + process->simdata->waiting_task = task; + + /* Try to send it by calling SIMIX network layer */ + TRY { + comm = SIMIX_req_comm_isend(mailbox, t_simdata->message_size, + t_simdata->rate, task, sizeof(void *), NULL, NULL); + t_simdata->comm = comm; +#ifdef HAVE_TRACING + SIMIX_req_set_category(comm, task->category); +#endif + SIMIX_req_comm_wait(comm, timeout); + SIMIX_req_comm_destroy(comm); } - SIMIX_mutex_unlock(remote_host->simdata->mutex); - - SIMIX_mutex_lock(t_simdata->mutex); - - process->simdata->waiting_task = task; // for debugging and status displaying purpose - - if (timeout > 0) { - xbt_ex_t e; - double time; - double time_elapsed; - time = SIMIX_get_clock(); - - TRY { - /*verify if the action that ends is the correct. Call the wait_timeout with the new time. If the timeout occurs, an exception is raised */ - while (1) { - time_elapsed = SIMIX_get_clock() - time; - SIMIX_cond_wait_timeout(t_simdata->cond, t_simdata->mutex, - timeout - time_elapsed); - - if (t_simdata->comm) - SIMIX_action_use(t_simdata->comm); - if (t_simdata->comm && (SIMIX_action_get_state(t_simdata->comm) != - SURF_ACTION_RUNNING)) - break; - if (!SIMIX_host_get_state(local_host->simdata->smx_host)) - break; - if (!SIMIX_host_get_state(remote_host->simdata->smx_host)) - break; - } - } - CATCH(e) { - if (e.category == timeout_error) { - xbt_ex_free(e); - /* verify if the timeout happened and the communication didn't started yet */ - if (t_simdata->comm == NULL) { - DEBUG1("Action terminated %s (there was a timeout)", task->name); - process->simdata->waiting_task = NULL; - - /* remove the task from the mailbox */ - MSG_mailbox_remove(mailbox, task); - -/* if (t_simdata->receiver && t_simdata->receiver->simdata) { /\* receiver still around *\/ */ -/* t_simdata->receiver->simdata->waiting_task = NULL; */ -/* } */ - - SIMIX_mutex_unlock(t_simdata->mutex); - MSG_RETURN(MSG_TRANSFER_FAILURE); - } - } else { - RETHROW; - } - } - } else { - while (1) { //FIXME: factorize with the code right above - SIMIX_cond_wait(t_simdata->cond, t_simdata->mutex); - - if (t_simdata->comm) - SIMIX_action_use(t_simdata->comm); - if (t_simdata->comm - && SIMIX_action_get_state(t_simdata->comm) != SURF_ACTION_RUNNING) - break; - if (!SIMIX_host_get_state(local_host->simdata->smx_host)) - break; - if (!SIMIX_host_get_state(remote_host->simdata->smx_host)) - break; + CATCH(e) { + switch (e.category) { + case host_error: + ret = MSG_HOST_FAILURE; + break; + case network_error: + ret = MSG_TRANSFER_FAILURE; + break; + case timeout_error: + ret = MSG_TIMEOUT; + break; + default: + xbt_die(bprintf("Unhandled SIMIX network exception: %s", e.msg)); } + xbt_ex_free(e); + + /* If the send failed, it is not used anymore */ + t_simdata->isused=0; } - DEBUG1("Action terminated %s", task->name); process->simdata->waiting_task = NULL; -/* if (t_simdata->receiver && t_simdata->receiver->simdata) { /\* receiver still around *\/ */ -/* t_simdata->receiver->simdata->waiting_task = NULL; */ -/* } */ - - SIMIX_mutex_unlock(t_simdata->mutex); - - if (t_simdata->comm - && SIMIX_action_get_state(t_simdata->comm) == SURF_ACTION_DONE) { - if (SIMIX_action_destroy(t_simdata->comm)) - t_simdata->comm = NULL; - t_simdata->refcount--; - MSG_RETURN(MSG_OK); - } else if (SIMIX_host_get_state(local_host->simdata->smx_host) == 0) { - if (t_simdata->comm && SIMIX_action_destroy(t_simdata->comm)) - t_simdata->comm = NULL; - MSG_RETURN(MSG_HOST_FAILURE); - } else { - if (t_simdata->comm && SIMIX_action_destroy(t_simdata->comm)) - t_simdata->comm = NULL; - MSG_RETURN(MSG_TRANSFER_FAILURE); - } +#ifdef HAVE_TRACING + if (call_end) + TRACE_msg_task_put_end(); +#endif + MSG_RETURN(ret); }