Logo AND Algorithmique Numérique Distribuée

Public GIT Repository
[trace] Do not split comm if trace is not active.
[simgrid.git] / src / msg / msg_mailbox.c
index b6cba21..cd5990b 100644 (file)
+/* Mailboxes in MSG */
+
+/* Copyright (c) 2008, 2009, 2010. The SimGrid Team.
+ * All rights reserved.                                                     */
+
+/* This program is free software; you can redistribute it and/or modify it
+ * under the terms of the license (GNU LGPL) which comes with this package. */
+
 #include "mailbox.h"
 #include "msg/private.h"
-
 XBT_LOG_NEW_DEFAULT_SUBCATEGORY(msg_mailbox, msg,
                                 "Logging specific to MSG (mailbox)");
 
-static xbt_dict_t msg_mailboxes = NULL;
-
-void MSG_mailbox_mod_init(void)
-{
-  msg_mailboxes = xbt_dict_new();
-}
-
-void MSG_mailbox_mod_exit(void)
-{
-  xbt_dict_free(&msg_mailboxes);
-}
-
-msg_mailbox_t MSG_mailbox_create(const char *alias)
-{
-  msg_mailbox_t mailbox = xbt_new0(s_msg_mailbox_t, 1);
-
-  mailbox->tasks = xbt_fifo_new();
-  mailbox->cond = NULL;
-  mailbox->alias = alias ? xbt_strdup(alias) : NULL;
-  mailbox->hostname = NULL;
-
-  return mailbox;
-}
-
 msg_mailbox_t MSG_mailbox_new(const char *alias)
 {
-  msg_mailbox_t mailbox = MSG_mailbox_create(alias);
-
-  /* add the mbox in the dictionary */
-  xbt_dict_set(msg_mailboxes, alias, mailbox, MSG_mailbox_free);
-
-  return mailbox;
+  return SIMIX_req_rdv_create(alias);
 }
 
 void MSG_mailbox_free(void *mailbox)
 {
-  msg_mailbox_t _mailbox = (msg_mailbox_t) mailbox;
-
-  if (_mailbox->hostname)
-    free(_mailbox->hostname);
-
-  xbt_fifo_free(_mailbox->tasks);
-  free(_mailbox->alias);
-
-  free(_mailbox);
-}
-
-smx_cond_t MSG_mailbox_get_cond(msg_mailbox_t mailbox)
-{
-  return mailbox->cond;
-}
-
-void MSG_mailbox_remove(msg_mailbox_t mailbox, m_task_t task)
-{
-  xbt_fifo_remove(mailbox->tasks, task);
+  SIMIX_req_rdv_destroy((msg_mailbox_t)mailbox);
 }
 
 int MSG_mailbox_is_empty(msg_mailbox_t mailbox)
 {
-  return (NULL == xbt_fifo_get_first_item(mailbox->tasks));
-}
-
-m_task_t MSG_mailbox_pop_head(msg_mailbox_t mailbox)
-{
-  return (m_task_t) xbt_fifo_shift(mailbox->tasks);
+  return (NULL == SIMIX_req_rdv_get_head(mailbox));
 }
 
 m_task_t MSG_mailbox_get_head(msg_mailbox_t mailbox)
 {
-  xbt_fifo_item_t item;
+  smx_action_t comm = SIMIX_req_rdv_get_head(mailbox);
 
-  if (!(item = xbt_fifo_get_first_item(mailbox->tasks)))
+  if (!comm)
     return NULL;
 
-  return (m_task_t) xbt_fifo_get_item_content(item);
-}
-
-
-m_task_t MSG_mailbox_get_first_host_task(msg_mailbox_t mailbox, m_host_t host)
-{
-  m_task_t task = NULL;
-  xbt_fifo_item_t item = NULL;
-
-  xbt_fifo_foreach(mailbox->tasks, item, task, m_task_t)
-    if (task->simdata->source == host) {
-    xbt_fifo_remove_item(mailbox->tasks, item);
-    return task;
-  }
-
-  return NULL;
+  return (m_task_t) SIMIX_req_comm_get_src_data(comm);
 }
 
 int
-MSG_mailbox_get_count_host_waiting_tasks(msg_mailbox_t mailbox, m_host_t host)
-{
-  m_task_t task = NULL;
-  xbt_fifo_item_t item = NULL;
-  int count = 0;
-
-  xbt_fifo_foreach(mailbox->tasks, item, task, m_task_t) {
-    if (task->simdata->source == host)
-      count++;
-  }
-
-  return count;
-}
-
-void MSG_mailbox_set_cond(msg_mailbox_t mailbox, smx_cond_t cond)
-{
-  mailbox->cond = cond;
-}
-
-const char *MSG_mailbox_get_alias(msg_mailbox_t mailbox)
-{
-  return mailbox->alias;
-}
-
-const char *MSG_mailbox_get_hostname(msg_mailbox_t mailbox)
-{
-  return mailbox->hostname;
-}
-
-void MSG_mailbox_set_hostname(msg_mailbox_t mailbox, const char *hostname)
+MSG_mailbox_get_count_host_waiting_tasks(msg_mailbox_t mailbox,
+                                         m_host_t host)
 {
-  mailbox->hostname = xbt_strdup(hostname);
+  return SIMIX_req_rdv_comm_count_by_host(mailbox,
+                                      host->simdata->smx_host);
 }
 
 msg_mailbox_t MSG_mailbox_get_by_alias(const char *alias)
 {
 
-  msg_mailbox_t mailbox = xbt_dict_get_or_null(msg_mailboxes, alias);
+  msg_mailbox_t mailbox = SIMIX_req_rdv_get_by_name(alias);
 
-  if (!mailbox) {
+  if (!mailbox)
     mailbox = MSG_mailbox_new(alias);
-    MSG_mailbox_set_hostname(mailbox, MSG_host_self()->name);
-  }
 
   return mailbox;
 }
 
-msg_mailbox_t MSG_mailbox_get_by_channel(m_host_t host, m_channel_t channel)
+msg_mailbox_t MSG_mailbox_get_by_channel(m_host_t host,
+                                         m_channel_t channel)
 {
-  xbt_assert0((host != NULL), "Invalid host");
-  xbt_assert1((channel >= 0)
+  xbt_assert((host != NULL), "Invalid host");
+  xbt_assert((channel >= 0)
               && (channel < msg_global->max_channel), "Invalid channel %d",
               channel);
 
@@ -158,282 +70,135 @@ MSG_error_t
 MSG_mailbox_get_task_ext(msg_mailbox_t mailbox, m_task_t * task,
                          m_host_t host, double timeout)
 {
-  m_process_t process = MSG_process_self();
-  m_task_t t = NULL;
-  m_host_t h = NULL;
-  simdata_task_t t_simdata = NULL;
-  simdata_host_t h_simdata = NULL;
-  double start_time = SIMIX_get_clock();
-
-  smx_cond_t cond = NULL;       //conditional wait if the task isn't on the channel yet
+  xbt_ex_t e;
+  MSG_error_t ret = MSG_OK;
+  /* Receiving from one specific host is no longer supported: a non-NULL host is rejected */
+  if (host)
+    THROW_UNIMPLEMENTED;
 
   CHECK_HOST();
+#ifdef HAVE_TRACING
+  TRACE_msg_task_get_start();
+  double start_time = MSG_get_clock();
+#endif
 
   /* Sanity check */
-  xbt_assert0(task, "Null pointer for the task storage");
+  xbt_assert(task, "Null pointer for the task storage");
 
   if (*task)
-    CRITICAL0
-      ("MSG_task_get() was asked to write in a non empty task struct.");
-
-  /* Get the task */
-  h = MSG_host_self();
-  h_simdata = h->simdata;
-
-  SIMIX_mutex_lock(h->simdata->mutex);
-
-  if (MSG_mailbox_get_cond(mailbox)) {
-    CRITICAL1("A process is already blocked on the channel %s",
-              MSG_mailbox_get_alias(mailbox));
-    SIMIX_cond_display_info(MSG_mailbox_get_cond(mailbox));
-    xbt_die("Go fix your code!");
-  }
-
-  while (1) {
-    /* if the mailbox is empty (has no task */
-    if (!MSG_mailbox_is_empty(mailbox)) {
-      if (!host) {
-        /* pop the head of the mailbox */
-        t = MSG_mailbox_pop_head(mailbox);
-        break;
-      } else {
-        /* get the first task of the host */
-        if ((t = MSG_mailbox_get_first_host_task(mailbox, host)))
-          break;
-      }
-    }
-
-    if ((timeout > 0) && (SIMIX_get_clock() - start_time >= timeout)) {
-      SIMIX_mutex_unlock(h->simdata->mutex);
-      MSG_mailbox_set_cond(mailbox, NULL);
-      SIMIX_cond_destroy(cond);
-      MSG_RETURN(MSG_TRANSFER_FAILURE);
-    }
-
-    if (!cond) {
-      cond = SIMIX_cond_init();
-      MSG_mailbox_set_cond(mailbox, cond);
-    }
-
-    if (timeout > 0)
-      SIMIX_cond_wait_timeout(cond, h->simdata->mutex, timeout - start_time);
-    else
-      SIMIX_cond_wait(MSG_mailbox_get_cond(mailbox), h->simdata->mutex);
-
-    if (SIMIX_host_get_state(h_simdata->smx_host) == 0) {
-      SIMIX_mutex_unlock(h->simdata->mutex);
-      MSG_mailbox_set_cond(mailbox, NULL);
-      SIMIX_cond_destroy(cond);
-      MSG_RETURN(MSG_HOST_FAILURE);
-    }
-  }
-
-
-  DEBUG1("OK, got a task (%s)", t->name);
-  /* clean conditional */
-  if (cond) {
-    MSG_mailbox_set_cond(mailbox, NULL);
-    SIMIX_cond_destroy(cond);
-  }
-
-  SIMIX_mutex_unlock(h->simdata->mutex);
-
-  t_simdata = t->simdata;
-  t_simdata->receiver = process;
-  *task = t;
-
-  SIMIX_mutex_lock(t_simdata->mutex);
-
-  /* Transfer */
-  /* create SIMIX action to the communication */
-  t_simdata->comm =
-    SIMIX_action_communicate(t_simdata->sender->simdata->m_host->simdata->
-                             smx_host,
-                             process->simdata->m_host->simdata->smx_host,
-                             t->name, t_simdata->message_size,
-                             t_simdata->rate);
-
-  SIMIX_action_use(t_simdata->comm);
-
-  /* if the process is suspend, create the action but stop its execution, it will be restart when the sender process resume */
-  if (MSG_process_is_suspended(t_simdata->sender)) {
-    DEBUG1("Process sender (%s) suspended", t_simdata->sender->name);
-    SIMIX_action_set_priority(t_simdata->comm, 0);
+    XBT_CRITICAL
+        ("MSG_task_get() was asked to write in a non empty task struct.");
+
+  /* Try to receive the task through the SIMIX network layer */
+  TRY {
+    SIMIX_req_comm_recv(mailbox, task, NULL, NULL, NULL, timeout);
+    XBT_DEBUG("Got task %s from %p",(*task)->name,mailbox);
+    (*task)->simdata->isused=0;
   }
-
-  process->simdata->waiting_task = t;
-  SIMIX_register_action_to_condition(t_simdata->comm, t_simdata->cond);
-
-  while (1) {
-    SIMIX_cond_wait(t_simdata->cond, t_simdata->mutex);
-
-    if (SIMIX_action_get_state(t_simdata->comm) != SURF_ACTION_RUNNING)
+  CATCH(e) {
+    switch (e.category) {
+    case host_error:
+      ret = MSG_HOST_FAILURE;
       break;
-    if (!SIMIX_host_get_state(h_simdata->smx_host))
+    case network_error:
+      ret = MSG_TRANSFER_FAILURE;
       break;
-    if (!SIMIX_host_get_state(process->simdata->m_host->simdata->smx_host))
+    case timeout_error:
+      ret = MSG_TIMEOUT;
       break;
+    default:
+      RETHROW;
+    }
+    xbt_ex_free(e);
   }
 
-  SIMIX_unregister_action_to_condition(t_simdata->comm, t_simdata->cond);
-  process->simdata->waiting_task = NULL;
-
-  /* for this process, don't need to change in get function */
-  SIMIX_mutex_unlock(t_simdata->mutex);
-
-  if (SIMIX_action_get_state(t_simdata->comm) == SURF_ACTION_DONE) {
-    if (SIMIX_action_destroy(t_simdata->comm))
-      t_simdata->comm = NULL;
-    MSG_RETURN(MSG_OK);
-  } else if (SIMIX_host_get_state(h_simdata->smx_host) == 0) {
-    if (SIMIX_action_destroy(t_simdata->comm))
-      t_simdata->comm = NULL;
-    MSG_RETURN(MSG_HOST_FAILURE);
-  } else {
-    if (SIMIX_action_destroy(t_simdata->comm))
-      t_simdata->comm = NULL;
-    MSG_RETURN(MSG_TRANSFER_FAILURE);
+#ifdef HAVE_TRACING
+  if (ret != MSG_HOST_FAILURE &&
+      ret != MSG_TRANSFER_FAILURE &&
+      ret != MSG_TIMEOUT) {
+    TRACE_msg_task_get_end(start_time, *task);
   }
+#endif
+  MSG_RETURN(ret);
 }
 
 MSG_error_t
 MSG_mailbox_put_with_timeout(msg_mailbox_t mailbox, m_task_t task,
                              double timeout)
 {
-  m_process_t process = MSG_process_self();
-  const char *hostname;
+  xbt_ex_t e;
+  MSG_error_t ret = MSG_OK;
   simdata_task_t t_simdata = NULL;
-  m_host_t local_host = NULL;
-  m_host_t remote_host = NULL;
-  smx_cond_t cond = NULL;
-
+  m_process_t process = MSG_process_self();
+  simdata_process_t p_simdata = SIMIX_process_self_get_data();
+#ifdef HAVE_TRACING
+  volatile smx_action_t comm = NULL;
+  int call_end = 0;
+#endif
   CHECK_HOST();
 
+#ifdef HAVE_TRACING
+  call_end = TRACE_msg_task_put_start(task);    //must be after CHECK_HOST()
+#endif
+
+  /* Prepare the task to send */
   t_simdata = task->simdata;
   t_simdata->sender = process;
-  t_simdata->source = MSG_process_get_host(process);
+  t_simdata->source = MSG_host_self();
 
-  xbt_assert0(t_simdata->refcount == 1,
+  xbt_assert(t_simdata->isused == 0,
               "This task is still being used somewhere else. You cannot send it now. Go fix your code!");
 
-  t_simdata->comm = NULL;
-
-  t_simdata->refcount++;
-  local_host = ((simdata_process_t) process->simdata)->m_host;
+  t_simdata->isused=1;
   msg_global->sent_msg++;
 
-  /* get the host name containing the mailbox */
-  hostname = MSG_mailbox_get_hostname(mailbox);
-
-  remote_host = MSG_get_host_by_name(hostname);
 
-  if (!remote_host)
-    THROW1(not_found_error, 0, "Host %s not fount", hostname);
-
-
-  DEBUG4("Trying to send a task (%g kB) from %s to %s on the channel %s",
-         t_simdata->message_size / 1000, local_host->name,
-         remote_host->name, MSG_mailbox_get_alias(mailbox));
-
-  SIMIX_mutex_lock(remote_host->simdata->mutex);
-
-  /* put the task in the mailbox */
-  xbt_fifo_push(mailbox->tasks, task);
-
-  if ((cond = MSG_mailbox_get_cond(mailbox))) {
-    DEBUG0("Somebody is listening. Let's wake him up!");
-    SIMIX_cond_signal(cond);
+  p_simdata->waiting_task = task;
+
+  /* Try to send the task through the SIMIX network layer */
+  TRY {
+#ifdef HAVE_TRACING
+    if (TRACE_is_active()) {
+      comm = SIMIX_req_comm_isend(mailbox, t_simdata->message_size,
+                                  t_simdata->rate, task, sizeof(void *),
+                                  NULL, NULL, 0);
+      t_simdata->comm = comm;
+      SIMIX_req_set_category(comm, task->category);
+      SIMIX_req_comm_wait(comm, timeout);
+    } else {
+#endif
+      SIMIX_req_comm_send(mailbox, t_simdata->message_size,
+                          t_simdata->rate, task, sizeof(void*),
+                          NULL, NULL, timeout);
+#ifdef HAVE_TRACING
+    }
+#endif
   }
 
-  SIMIX_mutex_unlock(remote_host->simdata->mutex);
-
-  SIMIX_mutex_lock(t_simdata->mutex);
-
-  process->simdata->waiting_task = task;
-
-  if (timeout > 0) {
-    xbt_ex_t e;
-    double time;
-    double time_elapsed;
-    time = SIMIX_get_clock();
-
-    TRY {
-      /*verify if the action that ends is the correct. Call the wait_timeout with the new time. If the timeout occurs, an exception is raised */
-      while (1) {
-        time_elapsed = SIMIX_get_clock() - time;
-        SIMIX_cond_wait_timeout(t_simdata->cond, t_simdata->mutex,
-                                timeout - time_elapsed);
-
-        if (t_simdata->comm)
-          SIMIX_action_use(t_simdata->comm);
-        if (t_simdata->comm && (SIMIX_action_get_state(t_simdata->comm) !=
-                                SURF_ACTION_RUNNING))
-          break;
-        if (!SIMIX_host_get_state(local_host->simdata->smx_host))
-          break;
-        if (!SIMIX_host_get_state(remote_host->simdata->smx_host))
-          break;
-      }
-    }
-    CATCH(e) {
-      if (e.category == timeout_error) {
-        xbt_ex_free(e);
-        /* verify if the timeout happened and the communication didn't started yet */
-        if (t_simdata->comm == NULL) {
-          DEBUG1("Action terminated %s (there was a timeout)", task->name);
-          process->simdata->waiting_task = NULL;
-
-          /* remove the task from the mailbox */
-          MSG_mailbox_remove(mailbox, task);
-
-/*           if (t_simdata->receiver && t_simdata->receiver->simdata) {    /\* receiver still around *\/ */
-/*             t_simdata->receiver->simdata->waiting_task = NULL; */
-/*           } */
-
-          SIMIX_mutex_unlock(t_simdata->mutex);
-          MSG_RETURN(MSG_TRANSFER_FAILURE);
-        }
-      } else {
-        RETHROW;
-      }
-    }
-  } else {
-    while (1) {
-      SIMIX_cond_wait(t_simdata->cond, t_simdata->mutex);
-
-      if (t_simdata->comm)
-        SIMIX_action_use(t_simdata->comm);
-      if (t_simdata->comm
-          && SIMIX_action_get_state(t_simdata->comm) != SURF_ACTION_RUNNING)
-        break;
-      if (!SIMIX_host_get_state(local_host->simdata->smx_host))
-        break;
-      if (!SIMIX_host_get_state(remote_host->simdata->smx_host))
-        break;
+  CATCH(e) {
+    switch (e.category) {
+    case host_error:
+      ret = MSG_HOST_FAILURE;
+      break;
+    case network_error:
+      ret = MSG_TRANSFER_FAILURE;
+      break;
+    case timeout_error:
+      ret = MSG_TIMEOUT;
+      break;
+    default:
+      RETHROW;
     }
-  }
+    xbt_ex_free(e);
 
-  DEBUG1("Action terminated %s", task->name);
-  process->simdata->waiting_task = NULL;
-/*   if (t_simdata->receiver && t_simdata->receiver->simdata) {    /\* receiver still around *\/ */
-/*     t_simdata->receiver->simdata->waiting_task = NULL; */
-/*   } */
-
-  SIMIX_mutex_unlock(task->simdata->mutex);
-
-  if (t_simdata->comm
-      && SIMIX_action_get_state(t_simdata->comm) == SURF_ACTION_DONE) {
-    if (SIMIX_action_destroy(t_simdata->comm))
-      t_simdata->comm = NULL;
-    t_simdata->refcount--;
-    MSG_RETURN(MSG_OK);
-  } else if (SIMIX_host_get_state(local_host->simdata->smx_host) == 0) {
-    if (t_simdata->comm && SIMIX_action_destroy(t_simdata->comm))
-      t_simdata->comm = NULL;
-    MSG_RETURN(MSG_HOST_FAILURE);
-  } else {
-    if (t_simdata->comm && SIMIX_action_destroy(t_simdata->comm))
-      t_simdata->comm = NULL;
-    MSG_RETURN(MSG_TRANSFER_FAILURE);
+    /* If the send failed, the task is not in use anymore */
+    t_simdata->isused = 0;
   }
+
+  p_simdata->waiting_task = NULL;
+#ifdef HAVE_TRACING
+  if (call_end)
+    TRACE_msg_task_put_end();
+#endif
+  MSG_RETURN(ret);
 }