2 #include "msg/private.h"
/* Declares this file's default logging subcategory, msg_mailbox; the second
 * argument names msg (presumably the parent category -- confirm against the
 * XBT logging macros). */
4 XBT_LOG_NEW_DEFAULT_SUBCATEGORY(msg_mailbox, msg,
5 "Logging specific to MSG (mailbox)");
/* File-private dictionary of mailboxes keyed by alias: created in
 * MSG_mailbox_mod_init(), filled by MSG_mailbox_new(), queried by
 * MSG_mailbox_get_by_alias() and released in MSG_mailbox_mod_exit(). */
7 static xbt_dict_t msg_mailboxes = NULL;
9 void MSG_mailbox_mod_init(void)
11 msg_mailboxes = xbt_dict_new();
14 void MSG_mailbox_mod_exit(void)
16 xbt_dict_free(&msg_mailboxes);
/*
 * Builds a mailbox object that is NOT registered in the alias dictionary
 * (registration is done by MSG_mailbox_new()).
 *
 * alias: name of the mailbox; may be NULL, in which case no name is stored.
 *
 * NOTE(review): this excerpt omits the braces, one statement between the FIFO
 * creation and the alias copy, and the return statement (presumably
 * "return mailbox;" -- confirm against the full file).
 */
19 msg_mailbox_t MSG_mailbox_create(const char *alias)
/* one s_msg_mailbox_t allocated through xbt_new0 */
21 msg_mailbox_t mailbox = xbt_new0(s_msg_mailbox_t, 1);
/* queue of tasks waiting in this mailbox */
23 mailbox->tasks = xbt_fifo_new();
/* the mailbox keeps its own copy of the alias; released in MSG_mailbox_free() */
25 mailbox->alias = alias ? xbt_strdup(alias) : NULL;
/* no owner host yet; set later through MSG_mailbox_set_hostname() */
26 mailbox->hostname = NULL;
/*
 * Creates a mailbox with MSG_mailbox_create() and registers it in the
 * msg_mailboxes dictionary under alias.
 *
 * NOTE(review): alias is used directly as the dictionary key although
 * MSG_mailbox_create() tolerates a NULL alias; whether xbt_dict_set() accepts
 * a NULL key is not visible here -- confirm.
 * NOTE(review): the braces and the return statement are not visible in this
 * excerpt.
 */
31 msg_mailbox_t MSG_mailbox_new(const char *alias)
33 msg_mailbox_t mailbox = MSG_mailbox_create(alias);
35 /* add the mbox in the dictionary; MSG_mailbox_free is passed along as the
   function associated with the entry (presumably its destructor) */
36 xbt_dict_set(msg_mailboxes, alias, mailbox, MSG_mailbox_free);
/*
 * Releases the resources owned by a mailbox: its hostname copy, its task FIFO
 * and its alias copy.
 *
 * mailbox: the mailbox to release, passed as void * (this function is handed
 *          to xbt_dict_set() in MSG_mailbox_new()).
 *
 * NOTE(review): the end of the body is not visible in this excerpt, so whether
 * the mailbox structure itself is freed here cannot be confirmed.
 */
41 void MSG_mailbox_free(void *mailbox)
43 msg_mailbox_t _mailbox = (msg_mailbox_t) mailbox;
/* NOTE(review): the guard is redundant -- free(NULL) is a no-op in standard C
 * (the alias below is already freed unguarded). */
45 if (_mailbox->hostname)
46 free(_mailbox->hostname);
/* only the FIFO is released here; nothing visible frees the queued tasks */
48 xbt_fifo_free(_mailbox->tasks);
49 free(_mailbox->alias);
/*
 * Accessor for the condition associated with a mailbox.
 * NOTE(review): the body is not visible in this excerpt; presumably it returns
 * the cond field written by MSG_mailbox_set_cond() -- confirm.
 */
54 smx_cond_t MSG_mailbox_get_cond(msg_mailbox_t mailbox)
59 void MSG_mailbox_remove(msg_mailbox_t mailbox, m_task_t task)
61 xbt_fifo_remove(mailbox->tasks, task);
64 int MSG_mailbox_is_empty(msg_mailbox_t mailbox)
66 return (NULL == xbt_fifo_get_first_item(mailbox->tasks));
69 m_task_t MSG_mailbox_pop_head(msg_mailbox_t mailbox)
71 return (m_task_t) xbt_fifo_shift(mailbox->tasks);
/*
 * Returns the task stored in the first item of the mailbox's FIFO; no removal
 * call appears in the visible statements (contrast MSG_mailbox_pop_head()).
 *
 * NOTE(review): the declaration of item and the statement executed when the
 * FIFO has no first item are not visible in this excerpt (presumably the
 * function returns NULL in that case -- confirm).
 */
74 m_task_t MSG_mailbox_get_head(msg_mailbox_t mailbox)
/* no first item: take the (not visible) empty-mailbox branch */
78 if (!(item = xbt_fifo_get_first_item(mailbox->tasks)))
81 return (m_task_t) xbt_fifo_get_item_content(item);
/*
 * Walks the mailbox's task FIFO and, on meeting a task whose source host is
 * host, unlinks that task's item from the FIFO.
 *
 * NOTE(review): the declaration of task and both return statements are not
 * visible in this excerpt; presumably the matching task is returned right
 * after its removal and NULL is returned when nothing matches -- confirm.
 */
85 m_task_t MSG_mailbox_get_first_host_task(msg_mailbox_t mailbox, m_host_t host)
88 xbt_fifo_item_t item = NULL;
90 xbt_fifo_foreach(mailbox->tasks, item, task, m_task_t)
/* a task matches when it was sent from the requested host */
91 if (task->simdata->source == host) {
/* the FIFO is modified while it is being iterated; this is only safe if the
 * loop is left immediately afterwards (the following lines are not visible) */
92 xbt_fifo_remove_item(mailbox->tasks, item);
/*
 * Iterates over the tasks queued in the mailbox and tests, for each one,
 * whether its source host is host.
 *
 * NOTE(review): the return type, the counter declaration, the statement
 * executed on a match and the return statement are not visible in this
 * excerpt; judging by the name, the function counts the matching tasks --
 * confirm against the full file.
 */
100 MSG_mailbox_get_count_host_waiting_tasks(msg_mailbox_t mailbox, m_host_t host)
102 m_task_t task = NULL;
103 xbt_fifo_item_t item = NULL;
106 xbt_fifo_foreach(mailbox->tasks, item, task, m_task_t) {
/* same matching rule as MSG_mailbox_get_first_host_task() */
107 if (task->simdata->source == host)
114 void MSG_mailbox_set_cond(msg_mailbox_t mailbox, smx_cond_t cond)
116 mailbox->cond = cond;
119 const char *MSG_mailbox_get_alias(msg_mailbox_t mailbox)
121 return mailbox->alias;
124 const char *MSG_mailbox_get_hostname(msg_mailbox_t mailbox)
126 return mailbox->hostname;
129 void MSG_mailbox_set_hostname(msg_mailbox_t mailbox, const char *hostname)
131 mailbox->hostname = xbt_strdup(hostname);
/*
 * Looks a mailbox up by alias in the msg_mailboxes dictionary; the visible
 * statements also create and register a new mailbox under that alias and
 * record the current host (MSG_host_self()) as its owner.
 *
 * NOTE(review): the condition guarding the creation and the return statement
 * are not visible in this excerpt; presumably the mailbox is created only
 * when the lookup yields NULL, and the mailbox is returned -- confirm.
 */
134 msg_mailbox_t MSG_mailbox_get_by_alias(const char *alias)
/* NULL when no mailbox is registered under this alias */
137 msg_mailbox_t mailbox = xbt_dict_get_or_null(msg_mailboxes, alias);
140 mailbox = MSG_mailbox_new(alias);
/* a mailbox created here belongs to the host of the calling process */
141 MSG_mailbox_set_hostname(mailbox, MSG_host_self()->name);
/*
 * Returns the mailbox that host associates with a channel number, i.e. the
 * entry of host->simdata->mailboxes at index channel.
 *
 * host:    must not be NULL (asserted).
 * channel: must satisfy 0 <= channel < msg_global->max_channel (asserted).
 *
 * NOTE(review): the last argument line of the second assertion is not visible
 * in this excerpt.
 */
147 msg_mailbox_t MSG_mailbox_get_by_channel(m_host_t host, m_channel_t channel)
149 xbt_assert0((host != NULL), "Invalid host");
150 xbt_assert1((channel >= 0)
151 && (channel < msg_global->max_channel), "Invalid channel %d",
/* the channel number is validated above, so the cast to size_t is safe */
154 return host->simdata->mailboxes[(size_t) channel];
/*
 * Receives a task from mailbox on behalf of the calling process.
 *
 * Visible flow:
 *  1. Under the mutex of h's simdata, obtain a task t from the mailbox (its
 *     head, or the first task coming from host), otherwise park on a freshly
 *     created condition published through MSG_mailbox_set_cond().
 *  2. Once t is obtained, record this process as its receiver, create the
 *     SIMIX communication action and wait on the task's own condition; after
 *     each wake-up the action state and both hosts' states are checked.
 *  3. Drop this side's reference on the action (destroying it when it was the
 *     last one) and decrement the task's refcount.
 *
 * mailbox: mailbox to read from.
 * task:    storage for the result; must be non-NULL (asserted).
 * host:    forwarded to MSG_mailbox_get_first_host_task() to select a task by
 *          its source host.
 * timeout: when > 0, bounds the time spent waiting for a task to show up.
 *
 * Return codes visible in this excerpt (through MSG_RETURN):
 * MSG_TRANSFER_FAILURE and MSG_HOST_FAILURE.
 *
 * NOTE(review): this excerpt omits many lines (return type, braces, the
 * declarations and assignments of t and h, loop and branch headers, the store
 * into *task and the success return). The comments below describe only the
 * statements that are visible.
 */
158 MSG_mailbox_get_task_ext(msg_mailbox_t mailbox, m_task_t * task,
159 m_host_t host, double timeout)
161 m_process_t process = MSG_process_self();
164 simdata_task_t t_simdata = NULL;
165 simdata_host_t h_simdata = NULL;
/* reference point for the elapsed-time check against timeout */
166 double start_time = SIMIX_get_clock();
168 smx_cond_t cond = NULL; //conditional wait if the task isn't on the channel yet
173 xbt_assert0(task, "Null pointer for the task storage");
177 ("MSG_task_get() was asked to write in a non empty task struct.");
181 h_simdata = h->simdata;
/* the mailbox is inspected and modified under this host's mutex */
183 SIMIX_mutex_lock(h->simdata->mutex);
/* a mailbox carries a single condition, so a second waiter is a fatal error */
185 if (MSG_mailbox_get_cond(mailbox)) {
186 CRITICAL1("A process is already blocked on the channel %s",
187 MSG_mailbox_get_alias(mailbox));
188 SIMIX_cond_display_info(MSG_mailbox_get_cond(mailbox));
189 xbt_die("Go fix your code!");
193 /* if the mailbox is not empty (has at least one task) */
194 if (!MSG_mailbox_is_empty(mailbox)) {
196 /* pop the head of the mailbox */
197 t = MSG_mailbox_pop_head(mailbox);
200 /* get the first task of the host */
201 if ((t = MSG_mailbox_get_first_host_task(mailbox, host)))
/* give up once the requested timeout has elapsed since entry */
206 if ((timeout > 0) && (SIMIX_get_clock() - start_time >= timeout)) {
207 SIMIX_mutex_unlock(h->simdata->mutex);
208 MSG_mailbox_set_cond(mailbox, NULL);
209 SIMIX_cond_destroy(cond);
210 MSG_RETURN(MSG_TRANSFER_FAILURE);
/* publish a condition on the mailbox so that a sender can wake this process */
214 cond = SIMIX_cond_init();
215 MSG_mailbox_set_cond(mailbox, cond);
/* NOTE(review): start_time is an absolute clock value (see its initializer),
 * so "timeout - start_time" is not the remaining time; the send path waits for
 * "timeout - time_elapsed" instead. Looks like a bug -- confirm and fix in the
 * full file. */
219 SIMIX_cond_wait_timeout(cond, h->simdata->mutex, timeout - start_time);
221 SIMIX_cond_wait(MSG_mailbox_get_cond(mailbox), h->simdata->mutex);
/* a host state of 0 is reported to the caller as MSG_HOST_FAILURE */
223 if (SIMIX_host_get_state(h_simdata->smx_host) == 0) {
224 SIMIX_mutex_unlock(h->simdata->mutex);
225 MSG_mailbox_set_cond(mailbox, NULL);
226 SIMIX_cond_destroy(cond);
227 MSG_RETURN(MSG_HOST_FAILURE);
232 DEBUG1("OK, got a task (%s)", t->name);
233 /* clean conditional */
235 MSG_mailbox_set_cond(mailbox, NULL);
236 SIMIX_cond_destroy(cond);
239 SIMIX_mutex_unlock(h->simdata->mutex);
/* from here on the work is done on the task itself, under the task's mutex */
241 t_simdata = t->simdata;
242 t_simdata->receiver = process;
245 SIMIX_mutex_lock(t_simdata->mutex);
248 /* create SIMIX action to the communication */
250 SIMIX_action_communicate(t_simdata->sender->simdata->m_host->simdata->
252 process->simdata->m_host->simdata->smx_host,
253 t->name, t_simdata->message_size,
256 /* This is a hack. We know that both the receiver and the sender will
257 need to look at the content of t_simdata->comm. And it needs to be
258 destroyed. However, we don't known whether the receiver or the sender
259 will get to it first. So by setting with refcount to 2 we can enforce
260 that things happen correctly. An alternative would be to only do ++ and
261 -- on this refcount and to sprinkle them judiciously throughout the code,
262 which appears perhaps worse? Or perhaps the refcount field of
263 task->simdata can be used for this? At any rate, this will do for now */
264 t_simdata->comm->refcount = 2;
266 /* if the sender process is suspended, create the action but stop its execution; it will be restarted when the sender process resumes */
267 if (MSG_process_is_suspended(t_simdata->sender)) {
268 DEBUG1("Process sender (%s) suspended", t_simdata->sender->name);
269 SIMIX_action_set_priority(t_simdata->comm, 0);
272 process->simdata->waiting_task = t;
273 SIMIX_register_action_to_condition(t_simdata->comm, t_simdata->cond);
276 SIMIX_cond_wait(t_simdata->cond, t_simdata->mutex);
/* after a wake-up: check the action state and both hosts' states (the
 * statements controlled by these tests are not visible in this excerpt) */
278 if (SIMIX_action_get_state(t_simdata->comm) != SURF_ACTION_RUNNING)
280 if (!SIMIX_host_get_state(h_simdata->smx_host))
282 if (!SIMIX_host_get_state(process->simdata->m_host->simdata->smx_host))
286 SIMIX_unregister_action_to_condition(t_simdata->comm, t_simdata->cond);
287 process->simdata->waiting_task = NULL;
289 /* If sender still around (it didn't free the comm yet), note that it's not waiting anymore */
290 if (t_simdata->comm->refcount == 2) {
291 t->simdata->sender->simdata->waiting_task = NULL;
294 /* for this process, don't need to change in get function */
295 SIMIX_mutex_unlock(t_simdata->mutex);
/* Each of the three outcomes below releases this side's reference on the
 * action (destroying it when the count is 1, otherwise decrementing the
 * count) and decrements the task's refcount. */
298 if (SIMIX_action_get_state(t_simdata->comm) == SURF_ACTION_DONE) {
299 if (t_simdata->comm->refcount == 1) {
300 SIMIX_action_destroy(t_simdata->comm);
301 t_simdata->comm = NULL;
303 t_simdata->comm->refcount--;
305 t_simdata->refcount--;
/* action not DONE and the host checked here is down */
307 } else if (SIMIX_host_get_state(h_simdata->smx_host) == 0) {
308 if (t_simdata->comm->refcount == 1) {
309 SIMIX_action_destroy(t_simdata->comm);
310 t_simdata->comm = NULL;
312 t_simdata->comm->refcount--;
314 t_simdata->refcount--;
315 MSG_RETURN(MSG_HOST_FAILURE);
/* remaining case: reported as a transfer failure */
317 if (t_simdata->comm->refcount == 1) {
318 SIMIX_action_destroy(t_simdata->comm);
319 t_simdata->comm = NULL;
321 t_simdata->comm->refcount--;
323 t_simdata->refcount--;
324 MSG_RETURN(MSG_TRANSFER_FAILURE);
/*
 * Sends task through mailbox on behalf of the calling process.
 *
 * Visible flow:
 *  1. Stamp the task with its sender process and source host, require that
 *     nobody else holds the task (refcount == 1) and take a reference on it.
 *  2. Resolve the host recorded as owner of the mailbox and, under that host's
 *     mutex, push the task into the mailbox FIFO, signalling the condition
 *     attached to the mailbox if there is one.
 *  3. Under the task's mutex, wait on the task's condition (with or without a
 *     timeout); after each wake-up the action state and both hosts' states are
 *     checked.
 *  4. Drop this side's reference on the communication action (destroying it
 *     when it was the last one).
 *
 * Return codes visible in this excerpt (through MSG_RETURN):
 * MSG_TRANSFER_FAILURE and MSG_HOST_FAILURE. A not_found_error is raised with
 * THROW1 (its guard is not visible; presumably when the owner host cannot be
 * found).
 *
 * NOTE(review): this excerpt omits many lines (return type, the remaining
 * parameter(s) -- a timeout value is used below -- braces, the declarations of
 * time, time_elapsed and e, loop/branch/exception headers and the success
 * return). The comments below describe only the statements that are visible.
 */
329 MSG_mailbox_put_with_timeout(msg_mailbox_t mailbox, m_task_t task,
332 m_process_t process = MSG_process_self();
333 const char *hostname;
334 simdata_task_t t_simdata = NULL;
335 m_host_t local_host = NULL;
336 m_host_t remote_host = NULL;
337 smx_cond_t cond = NULL;
341 t_simdata = task->simdata;
342 t_simdata->sender = process;
343 t_simdata->source = MSG_process_get_host(process);
345 xbt_assert0(t_simdata->refcount == 1,
346 "This task is still being used somewhere else. You cannot send it now. Go fix your code!");
/* no communication action exists until the receiver creates one */
348 t_simdata->comm = NULL;
350 t_simdata->refcount++;
351 local_host = ((simdata_process_t) process->simdata)->m_host;
352 msg_global->sent_msg++;
354 /* get the host name containing the mailbox */
355 hostname = MSG_mailbox_get_hostname(mailbox);
357 remote_host = MSG_get_host_by_name(hostname);
/* NOTE(review): "fount" in the message below is a typo for "found"; it is a
 * runtime string, so it is left untouched here. */
360 THROW1(not_found_error, 0, "Host %s not fount", hostname);
363 DEBUG4("Trying to send a task (%g kB) from %s to %s on the channel %s",
364 t_simdata->message_size / 1000, local_host->name,
365 remote_host->name, MSG_mailbox_get_alias(mailbox));
/* the mailbox is modified under the mutex of the host that owns it */
367 SIMIX_mutex_lock(remote_host->simdata->mutex);
369 /* put the task in the mailbox */
370 xbt_fifo_push(mailbox->tasks, task);
/* a non-NULL mailbox condition means a receiver is parked on it */
372 if ((cond = MSG_mailbox_get_cond(mailbox))) {
373 DEBUG0("Somebody is listening. Let's wake him up!");
374 SIMIX_cond_signal(cond);
377 SIMIX_mutex_unlock(remote_host->simdata->mutex);
/* from here on the work is done on the task itself, under the task's mutex */
379 SIMIX_mutex_lock(t_simdata->mutex);
381 process->simdata->waiting_task = task;
/* timed variant: remember when the wait started */
387 time = SIMIX_get_clock();
390 /* check that the action that ended is the right one; call wait_timeout with the remaining time. If the timeout occurs, an exception is raised */
392 time_elapsed = SIMIX_get_clock() - time;
393 SIMIX_cond_wait_timeout(t_simdata->cond, t_simdata->mutex,
394 timeout - time_elapsed);
/* after a wake-up: check the action state (once an action exists) and both
 * hosts' states (the statements controlled by these tests are not visible) */
396 if ((t_simdata->comm != NULL)
397 && (SIMIX_action_get_state(t_simdata->comm) !=
398 SURF_ACTION_RUNNING))
400 if (!SIMIX_host_get_state(local_host->simdata->smx_host))
402 if (!SIMIX_host_get_state(remote_host->simdata->smx_host))
407 if (e.category == timeout_error) {
409 /* check whether the timeout happened before the communication started */
410 if (t_simdata->comm == NULL) {
411 process->simdata->waiting_task = NULL;
413 /* remove the task from the mailbox */
414 MSG_mailbox_remove(mailbox, task);
416 if (t_simdata->receiver && t_simdata->receiver->simdata) { /* receiver still around */
417 t_simdata->receiver->simdata->waiting_task = NULL;
420 SIMIX_mutex_unlock(t_simdata->mutex);
421 MSG_RETURN(MSG_TRANSFER_FAILURE);
/* untimed variant: plain wait followed by the same three checks */
429 SIMIX_cond_wait(t_simdata->cond, t_simdata->mutex);
431 if (SIMIX_action_get_state(t_simdata->comm) != SURF_ACTION_RUNNING)
433 if (!SIMIX_host_get_state(local_host->simdata->smx_host))
435 if (!SIMIX_host_get_state(remote_host->simdata->smx_host))
440 DEBUG1("Action terminated %s", task->name);
441 process->simdata->waiting_task = NULL;
443 if (t_simdata->comm->refcount == 2) { //receiver didn't free it yet: he's still around
444 t_simdata->receiver->simdata->waiting_task = NULL;
447 SIMIX_mutex_unlock(task->simdata->mutex);
/* Each of the three outcomes below releases this side's reference on the
 * action: destroy it when the count is 1, otherwise decrement the count. */
449 if (SIMIX_action_get_state(t_simdata->comm) == SURF_ACTION_DONE) {
450 if (t_simdata->comm->refcount == 1) {
451 SIMIX_action_destroy(t_simdata->comm);
452 t_simdata->comm = NULL;
454 t_simdata->comm->refcount--;
/* action not DONE and the local host is down */
457 } else if (SIMIX_host_get_state(local_host->simdata->smx_host) == 0) {
458 if (t_simdata->comm->refcount == 1) {
459 SIMIX_action_destroy(t_simdata->comm);
460 t_simdata->comm = NULL;
462 t_simdata->comm->refcount--;
464 MSG_RETURN(MSG_HOST_FAILURE);
/* remaining case: reported as a transfer failure */
466 if (t_simdata->comm->refcount == 1) {
467 SIMIX_action_destroy(t_simdata->comm);
468 t_simdata->comm = NULL;
470 t_simdata->comm->refcount--;
472 MSG_RETURN(MSG_TRANSFER_FAILURE);