-#include <stdio.h>
+/* Copyright (c) 2007, 2008, 2009, 2010. The SimGrid Team.
+ * All rights reserved. */
-#include "private.h"
+/* This program is free software; you can redistribute it and/or modify it
+ * under the terms of the license (GNU LGPL) which comes with this package. */
-XBT_LOG_NEW_DEFAULT_SUBCATEGORY(smpi, XBT_LOG_ROOT_CAT, "All SMPI categories");
+#include <stdint.h>
+#include <stdlib.h>
-smpi_global_t smpi_global = NULL;
+#include "private.h"
+#include "smpi_mpi_dt_private.h"
+#include "mc/mc.h"
-void *smpi_request_new(void);
+XBT_LOG_NEW_CATEGORY(smpi, "All SMPI categories"); /* declares the log category named smpi */
-void *smpi_request_new()
-{
- smpi_mpi_request_t request = xbt_new(s_smpi_mpi_request_t, 1);
+XBT_LOG_NEW_DEFAULT_SUBCATEGORY(smpi_kernel, smpi,
+ "Logging specific to SMPI (kernel)"); /* smpi_kernel is declared under smpi; presumably the category the DEBUGn/INFOn calls of this file log to - confirm against the xbt log API */
- request->buf = NULL;
- request->completed = 0;
- request->mutex = SIMIX_mutex_init();
- request->cond = SIMIX_cond_init();
- request->data = NULL;
- request->forward = 0;
+typedef struct s_smpi_process_data { /* SMPI state kept for one process; smpi_global_init allocates one per entry of process_data */
+ int index; /* position of this record in process_data (set by smpi_global_init) */
+ int* argc; /* argc pointer registered by smpi_process_init; NULL until then */
+ char*** argv; /* argv pointer registered by smpi_process_init; NULL until then */
+ xbt_fifo_t pending_sent; /* sends addressed to this process that found no matching receive yet */
+ xbt_fifo_t pending_recv; /* receives posted by this process that found no matching send yet */
+ xbt_os_timer_t timer; /* created by smpi_global_init, returned by smpi_process_timer() */
+ double simulated; /* SIMIX clock value stored by smpi_process_simulated_start() */
+ MPI_Comm comm_self; /* communicator built by smpi_global_init on a group created with smpi_group_new(1) */
+} s_smpi_process_data_t;
- return request;
-}
+static smpi_process_data_t *process_data = NULL; /* table of per-process records; allocated by smpi_global_init, freed by smpi_global_destroy */
+static int process_count = 0; /* number of records smpi_global_init put in process_data */
-void smpi_request_free(void *pointer);
+MPI_Comm MPI_COMM_WORLD = MPI_COMM_NULL; /* assigned by smpi_global_init, reset to MPI_COMM_NULL by smpi_global_destroy */
-void smpi_request_free(void *pointer)
+/* Attach the calling SIMIX process to its SMPI record and strip the index
+ * argument from its command line.
+ *
+ * argc, argv: the process's own argument count/vector. (*argv)[1] must be the
+ *   decimal index of the process in process_data; it is consumed here so the
+ *   rest of the program only sees its own arguments. Both pointers are kept
+ *   in the record for smpi_process_argc() and smpi_process_getarg().
+ *
+ * Does nothing when argc or argv is NULL. Aborts when the index argument is
+ * missing, is not a number, or does not designate an existing record. */
+void smpi_process_init(int *argc, char ***argv)
{
+  int index;
+  long parsed;
+  char *end;
+  smpi_process_data_t data;
+  smx_process_t proc;
+
+  if(argc && argv) {
+    /* Never read (*argv)[1] unless the vector really has it. */
+    if (*argc < 2 || !(*argv)[1]) {
+      abort();
+    }
+    parsed = strtol((*argv)[1], &end, 10);
+    /* atoi() would silently turn garbage into index 0; also keep the index
+     * inside process_data before it is used as a subscript. */
+    if (end == (*argv)[1] || *end != '\0'
+        || parsed < 0 || parsed >= process_count) {
+      abort();
+    }
+    index = (int) parsed;
+    proc = SIMIX_process_self();
+    data = smpi_process_remote_data(index);
+    SIMIX_process_set_data(proc, data);
+    /* Remove the index argument. This also covers *argc == 2, where the
+     * memmove is empty and the slot simply becomes the NULL terminator. */
+    free((*argv)[1]);
+    memmove(&(*argv)[1], &(*argv)[2], sizeof(char *) * (*argc - 2));
+    (*argv)[(*argc) - 1] = NULL;
+    (*argc)--;
+    data->argc = argc;
+    data->argv = argv;
+    DEBUG2("<%d> New process in the game: %p", index, proc);
+  }
+}
- smpi_mpi_request_t request = pointer;
-
- SIMIX_cond_destroy(request->cond);
- SIMIX_mutex_destroy(request->mutex);
- xbt_free(request);
+void smpi_process_destroy(void) /* only emits a debug message for the calling process; nothing is released here */
+{
+ int index = smpi_process_index();
- return;
+ DEBUG1("<%d> Process left the game", index);
}
-void smpi_request_reset(void *pointer);
-
-void smpi_request_reset(void *pointer)
-{
- smpi_mpi_request_t request = pointer;
+int smpi_process_argc(void) { /* registered argc of the calling process minus one */
+ smpi_process_data_t data = smpi_process_data();
- request->buf = NULL;
- request->completed = 0;
- request->data = NULL;
- request->forward = 0;
+ return data->argc ? *(data->argc) - 1 : 0; /* 0 when no argc pointer was registered by smpi_process_init */
+}
- return;
+int smpi_process_getarg(integer* index, char* dst, ftnlen len) { /* copies argument number *index into dst, blank-padded to len characters; returns 0, or -1 if the argument is unavailable */
+ smpi_process_data_t data = smpi_process_data();
+ char* arg;
+ size_t i;
+
+ if(!data->argc || !data->argv
+ || *index < 1 || *index >= *(data->argc)) { /* no registered vector, or index outside 1 .. argc-1 (index 0 is refused as well) */
+ return -1;
+ }
+ arg = (*data->argv)[*index];
+ for(i = 0; i < len && arg[i] != '\0'; i++) { /* copy at most len characters; NOTE(review): i is size_t while len is ftnlen - confirm len can never be negative */
+ dst[i] = arg[i];
+ }
+ for(; i < len; i++) { /* fill the remainder with blanks; no NUL terminator is written to dst */
+ dst[i] = ' ';
+ }
+ return 0;
}
+int smpi_global_rank(void) { /* returns the same value as smpi_process_index() */
+ return smpi_process_index();
+}
-void *smpi_message_new(void);
+int smpi_global_size(void) { /* value of the SMPI_GLOBAL_SIZE environment variable, converted with atoi */
+ char* value = getenv("SMPI_GLOBAL_SIZE");
-void *smpi_message_new()
-{
- smpi_received_message_t message = xbt_new(s_smpi_received_message_t, 1);
- message->buf = NULL;
- return message;
+ if(!value) { /* variable not set: the program is aborted, there is no fallback value */
+ abort();
+ }
+ return atoi(value); /* NOTE(review): atoi gives no indication when the text is not a number */
}
-void smpi_message_free(void *pointer);
-
-void smpi_message_free(void *pointer)
+smpi_process_data_t smpi_process_data(void) /* data pointer attached to the calling SIMIX process (smpi_process_init stores the SMPI record there) */
{
- xbt_free(pointer);
- return;
+ return SIMIX_process_get_data(SIMIX_process_self());
}
-void smpi_message_reset(void *pointer);
-
-void smpi_message_reset(void *pointer)
+smpi_process_data_t smpi_process_remote_data(int index) /* record stored at process_data[index], for any process */
{
- smpi_received_message_t message = pointer;
- message->buf = NULL;
- return;
+ return process_data[index]; /* index is not range-checked here */
}
-int smpi_create_request(void *buf, int count, smpi_mpi_datatype_t datatype,
- int src, int dst, int tag, smpi_mpi_communicator_t comm, smpi_mpi_request_t *requestptr)
+int smpi_process_count(void) /* current value of process_count (0 until smpi_global_init sets it) */
{
- int retval = MPI_SUCCESS;
-
- smpi_mpi_request_t request = NULL;
-
- // parameter checking prob belongs in smpi_mpi, but this is less repeat code
- if (NULL == buf) {
- retval = MPI_ERR_INTERN;
- } else if (0 > count) {
- retval = MPI_ERR_COUNT;
- } else if (NULL == datatype) {
- retval = MPI_ERR_TYPE;
- } else if (MPI_ANY_SOURCE != src && (0 > src || comm->size <= src)) {
- retval = MPI_ERR_RANK;
- } else if (0 > dst || comm->size <= dst) {
- retval = MPI_ERR_RANK;
- } else if (MPI_ANY_TAG != tag && 0 > tag) {
- retval = MPI_ERR_TAG;
- } else if (NULL == comm) {
- retval = MPI_ERR_COMM;
- } else if (NULL == requestptr) {
- retval = MPI_ERR_ARG;
- } else {
- request = xbt_mallocator_get(smpi_global->request_mallocator);
- request->comm = comm;
- request->src = src;
- request->dst = dst;
- request->tag = tag;
- request->buf = buf;
- request->datatype = datatype;
- request->count = count;
-
- *requestptr = request;
- }
- return retval;
+ return process_count;
}
-void smpi_global_init()
+int smpi_process_index(void) /* index field of the calling process's record */
{
- int i;
-
- int size = SIMIX_host_get_number();
-
- smpi_global = xbt_new(s_smpi_global_t, 1);
-
- // config variable
- smpi_global->reference_speed = SMPI_DEFAULT_SPEED;
-
- smpi_global->root_ready = 0;
- smpi_global->ready_process_count = 0;
+ smpi_process_data_t data = smpi_process_data();
- // start/stop
- smpi_global->start_stop_mutex = SIMIX_mutex_init();
- smpi_global->start_stop_cond = SIMIX_cond_init();
+ return data->index; /* data is dereferenced without a NULL check */
+}
- // host info blank until sim starts
- // FIXME: is this okay?
- smpi_global->hosts = NULL;
- smpi_global->host_count = 0;
+xbt_os_timer_t smpi_process_timer(void) /* timer field of the calling process's record */
+{
+ smpi_process_data_t data = smpi_process_data();
- // running hosts
- smpi_global->running_hosts_count_mutex = SIMIX_mutex_init();
- smpi_global->running_hosts_count = 0;
+ return data->timer;
+}
- // mallocators
- smpi_global->request_mallocator = xbt_mallocator_new(SMPI_REQUEST_MALLOCATOR_SIZE,
- smpi_request_new, smpi_request_free, smpi_request_reset);
- smpi_global->message_mallocator = xbt_mallocator_new(SMPI_MESSAGE_MALLOCATOR_SIZE,
- smpi_message_new, smpi_message_free, smpi_message_reset);
+void smpi_process_simulated_start(void) /* stores the current SIMIX clock in the calling process's record */
+{
+ smpi_process_data_t data = smpi_process_data();
- // queues
- smpi_global->pending_send_request_queues = xbt_new(xbt_fifo_t, size);
- smpi_global->pending_send_request_queues_mutexes = xbt_new(smx_mutex_t, size);
- smpi_global->pending_recv_request_queues = xbt_new(xbt_fifo_t, size);
- smpi_global->pending_recv_request_queues_mutexes = xbt_new(smx_mutex_t, size);
- smpi_global->received_message_queues = xbt_new(xbt_fifo_t, size);
- smpi_global->received_message_queues_mutexes = xbt_new(smx_mutex_t, size);
+ data->simulated = SIMIX_get_clock(); /* reference point read back by smpi_process_simulated_elapsed() */
+}
- // sender/receiver processes
- smpi_global->sender_processes = xbt_new(smx_process_t, size);
- smpi_global->receiver_processes = xbt_new(smx_process_t, size);
+double smpi_process_simulated_elapsed(void) /* SIMIX clock difference since the last smpi_process_simulated_start() of the calling process */
+{
+ smpi_process_data_t data = smpi_process_data();
- // timers
- smpi_global->timer = xbt_os_timer_new();
- smpi_global->timer_mutex = SIMIX_mutex_init();
- smpi_global->timer_cond = SIMIX_cond_init();
+ return SIMIX_get_clock() - data->simulated;
+}
- smpi_global->times_max = 0;
- smpi_global->times_mutex = SIMIX_mutex_init();
+MPI_Comm smpi_process_comm_self(void) /* comm_self field of the calling process's record */
+{
+ smpi_process_data_t data = smpi_process_data();
- smpi_global->execute_mutex = SIMIX_mutex_init();
- smpi_global->execute_cond = SIMIX_cond_init();
+ return data->comm_self;
+}
- for (i = 0; i < size; i++) {
- smpi_global->pending_send_request_queues[i] = xbt_fifo_new();
- smpi_global->pending_send_request_queues_mutexes[i] = SIMIX_mutex_init();
- smpi_global->pending_recv_request_queues[i] = xbt_fifo_new();
- smpi_global->pending_recv_request_queues_mutexes[i] = SIMIX_mutex_init();
- smpi_global->received_message_queues[i] = xbt_fifo_new();
- smpi_global->received_message_queues_mutexes[i] = SIMIX_mutex_init();
- }
+void print_request(const char *message, MPI_Request request) /* debug-logs message together with the pointers and fields of request */
+{
+ char *req =
+ bprintf
+ ("[buf = %p, size = %zu, src = %d, dst = %d, tag= %d, complete = %d, flags = %u]",
+ request->buf, request->size, request->src, request->dst,
+ request->tag, request->complete, request->flags);
+
+ DEBUG5("%s (request %p with rdv %p and match %p) %s",
+ message, request, request->rdv, request->match, req);
+ free(req); /* the string returned by bprintf is released here */
+}
- for (i = 0; i < SMPI_MAX_TIMES; i++) {
- smpi_global->times[i] = -1.0;
- }
+void smpi_process_post_send(MPI_Comm comm, MPI_Request request) /* pairs a send with a receive already pending at the destination, or queues the send there */
+{
+ int index = smpi_group_index(smpi_comm_group(comm), request->dst); /* request->dst is looked up in comm's group to get the process_data index */
+ smpi_process_data_t data = smpi_process_remote_data(index); /* record of the destination process */
+ xbt_fifo_item_t item;
+ MPI_Request req;
+
+ print_request("Isend", request);
+ xbt_fifo_foreach(data->pending_recv, item, req, MPI_Request) { /* first pending receive that accepts this send wins */
+ if (req->comm == request->comm
+ && (req->src == MPI_ANY_SOURCE || req->src == request->src)
+ && (req->tag == MPI_ANY_TAG || req->tag == request->tag)) {
+ print_request("Match found", req);
+ xbt_fifo_remove_item(data->pending_recv, item);
+ /* Replace the receive's possibly wildcard source/tag with the sender's actual values */
+ req->src = request->src;
+ req->tag = request->tag;
+ req->match = request;
+ request->rdv = req->rdv; /* the send reuses the rendez-vous created when the receive was queued */
+ request->match = req;
+ return;
+ }
+ }
+ request->rdv = SIMIX_rdv_create(NULL); /* no receive matched: create a rendez-vous and wait in the destination's pending_sent */
+ xbt_fifo_push(data->pending_sent, request);
+}
+void smpi_process_post_recv(MPI_Request request) /* pairs a receive with a send already pending for the calling process, or queues the receive */
+{
+ smpi_process_data_t data = smpi_process_data(); /* record of the calling (receiving) process */
+ xbt_fifo_item_t item;
+ MPI_Request req;
+
+ print_request("Irecv", request);
+ xbt_fifo_foreach(data->pending_sent, item, req, MPI_Request) { /* first pending send accepted by this receive wins */
+ if (req->comm == request->comm
+ && (request->src == MPI_ANY_SOURCE || req->src == request->src)
+ && (request->tag == MPI_ANY_TAG || req->tag == request->tag)) {
+ print_request("Match found", req);
+ xbt_fifo_remove_item(data->pending_sent, item);
+ /* Replace the receive's possibly wildcard source/tag with the matched send's actual values */
+ req->match = request;
+ request->src = req->src;
+ request->tag = req->tag;
+ request->rdv = req->rdv; /* the receive reuses the rendez-vous created when the send was queued */
+ request->match = req;
+ return;
+ }
+ }
+ request->rdv = SIMIX_rdv_create(NULL); /* no send matched: create a rendez-vous and wait in pending_recv */
+ xbt_fifo_push(data->pending_recv, request);
}
-void smpi_global_destroy()
+/* Allocate the SMPI record of every SIMIX process and build the
+ * communicators: one comm_self per process plus MPI_COMM_WORLD over all of
+ * them. The number of records comes from SIMIX_process_count(), so the
+ * processes have to exist already when this is called. */
+void smpi_global_init(void)
{
- int i;
-
- int size = SIMIX_host_get_number();
-
- // start/stop
- SIMIX_mutex_destroy(smpi_global->start_stop_mutex);
- SIMIX_cond_destroy(smpi_global->start_stop_cond);
-
- // processes
- xbt_free(smpi_global->sender_processes);
- xbt_free(smpi_global->receiver_processes);
-
- // running hosts
- SIMIX_mutex_destroy(smpi_global->running_hosts_count_mutex);
-
- // mallocators
- xbt_mallocator_free(smpi_global->request_mallocator);
- xbt_mallocator_free(smpi_global->message_mallocator);
-
- xbt_os_timer_free(smpi_global->timer);
- SIMIX_mutex_destroy(smpi_global->timer_mutex);
- SIMIX_cond_destroy(smpi_global->timer_cond);
- SIMIX_mutex_destroy(smpi_global->times_mutex);
- SIMIX_mutex_destroy(smpi_global->execute_mutex);
- SIMIX_cond_destroy(smpi_global->execute_cond);
-
- for(i = 0; i < size; i++) {
- xbt_fifo_free(smpi_global->pending_send_request_queues[i]);
- SIMIX_mutex_destroy(smpi_global->pending_send_request_queues_mutexes[i]);
- xbt_fifo_free(smpi_global->pending_recv_request_queues[i]);
- SIMIX_mutex_destroy(smpi_global->pending_recv_request_queues_mutexes[i]);
- xbt_fifo_free(smpi_global->received_message_queues[i]);
- SIMIX_mutex_destroy(smpi_global->received_message_queues_mutexes[i]);
- }
-
- xbt_free(smpi_global->pending_send_request_queues);
- xbt_free(smpi_global->pending_send_request_queues_mutexes);
- xbt_free(smpi_global->pending_recv_request_queues);
- xbt_free(smpi_global->pending_recv_request_queues_mutexes);
- xbt_free(smpi_global->received_message_queues);
- xbt_free(smpi_global->received_message_queues_mutexes);
-
- xbt_free(smpi_global);
-
- smpi_global = NULL;
+  int i;
+  MPI_Group group;
+
+  SIMIX_network_set_copy_data_callback
+      (&SIMIX_network_copy_buffer_callback);
+  process_count = SIMIX_process_count();
+  process_data = xbt_new(smpi_process_data_t, process_count);
+  for (i = 0; i < process_count; i++) {
+    process_data[i] = xbt_new(s_smpi_process_data_t, 1);
+    process_data[i]->index = i;
+    process_data[i]->argc = NULL;
+    process_data[i]->argv = NULL;
+    process_data[i]->pending_sent = xbt_fifo_new();
+    process_data[i]->pending_recv = xbt_fifo_new();
+    process_data[i]->timer = xbt_os_timer_new();
+    /* Every other field is set explicitly because xbt_new (unlike xbt_new0)
+     * hands back uncleared memory; give the clock sample a defined value too
+     * so smpi_process_simulated_elapsed() never reads an indeterminate one. */
+    process_data[i]->simulated = 0.0;
+    /* comm_self: a communicator over a one-member group for process i. */
+    group = smpi_group_new(1);
+    process_data[i]->comm_self = smpi_comm_new(group);
+    smpi_group_set_mapping(group, i, 0);
+  }
+  /* MPI_COMM_WORLD: one group entry per process, mapped i -> i. */
+  group = smpi_group_new(process_count);
+  MPI_COMM_WORLD = smpi_comm_new(group);
+  for (i = 0; i < process_count; i++) {
+    smpi_group_set_mapping(group, i, i);
+  }
}
-int smpi_host_index()
+/* Release what smpi_global_init() created: MPI_COMM_WORLD, then for every
+ * process its comm_self, timer and both pending-request queues, and finally
+ * the record table itself. The file-level state is put back to its initial
+ * values (MPI_COMM_NULL, NULL, 0). */
+void smpi_global_destroy(void)
{
- smx_host_t host = SIMIX_host_self();
- smpi_host_data_t hdata = (smpi_host_data_t)SIMIX_host_get_data(host);
+  int count = smpi_process_count();
+  int i;
+
+  smpi_bench_destroy();
+  smpi_comm_destroy(MPI_COMM_WORLD);
+  MPI_COMM_WORLD = MPI_COMM_NULL;
+  for (i = 0; i < count; i++) {
+    smpi_comm_destroy(process_data[i]->comm_self);
+    xbt_os_timer_free(process_data[i]->timer);
+    xbt_fifo_free(process_data[i]->pending_recv);
+    xbt_fifo_free(process_data[i]->pending_sent);
+    xbt_free(process_data[i]);
+  }
+  xbt_free(process_data);
+  process_data = NULL;
+  /* Keep the count in step with the now empty table, so that
+   * smpi_process_count() cannot advertise records that were just freed. */
+  process_count = 0;
+}
- return hdata->index;
+/* Fortran specific stuff */
+/* With smpicc, the following weak symbols are used */
+/* With smpiff, the following weak symbols are replaced by those in libf2c */
+int __attribute__((weak)) xargc; /* argument count; assigned by the weak main() of this file and read by MAIN__ */
+char** __attribute__((weak)) xargv; /* argument vector; assigned by the weak main() of this file and read by MAIN__ */
+
+int __attribute__((weak)) main(int argc, char** argv) { /* weak entry point: publishes argc/argv through xargc/xargv, then returns whatever MAIN__ returns */
+ xargc = argc;
+ xargv = argv;
+ return MAIN__();
}
-int smpi_run_simulation(int *argc, char **argv)
+int MAIN__(void) /* simulator driver: registers the smpi/ options, loads the files named in xargv, runs the simulation to completion, cleans up; always returns 0 */
{
- xbt_fifo_item_t cond_item = NULL;
- smx_cond_t cond = NULL;
- xbt_fifo_item_t action_item = NULL;
- smx_action_t action = NULL;
+ srand(SMPI_RAND_SEED); /* rand() is seeded with SMPI_RAND_SEED on every run */
+
+ double default_reference_speed = 20000.0; /* default for smpi/running_power */
+ xbt_cfg_register(&_surf_cfg_set, "smpi/running_power",
+ "Power of the host running the simulation (in flop/s). Used to bench the operations.",
+ xbt_cfgelm_double, &default_reference_speed, 1, 1, NULL,
+ NULL);
- xbt_fifo_t actions_failed = xbt_fifo_new();
- xbt_fifo_t actions_done = xbt_fifo_new();
+ int default_display_timing = 0; /* default for smpi/display_timing, which gates the final INFO1 below */
+ xbt_cfg_register(&_surf_cfg_set, "smpi/display_timing",
+ "Boolean indicating whether we should display the timing after simulation.",
+ xbt_cfgelm_int, &default_display_timing, 1, 1, NULL,
+ NULL);
- srand(SMPI_RAND_SEED);
+ int default_display_smpe = 0; /* default for smpi/log_events */
+ xbt_cfg_register(&_surf_cfg_set, "smpi/log_events",
+ "Boolean indicating whether we should display simulated time spent in MPI calls.",
+ xbt_cfgelm_int, &default_display_smpe, 1, 1, NULL,
+ NULL);
- SIMIX_global_init(argc, argv);
+ double default_threshold = 1e-6; /* default for smpi/cpu_threshold */
+ xbt_cfg_register(&_surf_cfg_set, "smpi/cpu_threshold",
+ "Minimal computation time (in seconds) not discarded.",
+ xbt_cfgelm_double, &default_threshold, 1, 1, NULL,
+ NULL);
- SIMIX_function_register("smpi_simulated_main", smpi_simulated_main);
- SIMIX_function_register("smpi_sender", smpi_sender);
- SIMIX_function_register("smpi_receiver", smpi_receiver);
+#ifdef HAVE_TRACING
+ TRACE_global_init(&xargc, xargv);
+#endif
- // FIXME: ought to verify these files...
- SIMIX_create_environment(argv[1]);
+ SIMIX_global_init(&xargc, xargv); /* the options above are registered before this call */
- // must initialize globals between creating environment and launching app....
- smpi_global_init();
+#ifdef HAVE_TRACING
+ TRACE_smpi_start();
+#endif
- SIMIX_launch_application(argv[2]);
+ // parse the platform file: get the host list
+ SIMIX_create_environment(xargv[1]); /* NOTE(review): xargv[1] and xargv[2] are used without checking xargc - confirm every launcher passes both files */
- /* Prepare to display some more info when dying on Ctrl-C pressing */
- // FIXME: doesn't work
- //signal(SIGINT, inthandler);
+ SIMIX_function_register("smpi_simulated_main", smpi_simulated_main);
+ SIMIX_launch_application(xargv[2]); /* presumably the deployment file - confirm */
- /* Clean IO before the run */
- fflush(stdout);
- fflush(stderr);
+ smpi_global_init(); /* placed after the launch: it sizes process_data from SIMIX_process_count() */
- while (SIMIX_solve(actions_done, actions_failed) != -1.0) {
- xbt_fifo_foreach(actions_failed, action_item, action, smx_action_t) {
- DEBUG1("** %s failed **", action->name);
- xbt_fifo_foreach(action->cond_list, cond_item, cond, smx_cond_t) {
- SIMIX_cond_broadcast(cond);
- }
- }
- xbt_fifo_foreach(actions_done, action_item, action, smx_action_t) {
- DEBUG1("** %s done **",action->name);
- xbt_fifo_foreach(action->cond_list, cond_item, cond, smx_cond_t) {
- SIMIX_cond_broadcast(cond);
- }
- }
- }
+ /* Clean IO before the run */
+ fflush(stdout);
+ fflush(stderr);
+ SIMIX_init();
- // FIXME: cleanup incomplete
- xbt_fifo_free(actions_failed);
- xbt_fifo_free(actions_done);
+#ifdef HAVE_MC
+ if (_surf_do_model_check)
+ MC_modelcheck(1);
+ else
+#endif
+ while (SIMIX_solve(NULL, NULL) != -1.0); /* empty body: keep stepping until SIMIX_solve returns -1.0; with HAVE_MC this loop is the else branch above */
- INFO1("simulation time %g", SIMIX_get_clock());
+ if (xbt_cfg_get_int(_surf_cfg_set, "smpi/display_timing"))
+ INFO1("simulation time %g", SIMIX_get_clock());
- smpi_global_destroy();
+ smpi_global_destroy();
- SIMIX_clean();
+#ifdef HAVE_TRACING
+ TRACE_smpi_release();
+#endif
- return 0;
+ SIMIX_clean();
+ return 0;
}