#include "src/internal_config.h"
#include "private.h"
#include "private.hpp"
+#include <xbt/ex.hpp>
#include "xbt/dict.h"
#include "xbt/sysdep.h"
#include "xbt/ex.h"
#include "simgrid/modelchecker.h"
#include "src/mc/mc_replay.h"
+#include <sys/types.h>
#ifndef WIN32
#include <sys/mman.h>
#endif
#include <sys/stat.h>
-#include <sys/types.h>
#include <errno.h>
#include <fcntl.h>
#include <math.h> // sqrt
#include <string.h>
#include <stdio.h>
+#if HAVE_PAPI
+#include <papi.h>
+#endif
+
#ifndef MAP_ANONYMOUS
#define MAP_ANONYMOUS MAP_ANON
#endif
xbt_dict_t calls = nullptr; /* Allocated on first use */
double smpi_cpu_threshold;
-double smpi_running_power;
+double smpi_host_speed;
int smpi_loaded_page = -1;
char* smpi_start_data_exe = nullptr;
class smpi_source_location {
public:
smpi_source_location(const char* filename, int line)
- : filename(filename), filename_length(strlen(filename)), line(line) {}
+ : filename(xbt_strdup(filename)), filename_length(strlen(filename)), line(line) {}
/** Copy of the file name, duplicated with xbt_strdup() in the constructor */
- const char* filename = nullptr;
+ char* filename = nullptr;
int filename_length = 0;
int line = 0;
mem = mmap(nullptr, size, PROT_READ | PROT_WRITE, MAP_SHARED, fd, 0);
if(mem == MAP_FAILED) {
- xbt_die("Could not map fd %d: %s", fd, strerror(errno));
+ xbt_die("Could not map fd %d with size %zu: %s.\n If you are running a lot of processes, you may be exceeding the amount of mappings allowed per process. \n On linux systems, this value can be set by using sudo sysctl -w vm.max_map_count=newvalue .\n Default value is 65536", fd, size, strerror(errno));
}
snprintf(loc, PTR_STRLEN, "%p", mem);
meta.size = size;
}
#endif
/** Drop the shared-allocation bookkeeping by emptying both `allocs` and `allocs_metadata`. */
-void smpi_bench_destroy(void)
+void smpi_bench_destroy()
{
allocs.clear();
allocs_metadata.clear();
}
/**
 * Inject a computation of `flops` floating-point operations for the calling process.
 *
 * Starts an execution activity named "computation", attaches the SMPI tracing
 * category to it, waits on it with simcall_execution_wait(), and then calls
 * smpi_switch_data_segment() with the current process index.
 *
 * @param flops amount of work passed to simcall_execution_start()
 */
void smpi_execute_flops(double flops) {
-smx_synchro_t action;
XBT_DEBUG("Handle real computation time: %f flops", flops);
-action = simcall_execution_start("computation", flops, 1, 0, 0);
+ smx_activity_t action = simcall_execution_start("computation", flops, 1, 0);
simcall_set_category (action, TRACE_internal_smpi_get_category());
simcall_execution_wait(action);
smpi_switch_data_segment(smpi_process_index());
{
if (duration >= smpi_cpu_threshold) {
XBT_DEBUG("Sleep for %g to handle real computation time", duration);
- double flops = duration * smpi_running_power;
+ double flops = duration * smpi_host_speed;
int rank = smpi_process_index();
instr_extra_data extra = xbt_new0(s_instr_extra_data_t,1);
extra->type=TRACING_COMPUTING;
extra->comp_size=flops;
TRACE_smpi_computing_in(rank, extra);
+
smpi_execute_flops(flops);
TRACE_smpi_computing_out(rank);
}
}
/**
 * Begin a benchmarked section for the calling process.
 *
 * When smpi_privatize_global_variables is set, switches to the data segment of the
 * current process index. Returns early, without starting any measurement, when the
 * model checker or record/replay is active. With PAPI compiled in and a non-empty
 * "smpi/papi-events" setting, starts the process's PAPI event set and dies if that
 * fails. Finally starts the per-process thread timer.
 *
 * NOTE(review): the closing brace of the first `if` is not visible in this excerpt;
 * the description above assumes it closes right after the segment switch -- confirm.
 */
-void smpi_bench_begin(void)
+void smpi_bench_begin()
{
if (smpi_privatize_global_variables) {
smpi_switch_data_segment(smpi_process_index());
if (MC_is_active() || MC_record_replay_is_active())
return;
+#if HAVE_PAPI
// Counters are only used when the "smpi/papi-events" option is a non-empty string.
+ if (xbt_cfg_get_string("smpi/papi-events")[0] != '\0') {
+ int event_set = smpi_process_papi_event_set();
+ // PAPI_start sets everything to 0! See man(3) PAPI_start
// Skip PAPI_start unless the library reports low-level initialization.
+ if (PAPI_LOW_LEVEL_INITED == PAPI_is_initialized()) {
+ if (PAPI_start(event_set) != PAPI_OK) {
+ // TODO This needs some proper handling.
+ XBT_CRITICAL("Could not start PAPI counters.\n");
+ xbt_die("Error.");
+ }
+ }
+ }
+#endif
xbt_os_threadtimer_start(smpi_process_timer());
}
/**
 * End the benchmarked section of the calling process and account for the measured time.
 *
 * Does nothing when the model checker or record/replay is active. Otherwise stops the
 * per-process thread timer. With PAPI compiled in and "smpi/papi-events" non-empty, it
 * stops the PAPI event set and adds the values read to the per-process counters; if SMPI
 * tracing is also enabled, each counter is then emitted as a Paje variable on the
 * process's container. The elapsed timer value is finally added to
 * smpi_total_benched_time.
 *
 * NOTE(review): this excerpt appears to omit lines between the recursive-benchmark
 * check and the smpi_execute() call -- confirm the exact control flow against the
 * full file before relying on it.
 */
-void smpi_bench_end(void)
+void smpi_bench_end()
{
-
if (MC_is_active() || MC_record_replay_is_active())
return;
double speedup = 1;
xbt_os_timer_t timer = smpi_process_timer();
xbt_os_threadtimer_stop(timer);
+
+#if HAVE_PAPI
+ /**
+ * An MPI function has been called and now is the right time to update
+ * our PAPI counters for this process.
+ */
+ if (xbt_cfg_get_string("smpi/papi-events")[0] != '\0') {
+ papi_counter_t& counter_data = smpi_process_papi_counters();
+ int event_set = smpi_process_papi_event_set();
// One slot per entry of counter_data; PAPI_stop() is handed this buffer for the readings.
+ std::vector<long long> event_values = std::vector<long long>(counter_data.size());
+
+ if (PAPI_stop(event_set, &event_values[0]) != PAPI_OK) { // Error
+ XBT_CRITICAL("Could not stop PAPI counters.\n");
+ xbt_die("Error.");
+ } else {
// Accumulate this section's readings into the per-process totals.
+ for (unsigned int i = 0; i < counter_data.size(); i++) {
+ counter_data[i].second += event_values[i];
+ // XBT_DEBUG("[%i] PAPI: Counter %s: Value is now %lli (got increment by %lli\n", smpi_process_index(),
+ // counter_data[i].first.c_str(), counter_data[i].second, event_values[i]);
+ }
+ }
+ }
+#endif
+
if (smpi_process_get_sampling()) {
XBT_CRITICAL("Cannot do recursive benchmarks.");
XBT_CRITICAL("Are you trying to make a call to MPI within a SMPI_SAMPLE_ block?");
smpi_execute(xbt_os_timer_elapsed(timer)/speedup);
}
+#if HAVE_PAPI
// Export the accumulated counters to the trace, one Paje variable per counter name.
+ if (xbt_cfg_get_string("smpi/papi-events")[0] != '\0' && TRACE_smpi_is_enabled()) {
+ char container_name[INSTR_DEFAULT_STR_SIZE];
+ smpi_container(smpi_process_index(), container_name, INSTR_DEFAULT_STR_SIZE);
+ container_t container = PJ_container_get(container_name);
+ papi_counter_t& counter_data = smpi_process_papi_counters();
+
+ for (auto& pair : counter_data) {
+ new_pajeSetVariable(surf_get_clock(), container,
+ PJ_type_get(/* countername */ pair.first.c_str(), container->type), pair.second);
+ }
+ }
+#endif
+
smpi_total_benched_time += xbt_os_timer_elapsed(timer);
}
return static_cast<int>(private_sleep(static_cast<double>(usecs) / 1000000.0));
}
-#if _POSIX_TIMERS && _POSIX_C_SOURCE >= 199309L
+#if _POSIX_TIMERS > 0
int smpi_nanosleep(const struct timespec *tp, struct timespec * t)
{
return static_cast<int>(private_sleep(static_cast<double>(tp->tv_sec + tp->tv_nsec / 1000000000.0)));
return 0;
}
-#if _POSIX_TIMERS && _POSIX_C_SOURCE >= 199309L
+#if _POSIX_TIMERS > 0
int smpi_clock_gettime(clockid_t clk_id, struct timespec *tp)
{
//there is only one time in SMPI, so clk_id is ignored.
#endif
extern double sg_surf_precision;
/**
 * Return 1/sg_surf_precision converted (truncated) to unsigned long long.
 * Calls smpi_bench_end() first, which closes the running benchmark section.
 */
-unsigned long long smpi_rastro_resolution (void)
+unsigned long long smpi_rastro_resolution ()
{
smpi_bench_end();
double resolution = (1/sg_surf_precision);
return static_cast<unsigned long long>(resolution);
}
-unsigned long long smpi_rastro_timestamp (void)
+unsigned long long smpi_rastro_timestamp ()
{
smpi_bench_end();
double now = SIMIX_get_clock();
void *smpi_shared_malloc(size_t size, const char *file, int line)
{
void* mem;
- if (xbt_cfg_get_boolean("smpi/use-shared-malloc")){
+ if (size > 0 && xbt_cfg_get_boolean("smpi/use-shared-malloc")){
int fd;
smpi_source_location loc(file, line);
auto res = allocs.insert(std::make_pair(loc, shared_data_t()));
snprintf(loc, PTR_STRLEN, "%p", ptr);
auto meta = allocs_metadata.find(ptr);
if (meta == allocs_metadata.end()) {
- XBT_WARN("Cannot free: %p was not shared-allocated by SMPI", ptr);
+ XBT_WARN("Cannot free: %p was not shared-allocated by SMPI - maybe its size was 0?", ptr);
return;
}
shared_data_t* data = &meta->second.data->second;
XBT_WARN("Unmapping of fd %d failed: %s", data->fd, strerror(errno));
}
data->count--;
- XBT_DEBUG("Shared free - no removal - of %p, count = %d", ptr, data->count);
if (data->count <= 0) {
close(data->fd);
allocs.erase(allocs.find(meta->second.data->first));
XBT_DEBUG("Shared free - with removal - of %p", ptr);
+ }else{
+ XBT_DEBUG("Shared free - no removal - of %p, count = %d", ptr, data->count);
}
}else{
XBT_DEBUG("Classic free of %p", ptr);
for (int i=0; i< smpi_process_count(); i++){
//create smpi_process_count() mappings of this size with the same data inside
+ int file_descriptor;
void *address = nullptr;
- char path[] = "/dev/shm/my-buffer-XXXXXX";
+ char path[24];
int status;
- int file_descriptor= mkstemp (path);
+ do {
+ snprintf(path, sizeof(path), "/smpi-buffer-%06x", rand()%0xffffff);
+ file_descriptor = shm_open(path, O_RDWR|O_CREAT|O_EXCL, S_IRUSR|S_IWUSR);
+ } while (file_descriptor == -1 && errno == EEXIST);
if (file_descriptor < 0) {
if (errno==EMFILE) {
xbt_die("Impossible to create temporary file for memory mapping: %s\n\
strerror(errno));
}
- status = unlink (path);
- if (status)
- xbt_die("Impossible to unlink temporary file for memory mapping");
-
status = ftruncate(file_descriptor, smpi_size_data_exe);
if(status)
xbt_die("Impossible to set the size of the temporary file for memory mapping");
if (address == MAP_FAILED)
xbt_die("Couldn't find a free region for memory mapping");
+ status = shm_unlink(path);
+ if (status)
+ xbt_die("Impossible to unlink temporary file for memory mapping");
+
//initialize the values
memcpy(address, TOPAGE(smpi_start_data_exe), smpi_size_data_exe);