Logo AND Algorithmique Numérique Distribuée

Public GIT Repository
Merge branch 'master' of framagit.org:simgrid/simgrid
[simgrid.git] / src / smpi / include / private.hpp
1 /* Copyright (c) 2007-2020. The SimGrid Team. All rights reserved.          */
2
3 /* This program is free software; you can redistribute it and/or modify it
4  * under the terms of the license (GNU LGPL) which comes with this package. */
5
6 #ifndef SMPI_PRIVATE_HPP
7 #define SMPI_PRIVATE_HPP
8
9 #include "simgrid/s4u/Barrier.hpp"
10 #include "smpi/smpi.h"
11 #include "smpi/smpi_helpers_internal.h"
12 #include "src/instr/instr_smpi.hpp"
13 #include <unordered_map>
14 #include <vector>
15
// Flag constants describing an MPI request.
// Every constant below sets exactly one distinct bit (0x1 through 0x2000), so several of them
// can be OR-ed together into a single unsigned mask and tested individually with '&'.
// NOTE(review): the precise meaning of each flag is only suggested by its name in this header;
// confirm against the code that sets and tests them.
16 constexpr unsigned MPI_REQ_PERSISTENT     = 0x1;
17 constexpr unsigned MPI_REQ_NON_PERSISTENT = 0x2;
18 constexpr unsigned MPI_REQ_SEND           = 0x4;
19 constexpr unsigned MPI_REQ_RECV           = 0x8;
20 constexpr unsigned MPI_REQ_RECV_DELETE    = 0x10;
21 constexpr unsigned MPI_REQ_ISEND          = 0x20;
22 constexpr unsigned MPI_REQ_SSEND          = 0x40;
23 constexpr unsigned MPI_REQ_PREPARED       = 0x80;
24 constexpr unsigned MPI_REQ_FINISHED       = 0x100;
25 constexpr unsigned MPI_REQ_RMA            = 0x200;
26 constexpr unsigned MPI_REQ_ACCUMULATE     = 0x400;
27 constexpr unsigned MPI_REQ_GENERALIZED    = 0x800;
28 constexpr unsigned MPI_REQ_COMPLETE       = 0x1000;
29 constexpr unsigned MPI_REQ_BSEND          = 0x2000;
30
// States an SMPI process can be in, listed in declaration order:
// UNINITIALIZED, INITIALIZING, INITIALIZED (reached once MPI_Init has been called), FINALIZED.
// NOTE(review): the transitions between states are not visible in this header.
31 enum class SmpiProcessState { UNINITIALIZED, INITIALIZING, INITIALIZED /*(=MPI_Init called)*/, FINALIZED };
32
// Tag values reserved for collective operations. All of them are negative and pairwise distinct.
// NOTE(review): presumably negative so that they cannot collide with user-supplied tags; confirm.
33 constexpr int COLL_TAG_REDUCE         = -112;
34 constexpr int COLL_TAG_SCATTER        = -223;
35 constexpr int COLL_TAG_SCATTERV       = -334;
36 constexpr int COLL_TAG_GATHER         = -445;
37 constexpr int COLL_TAG_ALLGATHER      = -556;
38 constexpr int COLL_TAG_ALLGATHERV     = -667;
39 constexpr int COLL_TAG_BARRIER        = -778;
40 constexpr int COLL_TAG_REDUCE_SCATTER = -889;
41 constexpr int COLL_TAG_ALLTOALLV      = -1000;
42 constexpr int COLL_TAG_ALLTOALLW      = -1020;
43 constexpr int COLL_TAG_ALLTOALL       = -1112;
44 constexpr int COLL_TAG_GATHERV        = -2223;
45 constexpr int COLL_TAG_BCAST          = -3334;
46 constexpr int COLL_TAG_ALLREDUCE      = -4445;
47
48 // SMPI_RMA_TAG has to be the smallest one, as it will be decremented for accumulate ordering.
// It is below every COLL_TAG_* value above (the lowest of which is -4445), so values obtained by
// decrementing it never reach a collective tag. Keep this ordering when adding new tags.
49 constexpr int SMPI_RMA_TAG            = -6666;
50
// Sentinel MPI_Request* built by casting the integer -100 to a pointer. It does not point to a
// real object and must only be compared against, never dereferenced.
// NOTE(review): presumably passed where the caller does not want a request handle back; confirm at call sites.
51 #define MPI_REQUEST_IGNORED ((MPI_Request*)-100)
52
53 /* Bindings for MPI special values */
// The FORT_* macros in this header compare an incoming address against the ADDRESS of these
// objects (see FORT_ADDR), so what matters is their identity, not the int they hold.
// NOTE(review): presumably these are the objects Fortran code sees as MPI_IN_PLACE, MPI_BOTTOM, etc.
54 extern XBT_PUBLIC int mpi_in_place_;
55 extern XBT_PUBLIC int mpi_bottom_;
56 extern XBT_PUBLIC int mpi_status_ignore_;
57 extern XBT_PUBLIC int mpi_statuses_ignore_; 
58 /* Convert between Fortran and C */
// FORT_ADDR(addr, val, val2): if addr is the address of the object val2, evaluate to val;
// otherwise evaluate to addr itself converted to void*. addr is expanded twice, so do not pass
// an expression with side effects. The C-style casts also drop any const qualifier on addr.
59 #define FORT_ADDR(addr, val, val2)                                         \
60   (((void *)(addr) == (void*) &(val2))                  \
61    ? (val) : (void *)(addr))
// Map the address of the mpi_bottom_ / mpi_in_place_ binding objects to MPI_BOTTOM / MPI_IN_PLACE;
// any other address is passed through unchanged (as void*).
62 #define FORT_BOTTOM(addr) FORT_ADDR((addr), MPI_BOTTOM, mpi_bottom_)
63 #define FORT_IN_PLACE(addr) FORT_ADDR((addr), MPI_IN_PLACE, mpi_in_place_)
// Same mapping for the status sentinels, with the result cast to MPI_Status*.
64 #define FORT_STATUS_IGNORE(addr) static_cast<MPI_Status*>(FORT_ADDR((addr), MPI_STATUS_IGNORE, mpi_status_ignore_))
65 #define FORT_STATUSES_IGNORE(addr)                                                                                     \
66   static_cast<MPI_Status*>(FORT_ADDR((addr), MPI_STATUSES_IGNORE, mpi_statuses_ignore_))
67
// Library-private MPI_Comm object, defined in another translation unit.
// NOTE(review): presumably a placeholder communicator used before MPI is initialized; confirm at its definition.
68 extern XBT_PRIVATE MPI_Comm MPI_COMM_UNINITIALIZED;
69
// Pointer aliases for the three topology descriptor types (Cartesian, graph, distributed graph).
// Each alias names a plain pointer to the corresponding SMPI_*_topology type.
70 using MPIR_Cart_Topology = SMPI_Cart_topology*;
71
72 using MPIR_Graph_Topology = SMPI_Graph_topology*;
73
74 using MPIR_Dist_Graph_Topology = SMPI_Dist_Graph_topology*;
75
// Accessors returning a pointer to a simgrid::smpi::ActorExt.
// smpi_process() takes no argument; smpi_process_remote() takes the actor explicitly.
// NOTE(review): presumably smpi_process() refers to the calling actor; ownership of the returned
// pointer is not visible here.
76 XBT_PRIVATE simgrid::smpi::ActorExt* smpi_process();
77 XBT_PRIVATE simgrid::smpi::ActorExt* smpi_process_remote(simgrid::s4u::ActorPtr actor);
// Returns an int; NOTE(review): presumably the size of the MPI universe, confirm at the definition.
78 XBT_PRIVATE int smpi_get_universe_size();
79
// Deployment bookkeeping, keyed by an instance identifier string.
// NOTE(review): std::string is used here, but <string> is not among the includes visible at the
// top of this header; it is presumably pulled in transitively. Consider including it directly.
80 XBT_PRIVATE void smpi_deployment_register_process(const std::string& instance_id, int rank, simgrid::s4u::Actor* actor);
81 XBT_PRIVATE void smpi_deployment_unregister_process(const std::string& instance_id);
82
// Returns a pointer to an MPI_Comm for the given instance id.
// NOTE(review): presumably that instance's MPI_COMM_WORLD; lifetime of the pointee is not visible here.
83 XBT_PRIVATE MPI_Comm* smpi_deployment_comm_world(const std::string& instance_id);
84 XBT_PRIVATE void smpi_deployment_cleanup_instances();
85
// Two callbacks with the same signature: a CommImpl pointer, a raw buffer and its size in bytes.
// NOTE(review): presumably installed as the kernel's data-copy hook, the "null" variant skipping
// the actual copy; confirm at the definitions.
86 XBT_PRIVATE void smpi_comm_copy_buffer_callback(simgrid::kernel::activity::CommImpl* comm, void* buff,
87                                                 size_t buff_size);
88
89 XBT_PRIVATE void smpi_comm_null_copy_buffer_callback(simgrid::kernel::activity::CommImpl* comm, void* buff,
90                                                      size_t buff_size);
91
// Returns an int. NOTE(review): presumably non-zero when SMPI is active; confirm at the definition.
92 XBT_PRIVATE int smpi_enabled();
// Returns a double. NOTE(review): presumably the simulated wall-clock time backing MPI_Wtime; unit not visible here.
93 XBT_PRIVATE double smpi_mpi_wtime();
94 XBT_PRIVATE void smpi_mpi_init();
95
// Value returned by smpi_cfg_shared_malloc(). Three modes: NONE, LOCAL, GLOBAL.
96 enum class SharedMallocType { NONE, LOCAL, GLOBAL };
// Value returned by smpi_cfg_privatization(). Enumerators have explicit values;
// DEFAULT is an alias of DLOPEN (both equal 2), so the two compare equal.
97 enum class SmpiPrivStrategies { NONE = 0, MMAP = 1, DLOPEN = 2, DEFAULT = DLOPEN };
98
// Parameterless getters with the smpi_cfg_ prefix, each returning one value by copy.
// NOTE(review): presumably each reads one SMPI configuration option; the option names, units and
// defaults are not visible in this header.
99 XBT_PRIVATE double smpi_cfg_host_speed();
100 XBT_PRIVATE bool smpi_cfg_simulate_computation();
101 XBT_PRIVATE SharedMallocType smpi_cfg_shared_malloc();
102 XBT_PRIVATE double smpi_cfg_cpu_thresh();
103 XBT_PRIVATE SmpiPrivStrategies smpi_cfg_privatization();
104 XBT_PRIVATE int smpi_cfg_async_small_thresh();
105 XBT_PRIVATE int smpi_cfg_detached_send_thresh();
106 XBT_PRIVATE bool smpi_cfg_grow_injected_times();
107 XBT_PRIVATE double smpi_cfg_iprobe_cpu_usage();
108 XBT_PRIVATE bool smpi_cfg_trace_call_location();
109 XBT_PRIVATE bool smpi_cfg_trace_call_use_absolute_path();
// The two getters below return std::string by value.
110 XBT_PRIVATE std::string smpi_cfg_comp_adjustment_file();
111 XBT_PRIVATE std::string smpi_cfg_papi_events_file();
112 XBT_PRIVATE double smpi_cfg_auto_shared_malloc_thresh();
113
114 // utilities
115 extern XBT_PRIVATE char* smpi_data_exe_start; // start of the data+bss segment of the executable
// Note that the size is a plain int, not size_t.
116 extern XBT_PRIVATE int smpi_data_exe_size;    // size of the data+bss segment of the executable
117
// NOTE(review): presumably makes the given actor's private copy of the data segment current; confirm.
118 XBT_PRIVATE void smpi_switch_data_segment(simgrid::s4u::ActorPtr actor);
119
// Parameterless, void-returning helpers. NOTE(review): their effects and required call order are
// not visible in this header; the names suggest global-memory-segment, benchmarking and
// shared-memory housekeeping.
120 XBT_PRIVATE void smpi_prepare_global_memory_segment();
121 XBT_PRIVATE void smpi_backup_global_memory_segment();
122 XBT_PRIVATE void smpi_destroy_global_memory_segments();
123 XBT_PRIVATE void smpi_bench_destroy();
124 XBT_PRIVATE void smpi_bench_begin();
125 XBT_PRIVATE void smpi_bench_end();
126 XBT_PRIVATE void smpi_shared_destroy();
127 XBT_PRIVATE double smpi_adjust_comp_speed();
128
// Temporary byte buffers: the two getters take a size and return unsigned char*;
// smpi_free_tmp_buffer() takes a const pointer to such a buffer.
// NOTE(review): presumably every buffer obtained from the getters must be released with
// smpi_free_tmp_buffer(); ownership rules are not visible here.
129 XBT_PRIVATE unsigned char* smpi_get_tmp_sendbuffer(size_t size);
130 XBT_PRIVATE unsigned char* smpi_get_tmp_recvbuffer(size_t size);
131 XBT_PRIVATE void smpi_free_tmp_buffer(const unsigned char* buf);
132 XBT_PRIVATE void smpi_free_replay_tmp_buffers();
133
// Everything from here on is declared with C linkage, so the symbol names are not mangled.
134 extern "C" {
135 // f77 wrappers
// Each wrapper name is the lower-case MPI routine name followed by an underscore. Arguments are
// passed through pointers, and all but the two timing functions report through a trailing int* ierr.
// NOTE(review): presumably this matches the calling convention of the Fortran compiler in use.
136
137 void mpi_init_(int* ierr);
138 void mpi_finalize_(int* ierr);
139 void mpi_abort_(int* comm, int* errorcode, int* ierr);
140 void mpi_comm_rank_(int* comm, int* rank, int* ierr);
141 void mpi_comm_size_(int* comm, int* size, int* ierr);
// The two timing wrappers return their result directly and have no ierr argument.
142 double mpi_wtime_();
143 double mpi_wtick_();
144 void mpi_initialized_(int* flag, int* ierr);
145
// Communicator/group management, point-to-point and completion wrappers (still inside extern "C").
// Handles (comm, group, datatype, request) are exchanged as int*.
// NOTE(review): presumably Fortran integer handles that the definitions translate to C objects.
146 void mpi_comm_dup_(int* comm, int* newcomm, int* ierr);
147 void mpi_comm_create_(int* comm, int* group, int* newcomm, int* ierr);
148 void mpi_comm_free_(int* comm, int* ierr);
149 void mpi_comm_split_(int* comm, int* color, int* key, int* comm_out, int* ierr);
150 void mpi_group_incl_(int* group, int* n, int* key, int* group_out, int* ierr);
151 void mpi_comm_group_(int* comm, int* group_out, int* ierr);
// NOTE(review): the third parameter is an unnamed int passed BY VALUE, unlike every other argument
// in this group (all pointers). Looks like it should be an int* tag; the definition must be changed
// together with this declaration if that is fixed.
152 void mpi_comm_create_group_(int* comm, int* group, int, int* comm_out, int* ierr);
153 void mpi_send_init_(void* buf, int* count, int* datatype, int* dst, int* tag, int* comm, int* request, int* ierr);
154 void mpi_isend_(void* buf, int* count, int* datatype, int* dst, int* tag, int* comm, int* request, int* ierr);
155 void mpi_irsend_(void* buf, int* count, int* datatype, int* dst, int* tag, int* comm, int* request, int* ierr);
156 void mpi_send_(void* buf, int* count, int* datatype, int* dst, int* tag, int* comm, int* ierr);
157 void mpi_rsend_(void* buf, int* count, int* datatype, int* dst, int* tag, int* comm, int* ierr);
158 void mpi_recv_init_(void* buf, int* count, int* datatype, int* src, int* tag, int* comm, int* request, int* ierr);
159 void mpi_irecv_(void* buf, int* count, int* datatype, int* src, int* tag, int* comm, int* request, int* ierr);
// Status arguments are typed MPI_Status* rather than int*.
160 void mpi_recv_(void* buf, int* count, int* datatype, int* src, int* tag, int* comm, MPI_Status* status, int* ierr);
161 void mpi_start_(int* request, int* ierr);
162 void mpi_startall_(int* count, int* requests, int* ierr);
163 void mpi_wait_(int* request, MPI_Status* status, int* ierr);
164 void mpi_waitany_(int* count, int* requests, int* index, MPI_Status* status, int* ierr);
165 void mpi_waitall_(int* count, int* requests, MPI_Status* status, int* ierr);
166
// Blocking collective wrappers (still inside extern "C"). Buffers are void*, every other argument
// is an int*, and the last argument is always int* ierr.
167 void mpi_barrier_(int* comm, int* ierr);
168 void mpi_bcast_(void* buf, int* count, int* datatype, int* root, int* comm, int* ierr);
169 void mpi_reduce_(void* sendbuf, void* recvbuf, int* count, int* datatype, int* op, int* root, int* comm, int* ierr);
170 void mpi_allreduce_(void* sendbuf, void* recvbuf, int* count, int* datatype, int* op, int* comm, int* ierr);
171 void mpi_reduce_scatter_(void* sendbuf, void* recvbuf, int* recvcounts, int* datatype, int* op, int* comm, int* ierr);
172 void mpi_reduce_scatter_block_(void* sendbuf, void* recvbuf, int* recvcount, int* datatype, int* op, int* comm,
173                                int* ierr);
174 void mpi_scatter_(void* sendbuf, int* sendcount, int* sendtype, void* recvbuf, int* recvcount, int* recvtype, int* root,
175                   int* comm, int* ierr);
176 void mpi_scatterv_(void* sendbuf, int* sendcounts, int* displs, int* sendtype, void* recvbuf, int* recvcount,
177                    int* recvtype, int* root, int* comm, int* ierr);
178 void mpi_gather_(void* sendbuf, int* sendcount, int* sendtype, void* recvbuf, int* recvcount, int* recvtype, int* root,
179                  int* comm, int* ierr);
180 void mpi_gatherv_(void* sendbuf, int* sendcount, int* sendtype, void* recvbuf, int* recvcounts, int* displs,
181                   int* recvtype, int* root, int* comm, int* ierr);
182 void mpi_allgather_(void* sendbuf, int* sendcount, int* sendtype, void* recvbuf, int* recvcount, int* recvtype,
183                     int* comm, int* ierr);
// NOTE(review): the parameter before displs is named recvcount (singular) here but recvcounts in
// mpi_gatherv_ above; presumably it is also a per-rank array. Naming only, no effect on callers.
184 void mpi_allgatherv_(void* sendbuf, int* sendcount, int* sendtype, void* recvbuf, int* recvcount, int* displs,
185                      int* recvtype, int* comm, int* ierr);
186 void mpi_scan_(void* sendbuf, void* recvbuf, int* count, int* datatype, int* op, int* comm, int* ierr);
187 void mpi_alltoall_(void* sendbuf, int* sendcount, int* sendtype, void* recvbuf, int* recvcount, int* recvtype,
188                    int* comm, int* ierr);
189 void mpi_alltoallv_(void* sendbuf, int* sendcounts, int* senddisps, int* sendtype, void* recvbuf, int* recvcounts,
190                     int* recvdisps, int* recvtype, int* comm, int* ierr);
191 void mpi_alltoallw_(void* sendbuf, int* sendcnts, int* sdispls, int* sendtypes, void* recvbuf, int* recvcnts,
192                     int* rdispls, int* recvtypes, int* comm, int* ierr);
193 void mpi_exscan_(void* sendbuf, void* recvbuf, int* count, int* datatype, int* op, int* comm, int* ierr);
194
// Non-blocking collective wrappers (still inside extern "C"). Each signature equals the blocking
// counterpart declared earlier in this header, with an extra int* request inserted just before ierr.
195 void mpi_ibarrier_(int* comm, int* request, int* ierr);
196 void mpi_ibcast_(void* buf, int* count, int* datatype, int* root, int* comm, int* request, int* ierr);
197 void mpi_ireduce_(void* sendbuf, void* recvbuf, int* count, int* datatype, int* op, int* root, int* comm, int* request, int* ierr);
198 void mpi_iallreduce_(void* sendbuf, void* recvbuf, int* count, int* datatype, int* op, int* comm, int* request, int* ierr);
199 void mpi_ireduce_scatter_(void* sendbuf, void* recvbuf, int* recvcounts, int* datatype, int* op, int* comm, int* request, int* ierr);
200 void mpi_ireduce_scatter_block_(void* sendbuf, void* recvbuf, int* recvcount, int* datatype, int* op, int* comm, int* request ,
201                                int* ierr);
202 void mpi_iscatter_(void* sendbuf, int* sendcount, int* sendtype, void* recvbuf, int* recvcount, int* recvtype, int* root,
203                   int* comm, int* request, int* ierr);
204 void mpi_iscatterv_(void* sendbuf, int* sendcounts, int* displs, int* sendtype, void* recvbuf, int* recvcount,
205                    int* recvtype, int* root, int* comm, int* request, int* ierr);
206 void mpi_igather_(void* sendbuf, int* sendcount, int* sendtype, void* recvbuf, int* recvcount, int* recvtype, int* root,
207                  int* comm, int* request, int* ierr);
208 void mpi_igatherv_(void* sendbuf, int* sendcount, int* sendtype, void* recvbuf, int* recvcounts, int* displs,
209                   int* recvtype, int* root, int* comm, int* request, int* ierr);
210 void mpi_iallgather_(void* sendbuf, int* sendcount, int* sendtype, void* recvbuf, int* recvcount, int* recvtype,
211                     int* comm, int* request, int* ierr);
212 void mpi_iallgatherv_(void* sendbuf, int* sendcount, int* sendtype, void* recvbuf, int* recvcount, int* displs,
213                      int* recvtype, int* comm, int* request, int* ierr);
214 void mpi_iscan_(void* sendbuf, void* recvbuf, int* count, int* datatype, int* op, int* comm, int* request, int* ierr);
215 void mpi_ialltoall_(void* sendbuf, int* sendcount, int* sendtype, void* recvbuf, int* recvcount, int* recvtype,
216                    int* comm, int* request, int* ierr);
217 void mpi_ialltoallv_(void* sendbuf, int* sendcounts, int* senddisps, int* sendtype, void* recvbuf, int* recvcounts,
218                     int* recvdisps, int* recvtype, int* comm, int* request, int* ierr);
219 void mpi_ialltoallw_(void* sendbuf, int* sendcnts, int* sdispls, int* sendtypes, void* recvbuf, int* recvcnts,
220                     int* rdispls, int* recvtypes, int* comm, int* request, int* ierr);
221 void mpi_iexscan_(void* sendbuf, void* recvbuf, int* count, int* datatype, int* op, int* comm, int* request, int* ierr);
222
// Datatype queries/constructors, request testing and miscellaneous wrappers (still inside extern "C").
// Extents, strides and bounds are exchanged as MPI_Aint*; counts and handles as int*.
223 void mpi_type_size_(int* datatype, int* size, int* ierr);
// NOTE(review): no explicit buffer-length argument for name is declared here; confirm how the
// definition bounds its write into name.
224 void mpi_get_processor_name_(char* name, int* resultlen, int* ierr);
225 void mpi_test_(int* request, int* flag, MPI_Status* status, int* ierr);
226 void mpi_testall_(int* count, int* requests, int* flag, MPI_Status* statuses, int* ierr);
227 void mpi_get_count_(MPI_Status* status, int* datatype, int* count, int* ierr);
228 void mpi_type_extent_(int* datatype, MPI_Aint* extent, int* ierr);
229 void mpi_attr_get_(int* comm, int* keyval, int* attr_value, int* flag, int* ierr);
230 void mpi_type_commit_(int* datatype, int* ierr);
// The vector constructor takes its stride as int*, the two hvector ones as MPI_Aint*.
231 void mpi_type_vector_(int* count, int* blocklen, int* stride, int* old_type, int* newtype, int* ierr);
232 void mpi_type_hvector_(int* count, int* blocklen, MPI_Aint* stride, int* old_type, int* newtype, int* ierr);
233 void mpi_type_create_hvector_(int* count, int* blocklen, MPI_Aint* stride, int* old_type, int* newtype, int* ierr);
234 void mpi_type_free_(int* datatype, int* ierr);
// Both bound queries name their output parameter "extent".
235 void mpi_type_lb_(int* datatype, MPI_Aint* extent, int* ierr);
236 void mpi_type_ub_(int* datatype, MPI_Aint* extent, int* ierr);
// One-sided communication window wrappers (still inside extern "C").
237 void mpi_win_fence_(int* assert, int* win, int* ierr);
238 void mpi_win_free_(int* win, int* ierr);
239 void mpi_win_create_(int* base, MPI_Aint* size, int* disp_unit, int* info, int* comm, int* win, int* ierr);
// The trailing by-value int after ierr is presumably the hidden Fortran character length of name
// (NOTE(review): confirm against the Fortran compiler's string-passing convention).
240 void mpi_win_set_name_(int* win, char* name, int* ierr, int size);
241 void mpi_win_get_name_(int* win, char* name, int* len, int* ierr);
// NOTE(review): in the next two declarations assert is an int passed BY VALUE, whereas
// mpi_win_fence_, mpi_win_lock_ and mpi_win_lock_all_ take int* assert. This looks inconsistent
// with by-reference argument passing; any fix must change the definitions as well.
242 void mpi_win_post_(int* group, int assert, int* win, int* ierr);
243 void mpi_win_start_(int* group, int assert, int* win, int* ierr);
244 void mpi_win_complete_(int* win, int* ierr);
245 void mpi_win_wait_(int* win, int* ierr);
246 void mpi_win_allocate_(MPI_Aint* size, int* disp_unit, int* info, int* comm, void* base, int* win, int* ierr);
247 void mpi_win_attach_(int* win, int* base, MPI_Aint* size, int* ierr);
248 void mpi_win_create_dynamic_(int* info, int* comm, int* win, int* ierr);
249 void mpi_win_detach_(int* win, int* base, int* ierr);
250 void mpi_win_set_info_(int* win, int* info, int* ierr);
251 void mpi_win_get_info_(int* win, int* info, int* ierr);
252 void mpi_win_get_group_(int* win, int* group, int* ierr);
// Window attribute values are exchanged as MPI_Aint*.
253 void mpi_win_get_attr_(int* win, int* type_keyval, MPI_Aint* attribute_val, int* flag, int* ierr);
254 void mpi_win_set_attr_(int* win, int* type_keyval, MPI_Aint* att, int* ierr);
255 void mpi_win_delete_attr_(int* win, int* comm_keyval, int* ierr);
// copy_fn / delete_fn are passed as untyped void*; NOTE(review): presumably function pointers
// that the definition casts to the proper callback types.
256 void mpi_win_create_keyval_(void* copy_fn, void* delete_fn, int* keyval, void* extra_state, int* ierr);
257 void mpi_win_free_keyval_(int* keyval, int* ierr);
258 void mpi_win_lock_(int* lock_type, int* rank, int* assert, int* win, int* ierr);
259 void mpi_win_lock_all_(int* assert, int* win, int* ierr);
260 void mpi_win_unlock_(int* rank, int* win, int* ierr);
261 void mpi_win_unlock_all_(int* win, int* ierr);
262 void mpi_win_flush_(int* rank, int* win, int* ierr);
263 void mpi_win_flush_local_(int* rank, int* win, int* ierr);
264 void mpi_win_flush_all_(int* win, int* ierr);
265 void mpi_win_flush_local_all_(int* win, int* ierr);
266 void mpi_win_dup_fn_( int* win, int* keyval, int* extrastate, MPI_Aint* valin, MPI_Aint* valout, int* flag, int* ierr );
267 void mpi_win_null_copy_fn_( int* win, int* keyval, int* extrastate, MPI_Aint* valin, MPI_Aint* valout, int* flag, int* ierr );
// Info objects, one-sided data movement and a few point-to-point helpers (still inside extern "C").
268 void mpi_info_create_(int* info, int* ierr);
// The two trailing by-value unsigned ints come after ierr and are presumably the hidden Fortran
// character lengths of key and value (NOTE(review): confirm; note the window/type set_name
// wrappers in this header use a signed int for the same purpose).
269 void mpi_info_set_(int* info, char* key, char* value, int* ierr, unsigned int keylen, unsigned int valuelen);
270 void mpi_info_free_(int* info, int* ierr);
// In the one-sided wrappers below origin_addr is typed int* (not void*) and target_disp is MPI_Aint*.
// The r-prefixed variants add an int* request just before ierr.
271 void mpi_get_(int* origin_addr, int* origin_count, int* origin_datatype, int* target_rank, MPI_Aint* target_disp,
272               int* target_count, int* target_datatype, int* win, int* ierr);
273 void mpi_put_(int* origin_addr, int* origin_count, int* origin_datatype, int* target_rank, MPI_Aint* target_disp,
274               int* target_count, int* target_datatype, int* win, int* ierr);
275 void mpi_rget_(int* origin_addr, int* origin_count, int* origin_datatype, int* target_rank, MPI_Aint* target_disp,
276                int* target_count, int* target_datatype, int* win, int* request, int* ierr);
277 void mpi_rput_(int* origin_addr, int* origin_count, int* origin_datatype, int* target_rank, MPI_Aint* target_disp,
278                int* target_count, int* target_datatype, int* win, int* request, int* ierr);
279 void mpi_fetch_and_op_(int* origin_addr, int* result_addr, int* datatype, int* target_rank, MPI_Aint* target_disp,
280                        int* op, int* win, int* ierr);
281 void mpi_compare_and_swap_(int* origin_addr, int* compare_addr, int* result_addr, int* datatype, int* target_rank,
282                            MPI_Aint* target_disp, int* win, int* ierr);
283 void mpi_get_accumulate_(int* origin_addr, int* origin_count, int* origin_datatype, int* result_addr, int* result_count,
284                          int* result_datatype, int* target_rank, MPI_Aint* target_disp, int* target_count,
285                          int* target_datatype, int* op, int* win, int* ierr);
286 void mpi_rget_accumulate_(int* origin_addr, int* origin_count, int* origin_datatype, int* result_addr,
287                           int* result_count, int* result_datatype, int* target_rank, MPI_Aint* target_disp,
288                           int* target_count, int* target_datatype, int* op, int* win, int* request, int* ierr);
289 void mpi_accumulate_(int* origin_addr, int* origin_count, int* origin_datatype, int* target_rank, MPI_Aint* target_disp,
290                      int* target_count, int* target_datatype, int* op, int* win, int* ierr);
291 void mpi_raccumulate_(int* origin_addr, int* origin_count, int* origin_datatype, int* target_rank,
292                       MPI_Aint* target_disp, int* target_count, int* target_datatype, int* op, int* win, int* request,
293                       int* ierr);
294 void mpi_error_string_(int* errorcode, char* string, int* resultlen, int* ierr);
295 void mpi_sendrecv_(void* sendbuf, int* sendcount, int* sendtype, int* dst, int* sendtag, void* recvbuf, int* recvcount,
296                    int* recvtype, int* src, int* recvtag, int* comm, MPI_Status* status, int* ierr);
297
// Environment, threading, address, datatype-attribute and reduction-operator wrappers
// (still inside extern "C").
298 void mpi_finalized_(int* flag, int* ierr);
299 void mpi_init_thread_(int* required, int* provided, int* ierr);
300 void mpi_query_thread_(int* provided, int* ierr);
301 void mpi_is_thread_main_(int* flag, int* ierr);
// Two wrappers with identical signatures: location in, MPI_Aint address out.
302 void mpi_address_(void* location, MPI_Aint* address, int* ierr);
303 void mpi_get_address_(void* location, MPI_Aint* address, int* ierr);
304 void mpi_type_dup_(int* datatype, int* newdatatype, int* ierr);
// The trailing by-value int after ierr is presumably the hidden Fortran character length of name
// (NOTE(review): confirm).
305 void mpi_type_set_name_(int* datatype, char* name, int* ierr, int size);
306 void mpi_type_get_name_(int* datatype, char* name, int* len, int* ierr);
// NOTE(review): datatype attribute values are int* here, whereas the window attribute wrappers in
// this header use MPI_Aint*; confirm that the difference is intended.
307 void mpi_type_get_attr_(int* type, int* type_keyval, int* attribute_val, int* flag, int* ierr);
308 void mpi_type_set_attr_(int* type, int* type_keyval, int* attribute_val, int* ierr);
309 void mpi_type_delete_attr_(int* type, int* type_keyval, int* ierr);
310 void mpi_type_create_keyval_(void* copy_fn, void* delete_fn, int* keyval, void* extra_state, int* ierr);
311 void mpi_type_free_keyval_(int* keyval, int* ierr);
312 void mpi_pcontrol_(int* level, int* ierr);
313 void mpi_type_get_extent_(int* datatype, MPI_Aint* lb, MPI_Aint* extent, int* ierr);
314 void mpi_type_get_true_extent_(int* datatype, MPI_Aint* lb, MPI_Aint* extent, int* ierr);
// The user reduction function is passed as an untyped void*.
315 void mpi_op_create_(void* function, int* commute, int* op, int* ierr);
316 void mpi_op_free_(int* op, int* ierr);
317 void mpi_op_commutative_(int* op, int* commute, int* ierr);
// Group operations and communicator attribute/naming wrappers (still inside extern "C").
318 void mpi_group_free_(int* group, int* ierr);
319 void mpi_group_size_(int* group, int* size, int* ierr);
320 void mpi_group_rank_(int* group, int* rank, int* ierr);
321 void mpi_group_translate_ranks_(int* group1, int* n, int* ranks1, int* group2, int* ranks2, int* ierr);
322 void mpi_group_compare_(int* group1, int* group2, int* result, int* ierr);
323 void mpi_group_union_(int* group1, int* group2, int* newgroup, int* ierr);
324 void mpi_group_intersection_(int* group1, int* group2, int* newgroup, int* ierr);
325 void mpi_group_difference_(int* group1, int* group2, int* newgroup, int* ierr);
326 void mpi_group_excl_(int* group, int* n, int* ranks, int* newgroup, int* ierr);
// ranges is an array of int triplets (int[][3]).
// NOTE(review): presumably (first, last, stride) as in MPI_Group_range_incl; the number of triplets is *n.
327 void mpi_group_range_incl_(int* group, int* n, int ranges[][3], int* newgroup, int* ierr);
328 void mpi_group_range_excl_(int* group, int* n, int ranges[][3], int* newgroup, int* ierr);
329 void mpi_comm_get_attr_(int* comm, int* comm_keyval, int* attribute_val, int* flag, int* ierr);
330 void mpi_comm_set_attr_(int* comm, int* comm_keyval, int* attribute_val, int* ierr);
331 void mpi_comm_delete_attr_(int* comm, int* comm_keyval, int* ierr);
332 void mpi_comm_create_keyval_(void* copy_fn, void* delete_fn, int* keyval, void* extra_state, int* ierr);
333 void mpi_comm_free_keyval_(int* keyval, int* ierr);
334 void mpi_comm_get_name_(int* comm, char* name, int* len, int* ierr);
335 void mpi_comm_compare_(int* comm1, int* comm2, int* result, int* ierr);
336 void mpi_comm_disconnect_(int* comm, int* ierr);
337 void mpi_request_free_(int* request, int* ierr);
// Completion helpers, packing size and process-topology wrappers (still inside extern "C").
338 void mpi_sendrecv_replace_(void* buf, int* count, int* datatype, int* dst, int* sendtag, int* src, int* recvtag,
339                            int* comm, MPI_Status* status, int* ierr);
340 void mpi_testany_(int* count, int* requests, int* index, int* flag, MPI_Status* status, int* ierr);
341 void mpi_waitsome_(int* incount, int* requests, int* outcount, int* indices, MPI_Status* status, int* ierr);
342 void mpi_reduce_local_(void* inbuf, void* inoutbuf, int* count, int* datatype, int* op, int* ierr);
343 void mpi_pack_size_(int* incount, int* datatype, int* comm, int* size, int* ierr);
// Cartesian topology wrappers.
344 void mpi_cart_coords_(int* comm, int* rank, int* maxdims, int* coords, int* ierr);
345 void mpi_cart_create_(int* comm_old, int* ndims, int* dims, int* periods, int* reorder, int* comm_cart, int* ierr);
346 void mpi_cart_get_(int* comm, int* maxdims, int* dims, int* periods, int* coords, int* ierr);
347 void mpi_cart_map_(int* comm_old, int* ndims, int* dims, int* periods, int* newrank, int* ierr);
348 void mpi_cart_rank_(int* comm, int* coords, int* rank, int* ierr);
349 void mpi_cart_shift_(int* comm, int* direction, int* displ, int* source, int* dest, int* ierr);
350 void mpi_cart_sub_(int* comm, int* remain_dims, int* comm_new, int* ierr);
351 void mpi_cartdim_get_(int* comm, int* ndims, int* ierr);
// Graph topology wrappers.
352 void mpi_graph_create_(int* comm_old, int* nnodes, int* index, int* edges, int* reorder, int* comm_graph, int* ierr);
353 void mpi_graph_get_(int* comm, int* maxindex, int* maxedges, int* index, int* edges, int* ierr);
354 void mpi_graph_map_(int* comm_old, int* nnodes, int* index, int* edges, int* newrank, int* ierr);
355 void mpi_graph_neighbors_(int* comm, int* rank, int* maxneighbors, int* neighbors, int* ierr);
356 void mpi_graph_neighbors_count_(int* comm, int* rank, int* nneighbors, int* ierr);
357 void mpi_graphdims_get_(int* comm, int* nnodes, int* nedges, int* ierr);
358 void mpi_topo_test_(int* comm, int* top_type, int* ierr);
// Error handlers, buffered-send buffers, pack/unpack and derived-datatype constructors
// (still inside extern "C").
359 void mpi_error_class_(int* errorcode, int* errorclass, int* ierr);
// The handler function is passed as an untyped void*.
360 void mpi_errhandler_create_(void* function, int* errhandler, int* ierr);
361 void mpi_errhandler_free_(int* errhandler, int* ierr);
362 void mpi_errhandler_get_(int* comm, int* errhandler, int* ierr);
363 void mpi_errhandler_set_(int* comm, int* errhandler, int* ierr);
364 void mpi_comm_set_errhandler_(int* comm, int* errhandler, int* ierr);
365 void mpi_comm_get_errhandler_(int* comm, int* errhandler, int* ierr);
366 void mpi_type_contiguous_(int* count, int* old_type, int* newtype, int* ierr);
367 void mpi_cancel_(int* request, int* ierr);
368 void mpi_buffer_attach_(void* buffer, int* size, int* ierr);
369 void mpi_buffer_detach_(void* buffer, int* size, int* ierr);
370 void mpi_testsome_(int* incount, int* requests, int* outcount, int* indices, MPI_Status* statuses, int* ierr);
371 void mpi_comm_test_inter_(int* comm, int* flag, int* ierr);
372 void mpi_unpack_(void* inbuf, int* insize, int* position, void* outbuf, int* outcount, int* type, int* comm, int* ierr);
// NOTE(review): datarep is a char* with no accompanying length argument in the three *_external
// wrappers; confirm how the definitions determine the string length.
373 void mpi_pack_external_size_(char* datarep, int* incount, int* datatype, MPI_Aint* size, int* ierr);
374 void mpi_pack_external_(char* datarep, void* inbuf, int* incount, int* datatype, void* outbuf, MPI_Aint* outcount,
375                         MPI_Aint* position, int* ierr);
376 void mpi_unpack_external_(char* datarep, void* inbuf, MPI_Aint* insize, MPI_Aint* position, void* outbuf, int* outcount,
377                           int* datatype, int* ierr);
// NOTE(review): mpi_type_hindexed_ takes its displacements as int* while the create_hindexed
// variants take MPI_Aint*; the same split exists between mpi_type_struct_ (int*) and
// mpi_type_create_struct_ (MPI_Aint*) below. Confirm this is intended.
378 void mpi_type_hindexed_(int* count, int* blocklens, int* indices, int* old_type, int* newtype, int* ierr);
379 void mpi_type_create_hindexed_(int* count, int* blocklens, MPI_Aint* indices, int* old_type, int* newtype, int* ierr);
380 void mpi_type_create_hindexed_block_(int* count, int* blocklength, MPI_Aint* indices, int* old_type, int* newtype,
381                                      int* ierr);
382 void mpi_type_indexed_(int* count, int* blocklens, int* indices, int* old_type, int* newtype, int* ierr);
383 void mpi_type_create_indexed_(int* count, int* blocklens, int* indices, int* old_type, int* newtype, int* ierr);
384 void mpi_type_create_indexed_block_(int* count, int* blocklength, int* indices, int* old_type, int* newtype, int* ierr);
385 void mpi_type_struct_(int* count, int* blocklens, int* indices, int* old_types, int* newtype, int* ierr);
386 void mpi_type_create_struct_(int* count, int* blocklens, MPI_Aint* indices, int* old_types, int* newtype, int* ierr);
// Synchronous/buffered/ready send variants, inter-communicators, probing and legacy attribute
// wrappers (still inside extern "C"). The send variants share the layout
// (buf, count, datatype, dest, tag, comm[, request], ierr).
387 void mpi_ssend_(void* buf, int* count, int* datatype, int* dest, int* tag, int* comm, int* ierr);
388 void mpi_ssend_init_(void* buf, int* count, int* datatype, int* dest, int* tag, int* comm, int* request, int* ierr);
389 void mpi_intercomm_create_(int* local_comm, int* local_leader, int* peer_comm, int* remote_leader, int* tag,
390                            int* comm_out, int* ierr);
391 void mpi_intercomm_merge_(int* comm, int* high, int* comm_out, int* ierr);
392 void mpi_bsend_(void* buf, int* count, int* datatype, int* dest, int* tag, int* comm, int* ierr);
393 void mpi_bsend_init_(void* buf, int* count, int* datatype, int* dest, int* tag, int* comm, int* request, int* ierr);
394 void mpi_ibsend_(void* buf, int* count, int* datatype, int* dest, int* tag, int* comm, int* request, int* ierr);
395 void mpi_comm_remote_group_(int* comm, int* group, int* ierr);
396 void mpi_comm_remote_size_(int* comm, int* size, int* ierr);
397 void mpi_issend_(void* buf, int* count, int* datatype, int* dest, int* tag, int* comm, int* request, int* ierr);
398 void mpi_probe_(int* source, int* tag, int* comm, MPI_Status* status, int* ierr);
399 void mpi_attr_delete_(int* comm, int* keyval, int* ierr);
400 void mpi_attr_put_(int* comm, int* keyval, int* attr_value, int* ierr);
401 void mpi_rsend_init_(void* buf, int* count, int* datatype, int* dest, int* tag, int* comm, int* request, int* ierr);
402 void mpi_keyval_create_(void* copy_fn, void* delete_fn, int* keyval, void* extra_state, int* ierr);
403 void mpi_keyval_free_(int* keyval, int* ierr);
404 void mpi_test_cancelled_(MPI_Status* status, int* flag, int* ierr);
405 void mpi_pack_(void* inbuf, int* incount, int* type, void* outbuf, int* outcount, int* position, int* comm, int* ierr);
406 void mpi_get_elements_(MPI_Status* status, int* datatype, int* elements, int* ierr);
407 void mpi_dims_create_(int* nnodes, int* ndims, int* dims, int* ierr);
// Same as mpi_probe_ plus an int* flag output before status.
408 void mpi_iprobe_(int* source, int* tag, int* comm, int* flag, MPI_Status* status, int* ierr);
409 void mpi_type_get_envelope_(int* datatype, int* num_integers, int* num_addresses, int* num_datatypes, int* combiner,
410                             int* ierr);
411 void mpi_type_get_contents_(int* datatype, int* max_integers, int* max_addresses, int* max_datatypes,
412                             int* array_of_integers, MPI_Aint* array_of_addresses, int* array_of_datatypes, int* ierr);
413 void mpi_type_create_darray_(int* size, int* rank, int* ndims, int* array_of_gsizes, int* array_of_distribs,
414                              int* array_of_dargs, int* array_of_psizes, int* order, int* oldtype, int* newtype,
415                              int* ierr);
416 void mpi_type_create_resized_(int* oldtype, MPI_Aint* lb, MPI_Aint* extent, int* newtype, int* ierr);
417 void mpi_type_create_subarray_(int* ndims, int* array_of_sizes, int* array_of_subsizes, int* array_of_starts,
418                                int* order, int* oldtype, int* newtype, int* ierr);
419 void mpi_type_match_size_(int* typeclass, int* size, int* datatype, int* ierr);
420 void mpi_comm_set_name_(int* comm, char* name, int* ierr);
421 void mpi_comm_dup_with_info_(int* comm, int* info, int* newcomm, int* ierr);
422 void mpi_comm_split_type_(int* comm, int* split_type, int* key, int* info, int* newcomm, int* ierr);
423 void mpi_comm_set_info_(int* comm, int* info, int* ierr);
424 void mpi_comm_get_info_(int* comm, int* info, int* ierr);
425 void mpi_info_get_(int* info, char* key, int* valuelen, char* value, int* flag, int* ierr, unsigned int keylen);
426 void mpi_comm_create_errhandler_(void* function, int* errhandler, int* ierr);
427 void mpi_add_error_class_(int* errorclass, int* ierr);
428 void mpi_add_error_code_(int* errorclass, int* errorcode, int* ierr);
429 void mpi_add_error_string_(int* errorcode, char* string, int* ierr);
430 void mpi_comm_call_errhandler_(int* comm, int* errorcode, int* ierr);
431 void mpi_info_dup_(int* info, int* newinfo, int* ierr);
432 void mpi_info_get_valuelen_(int* info, char* key, int* valuelen, int* flag, int* ierr, unsigned int keylen);
433 void mpi_info_delete_(int* info, char* key, int* ierr, unsigned int keylen);
434 void mpi_info_get_nkeys_(int* info, int* nkeys, int* ierr);
435 void mpi_info_get_nthkey_(int* info, int* n, char* key, int* ierr, unsigned int keylen);
436 void mpi_get_version_(int* version, int* subversion, int* ierr);
437 void mpi_get_library_version_(char* version, int* len, int* ierr);
/* Request and status declarations. Requests are passed as int* handles while statuses are passed as MPI_Status*.
 * The three generalized-request callbacks and the extra state are all received as untyped void*. */
438 void mpi_request_get_status_(int* request, int* flag, MPI_Status* status, int* ierr);
439 void mpi_grequest_start_(void* query_fn, void* free_fn, void* cancel_fn, void* extra_state, int* request, int* ierr);
440 void mpi_grequest_complete_(int* request, int* ierr);
441 void mpi_status_set_cancelled_(MPI_Status* status, int* flag, int* ierr);
442 void mpi_status_set_elements_(MPI_Status* status, int* datatype, int* count, int* ierr);
/* Connect/accept, name publishing, port and process-spawning declarations.
 * NOTE(review): the char* parameters here (port_name, service_name, command, argv, array_of_commands) carry no
 * accompanying length argument, unlike the `keylen` of the mpi_info_* declarations -- confirm this is intended. */
443 void mpi_comm_connect_(char* port_name, int* info, int* root, int* comm, int* newcomm, int* ierr);
444 void mpi_publish_name_(char* service_name, int* info, char* port_name, int* ierr);
445 void mpi_unpublish_name_(char* service_name, int* info, char* port_name, int* ierr);
446 void mpi_lookup_name_(char* service_name, int* info, char* port_name, int* ierr);
447 void mpi_comm_join_(int* fd, int* intercomm, int* ierr);
448 void mpi_open_port_(int* info, char* port_name, int* ierr);
449 void mpi_close_port_(char* port_name, int* ierr);
450 void mpi_comm_accept_(char* port_name, int* info, int* root, int* comm, int* newcomm, int* ierr);
/* Note the differing argument-vector types: a flat char* here, a char** in the _multiple_ variant below. */
451 void mpi_comm_spawn_(char* command, char* argv, int* maxprocs, int* info, int* root, int* comm, int* intercomm,
452                      int* array_of_errcodes, int* ierr);
453 void mpi_comm_spawn_multiple_(int* count, char* array_of_commands, char** array_of_argv, int* array_of_maxprocs,
454                               int* array_of_info, int* root, int* comm, int* intercomm, int* array_of_errcodes,
455                               int* ierr);
456 void mpi_comm_get_parent_(int* parent, int* ierr);
/* File declarations. File handles are passed as int* (named `file` or `fh`); the view offset is a
 * `long long int*`; read/write take an untyped buffer plus count, datatype handle and an MPI_Status*. */
457 void mpi_file_close_(int* file, int* ierr);
458 void mpi_file_delete_(char* filename, int* info, int* ierr);
459 void mpi_file_open_(int* comm, char* filename, int* amode, int* info, int* fh, int* ierr);
460 void mpi_file_set_view_(int* fh, long long int* offset, int* etype, int* filetype, char* datarep, int* info, int* ierr);
461 void mpi_file_read_(int* fh, void* buf, int* count, int* datatype, MPI_Status* status, int* ierr);
462 void mpi_file_write_(int* fh, void* buf, int* count, int* datatype, MPI_Status* status, int* ierr);
/* SMPI-specific declarations. smpi_init_fortran_types() takes no argument; judging by its name it sets up the
 * Fortran datatypes -- confirm in the implementation. */
463 void smpi_init_fortran_types();
/* Trailing-underscore variants taking their double argument by address and, unlike the mpi_*_ declarations,
 * having no ierr parameter. Presumably they forward to the C smpi_execute* API -- TODO confirm. */
464 void smpi_execute_flops_(double* flops);
465 void smpi_execute_flops_benched_(double* flops);
466 void smpi_execute_(double* duration);
467 void smpi_execute_benched_(double* duration);
468 } // extern "C"
469
/** Returns an int; presumably a file descriptor for a temporary shared-memory object -- TODO confirm. */
470 XBT_PRIVATE int smpi_temp_shm_get();
/** Takes a file descriptor and a size in bytes and returns a pointer; presumably the address at which the
 *  descriptor got mapped -- TODO confirm, including how failure is reported. */
471 XBT_PRIVATE void* smpi_temp_shm_mmap(int fd, size_t size);
472
/** Describes one privatization region by an address and a file descriptor. How the two relate is not visible in
 *  this header; presumably the descriptor backs the memory found at `address` -- confirm. */
473 struct s_smpi_privatization_region_t {
474   void* address;
475   int file_descriptor;
476 };
/** Pointer alias: a smpi_privatization_region_t is a pointer to s_smpi_privatization_region_t. */
477 typedef s_smpi_privatization_region_t* smpi_privatization_region_t;
478
/** Defined in another translation unit. Presumably identifies the process whose privatized segment is currently
 *  loaded -- TODO confirm the meaning and the sentinel value, if any. */
479 extern XBT_PRIVATE int smpi_loaded_page;
/** Returns a pointer to a privatization region descriptor. Ownership of the returned object is not visible here. */
480 XBT_PRIVATE smpi_privatization_region_t smpi_init_global_memory_segment_process();
481
482 /**
483  * Get the address of the beginning of the memory page where addr is located.
484  * Note that we use an integer division here, so (a/b)*b is not a, unless a%b == 0
485  *
486  * This is used when privatizing.
 *
 * The address is converted to unsigned long, rounded down to a multiple of xbt_pagesize, and converted back to
 * void*. xbt_pagesize is not declared in this part of the header and must be visible wherever the macro is used.
 *
 * NOTE(review): unsigned long is narrower than a pointer on LLP64 targets (e.g. 64-bit Windows), which would
 * truncate the address; uintptr_t would be the portable choice -- confirm which platforms are supported.
 * NOTE(review): the expansion is a cast expression without enclosing parentheses, so prefer using it as a whole
 * operand rather than inside a larger expression.
487  */
488 #define TOPAGE(addr) (void*)(((unsigned long)(addr) / xbt_pagesize) * xbt_pagesize)
489
490 /** Used only if PAPI is compiled in, but integrated anyway so that this file does not depend on internal_config.h (to speed builds) */
/* A list of (counter name, counter value) pairs.
 * NOTE(review): std::string and std::map are used below, but the include list at the top of this header only names
 * <unordered_map> and <vector> directly; <string>/<map> presumably arrive transitively -- consider including them. */
491 typedef std::vector<std::pair</* counter name */ std::string, /* counter value */ long long>> papi_counter_t;
/* Per-entry PAPI data: the counters plus an integer event set (presumably a PAPI event-set handle -- confirm). */
492 struct papi_process_data {
493   papi_counter_t counter_data;
494   int event_set;
495 };
/* Defined elsewhere; maps a computation unit name to its PAPI data. */
496 extern std::map</* computation unit name */ std::string, papi_process_data> units2papi_setup;
497
/** Defined elsewhere; maps a string key to a double. Judging by the name, the key is a code location and the value
 *  a speedup factor -- TODO confirm the key format and how the factor is applied. */
498 extern std::unordered_map<std::string, double> location2speedup;
499
500 /** @brief Returns the last call location (filename, linenumber). Process-specific.
 *
 *  The result is handed out as a pointer to smpi_trace_call_location_t. Unlike the XBT_PRIVATE declarations around
 *  it, this function is declared XBT_PUBLIC. */
501 XBT_PUBLIC smpi_trace_call_location_t* smpi_trace_get_call_location();
502
/** Takes an amount of flops by value and returns nothing. Presumably executes (simulates) that much computation
 *  for the calling process -- TODO confirm in the implementation. */
503 XBT_PRIVATE void private_execute_flops(double flops);
504
505
/**
 * Argument-validation primitive used by the CHECK_* macros below.
 *
 * When `test` evaluates to true, the enclosing function returns `errcode`. Before returning, a warning built from
 * the variadic arguments (format string first) is emitted through XBT_WARN, unless `errcode` equals MPI_SUCCESS.
 *
 * Usage constraints that follow from the expansion:
 *  - it contains a `return`, so it is only usable inside a function whose return type accepts `errcode`;
 *  - it expands to a bare `if (...) { ... }` statement (no do/while(0) wrapper), so it must not be placed directly
 *    in front of an `else`;
 *  - `errcode` is expanded twice, so it should be free of side effects.
 */
506 #define CHECK_ARGS(test, errcode, ...)                                                                                 \
507   if (test) {                                                                                                          \
508     if((errcode) != MPI_SUCCESS)                                                                                       \
509       XBT_WARN(__VA_ARGS__);                                                                                           \
510     return (errcode);                                                                                                  \
511   }
512
/** Returns `err` from the enclosing function when `ptr` equals the null handle `val`. `num` is the parameter index
 *  shown in the warning, next to the source spelling of `ptr` and `val`. The definition already ends with ';'. */
513 #define CHECK_MPI_NULL(num, val, err, ptr)                                                                             \
514   CHECK_ARGS((ptr) == (val), (err),                                                                                    \
515              "%s: param %d %s cannot be %s", __func__, (num), _XBT_STRINGIFY(ptr), _XBT_STRINGIFY(val));
/** Returns `err` from the enclosing function when `buf` is nullptr. */
516 #define CHECK_NULL(num,err,buf)                                                                                        \
517   CHECK_ARGS((buf) == nullptr, (err),                                                                                  \
518              "%s: param %d %s cannot be NULL", __func__, (num), _XBT_STRINGIFY(buf));
/** Returns `err` from the enclosing function when `val` is strictly below zero. */
519 #define CHECK_NEGATIVE(num, err, val)                                                                                  \
520   CHECK_ARGS((val) < 0, (err),                                                                                         \
521              "%s: param %d %s cannot be negative", __func__, (num), _XBT_STRINGIFY(val));
/** Returns MPI_ERR_COMM from the enclosing function when `comm` equals MPI_COMM_NULL. */
522 #define CHECK_COMM2(num, comm)                                                                                         \
523   CHECK_MPI_NULL((num), MPI_COMM_NULL, MPI_ERR_COMM, (comm))
/** Same as CHECK_COMM2, applied to a variable literally named `comm` that must exist at the point of use. */
524 #define CHECK_COMM(num)                                                                                                \
525   CHECK_COMM2((num), comm)
/** Returns MPI_ERR_REQUEST when the variable literally named `request` (taken from the scope of use, not a macro
 *  argument) is nullptr. */
526 #define CHECK_REQUEST(num)                                                                                             \
527   CHECK_ARGS(request == nullptr, MPI_ERR_REQUEST,                                                                      \
528              "%s: param %d request cannot be NULL",__func__, (num));
/** Returns MPI_ERR_BUFFER when `buf` is nullptr while `count` is strictly positive; a null buffer together with a
 *  count of zero or less passes this check. */
529 #define CHECK_BUFFER(num,buf,count)                                                                                    \
530   CHECK_ARGS((buf) == nullptr && (count) > 0, MPI_ERR_BUFFER,                                                          \
531              "%s: param %d %s cannot be NULL if %s > 0",__func__, (num), _XBT_STRINGIFY(buf), _XBT_STRINGIFY(count));
/** Returns MPI_ERR_COUNT when `count` is negative. */
532 #define CHECK_COUNT(num, count)                                                                                        \
533   CHECK_NEGATIVE((num), MPI_ERR_COUNT, (count))
/** Returns MPI_ERR_TYPE when `datatype` equals MPI_DATATYPE_NULL or its is_valid() member returns false. The null
 *  comparison comes first, so is_valid() is not called on the null handle. `datatype` is expanded more than once. */
534 #define CHECK_TYPE(num, datatype)                                                                                      \
535   CHECK_ARGS(((datatype) == MPI_DATATYPE_NULL|| not (datatype)->is_valid()), MPI_ERR_TYPE,                             \
536              "%s: param %d %s cannot be MPI_DATATYPE_NULL or invalid", __func__, (num), _XBT_STRINGIFY(datatype));
/** Returns MPI_ERR_OP when the variable literally named `op` (taken from the scope of use) equals MPI_OP_NULL. */
537 #define CHECK_OP(num)                                                                                                  \
538     CHECK_MPI_NULL((num), MPI_OP_NULL, MPI_ERR_OP, op)
/** Returns MPI_ERR_ROOT unless 0 <= root < comm->size(). Both `root` and `comm` are variables taken from the scope
 *  of use, not macro arguments.
 *  NOTE(review): a root equal to the communicator size is rejected too, although the message says "larger than". */
539 #define CHECK_ROOT(num)\
540   CHECK_ARGS((root < 0 || root >= comm->size()), MPI_ERR_ROOT,                                                         \
541              "%s: param %d root (=%d) cannot be negative or larger than communicator size (=%d)", __func__, (num),     \
542              root, comm->size());
/** Early exit rather than an error: when `proc` equals MPI_PROC_NULL the enclosing function returns MPI_SUCCESS.
 *  No warning is printed in that case, because CHECK_ARGS only warns for codes other than MPI_SUCCESS. */
543 #define CHECK_PROC(num,proc)                                                                                           \
544     CHECK_MPI_NULL((num), MPI_PROC_NULL, MPI_SUCCESS, (proc))
/** Returns MPI_ERR_INFO when `info` equals MPI_INFO_NULL. */
545 #define CHECK_INFO(num,info)                                                                                           \
546     CHECK_MPI_NULL((num), MPI_INFO_NULL, MPI_ERR_INFO, (info))
/** Returns MPI_ERR_TAG when `tag` is negative, except that MPI_ANY_TAG is accepted. `tag` is expanded several
 *  times (test and message). */
547 #define CHECK_TAG(num,tag)                                                                                             \
548   CHECK_ARGS(((tag) < 0 && (tag) !=  MPI_ANY_TAG), MPI_ERR_TAG,                                                        \
549              "%s: param %d %s (=%d) cannot be negative", __func__, (num), _XBT_STRINGIFY(tag), (tag));
/** Returns MPI_ERR_FILE when `fh` equals MPI_FILE_NULL. */
550 #define CHECK_FILE(num, fh)                                                                                            \
551     CHECK_MPI_NULL((num), MPI_FILE_NULL, MPI_ERR_FILE, (fh))
/** Returns MPI_ERR_DISP when `offset` is negative. */
552 #define CHECK_OFFSET(num, offset)                                                                                      \
553   CHECK_NEGATIVE((num), MPI_ERR_DISP, (offset))
/** Returns MPI_ERR_GROUP when `group` equals MPI_GROUP_NULL. */
554 #define CHECK_GROUP(num, group)                                                                                        \
555       CHECK_MPI_NULL((num), MPI_GROUP_NULL, MPI_ERR_GROUP, (group))
/** Returns MPI_ERR_WIN when `win` equals MPI_WIN_NULL. */
556 #define CHECK_WIN(num, win)                                                                                            \
557       CHECK_MPI_NULL((num), MPI_WIN_NULL, MPI_ERR_WIN, (win))
/** Returns MPI_ERR_RANK unless 0 <= rank < (comm)->group()->size(). `rank` and `comm` are expanded several times
 *  (test and message), so they should be free of side effects.
 *  NOTE(review): the test uses >=, so a rank equal to the group size is rejected, while the message reads "> %d". */
558 #define CHECK_RANK(num, rank, comm)                                                                                    \
559         CHECK_ARGS(((rank) >= (comm)->group()->size() || (rank) <0), MPI_ERR_RANK,                                     \
560              "%s: param %d %s (=%d) cannot be < 0 or > %d", __func__, (num), _XBT_STRINGIFY(rank),                     \
561              (rank), (comm)->group()->size() );
562 #endif