2 /* pmm - parallel matrix multiplication "double diffusion" */
4 /* Copyright (c) 2006-2008 The SimGrid team. All rights reserved. */
6 /* This program is free software; you can redistribute it and/or modify it
7 * under the terms of the license (GNU LGPL) which comes with this package. */
10 #include "xbt/matrix.h"
11 #include "amok/peermanagement.h"
/* Side length of the square grid of slave processes. */
#define PROC_MATRIX_SIZE 3
/* Number of other processes sharing a grid line (or a grid row) with a
 * given process. Parenthesized so the expansion stays a single operand
 * when used inside a larger expression such as 2*NEIGHBOR_COUNT. */
#define NEIGHBOR_COUNT (PROC_MATRIX_SIZE - 1)
/* Total number of slave processes in the grid. */
#define SLAVE_COUNT (PROC_MATRIX_SIZE*PROC_MATRIX_SIZE)
/* Side length of the square data matrices A, B and C. */
#define DATA_MATRIX_SIZE 18
/* Side length of the square block handed to each slave. */
const int submatrix_size = DATA_MATRIX_SIZE/PROC_MATRIX_SIZE;
20 XBT_LOG_NEW_DEFAULT_CATEGORY(pmm,"Parallel Matrix Multiplication");
22 /* Payload of the "result" message: carries the block C computed by one
 * slave back to the master. The matrix elements are doubles (see the
 * GRAS_ANNOTE subtype). The master also reads linepos/rowpos from this
 * struct to place the block in the full result matrix. */
23 GRAS_DEFINE_TYPE(s_result,struct s_result {
26 xbt_matrix_t C GRAS_ANNOTE(subtype,double);
28 typedef struct s_result result_t;
30 /* Payload of the "pmm_slave" message sent by the master to each slave:
 *  - line[]: the NEIGHBOR_COUNT peers sharing the slave's grid line,
 *  - row[]:  the NEIGHBOR_COUNT peers sharing the slave's grid row,
 *    (the slave itself is excluded from both arrays by the master),
 *  - A, B:   the slave's blocks of the input matrices (double elements).
 * The master also fills linepos/rowpos with the slave's grid position. */
31 GRAS_DEFINE_TYPE(s_pmm_assignment,struct s_pmm_assignment {
34 xbt_peer_t line[NEIGHBOR_COUNT];
35 xbt_peer_t row[NEIGHBOR_COUNT];
36 xbt_matrix_t A GRAS_ANNOTE(subtype,double);
37 xbt_matrix_t B GRAS_ANNOTE(subtype,double);
39 typedef struct s_pmm_assignment s_pmm_assignment_t;
41 /* Register the messages which may be sent (common to client and server).
 * Declares four message types: "result", "pmm_slave", "dataA" and "dataB". */
42 static void register_messages(void) {
43 gras_datadesc_type_t result_type;
44 gras_datadesc_type_t pmm_assignment_type;
/* Publish the value of NEIGHBOR_COUNT under its name; presumably needed so
 * the array bounds written in s_pmm_assignment can be resolved when the
 * type description is built -- confirm against the GRAS documentation. */
46 gras_datadesc_set_const("NEIGHBOR_COUNT",NEIGHBOR_COUNT);
47 result_type=gras_datadesc_by_symbol(s_result);
48 pmm_assignment_type=gras_datadesc_by_symbol(s_pmm_assignment);
50 /* final result sent by a slave and received by the master */
51 gras_msgtype_declare("result", result_type);
53 /* sent from master to slave to assign a position and some data */
54 gras_msgtype_declare("pmm_slave", pmm_assignment_type);
56 /* data exchanged between slaves: each payload is a matrix of doubles */
57 gras_msgtype_declare("dataA", gras_datadesc_matrix(gras_datadesc_by_name("double"),NULL));
58 gras_msgtype_declare("dataB", gras_datadesc_matrix(gras_datadesc_by_name("double"),NULL));
61 /* Prototypes of the slave and master functions defined later in this file;
 * both take the usual (argc, argv) pair and return an int. */
62 int slave (int argc,char *argv[]);
63 int master (int argc,char *argv[]);
66 /* **********************************************************************
68 * **********************************************************************/
70 /* Global private data */
/* Master process.
 * Builds the full DATA_MATRIX_SIZE x DATA_MATRIX_SIZE matrices A, B and C,
 * opens a server socket on the port given in argv[1], creates the "pmm"
 * peer group and waits for slaves to join it. It then sends each of the
 * SLAVE_COUNT slaves a "pmm_slave" assignment (grid position, neighbors,
 * blocks of A and B), collects one "result" message per slave into C,
 * shuts the group down and closes its sockets. */
78 int master (int argc,char *argv[]) {
87 xbt_dynar_t peers; /* group of slaves */
88 xbt_peer_t grid[SLAVE_COUNT]; /* The slaves as an array */
89 gras_socket_t socket[SLAVE_COUNT]; /* sockets for broadcast to slaves */
91 /* Init the GRAS's infrastructure */
92 gras_init(&argc, argv);
96 /* Initialize data matrices */
97 A = xbt_matrix_double_new_id(DATA_MATRIX_SIZE,DATA_MATRIX_SIZE);
98 B = xbt_matrix_double_new_seq(DATA_MATRIX_SIZE,DATA_MATRIX_SIZE);
99 C = xbt_matrix_double_new_zeros(DATA_MATRIX_SIZE,DATA_MATRIX_SIZE);
101 /* Create the connections */
102 xbt_assert0(argc>1, "Usage: master <port>");
103 gras_socket_server(atoi(argv[1]));
104 peers=amok_pm_group_new("pmm");
106 /* friends, we're ready. Come and play */
107 INFO0("Wait for peers for 5 sec");
108 gras_msg_handleall(5);
109 INFO1("Got %ld pals",xbt_dynar_length(peers));
/* Copy at most SLAVE_COUNT joined peers into grid[] and open a client
 * socket to each of them. */
112 i<xbt_dynar_length(peers) && i<SLAVE_COUNT;
115 xbt_dynar_get_cpy(peers,i,&grid[i]);
116 socket[i]=gras_socket_client(grid[i]->name,grid[i]->port);
/* Fewer than SLAVE_COUNT peers leaves i short of SLAVE_COUNT: abort. */
118 xbt_assert2(i==SLAVE_COUNT,
119 "Not enough slaves for this setting (got %d of %d). Change the deployment file",
122 /* Kill surplus slaves: the loop header has no increment because each
 * iteration removes the element at index i from the dynar. */
123 for (i=SLAVE_COUNT; i<xbt_dynar_length(peers); ) {
126 xbt_dynar_remove_at(peers,i,&h);
127 INFO2("Too much slaves. Killing %s:%d", h->name, h->port);
128 amok_pm_kill_hp(h->name,h->port);
133 /* Assign job to slaves */
135 INFO0("XXXXXXXXXXXXXXXXXXXXXX begin Multiplication");
136 for(i=0 ; i<SLAVE_COUNT; i++){
137 s_pmm_assignment_t assignment;
140 assignment.linepos=line; // assigned line
141 assignment.rowpos=row; // assigned row
/* Neighbors sharing this slave's row index: walk every line j of the grid
 * at that row index, skipping slave i itself. */
144 for (j=0,k=0; j<PROC_MATRIX_SIZE; j++) {
145 if (i != j*PROC_MATRIX_SIZE+(row)) {
146 assignment.row[k] = grid[ j*PROC_MATRIX_SIZE+(row) ] ;
/* Neighbors sharing this slave's line index: walk every row j of the grid
 * on that line, skipping slave i itself. */
150 for (j=0,k=0; j<PROC_MATRIX_SIZE; j++) {
151 if (i != (line)*PROC_MATRIX_SIZE+j) {
152 assignment.line[k] = grid[ (line)*PROC_MATRIX_SIZE+j ] ;
/* Extract the submatrix_size x submatrix_size blocks of A and B located at
 * grid position (line,row). */
157 assignment.A=xbt_matrix_new_sub(A,
158 submatrix_size,submatrix_size,
159 submatrix_size*line,submatrix_size*row,
161 assignment.B=xbt_matrix_new_sub(B,
162 submatrix_size,submatrix_size,
163 submatrix_size*line,submatrix_size*row,
166 if (row >= PROC_MATRIX_SIZE) {
/* The blocks are freed right after the send; presumably the send has
 * serialized the payload by the time it returns -- confirm. */
171 gras_msg_send(socket[i],"pmm_slave",&assignment);
172 xbt_matrix_free(assignment.A);
173 xbt_matrix_free(assignment.B);
176 /* (have a rest while the slaves perform the multiplication) */
178 /* Retrieve the results: one "result" message per slave, copied into C at
 * the block position reported in the message. */
179 for( i=0;i< SLAVE_COUNT;i++){
180 gras_msg_wait(6000,"result",&from,&result);
181 VERB2("%d slaves are done already. Waiting for %d",i+1, SLAVE_COUNT);
182 xbt_matrix_copy_values(C,result.C, submatrix_size,submatrix_size,
183 submatrix_size*result.linepos,
184 submatrix_size*result.rowpos,
186 xbt_matrix_free(result.C);
/* Only dump the product when the matrix is small enough to be readable. */
190 if (DATA_MATRIX_SIZE < 30) {
191 INFO0 ("The Result of Multiplication is :");
192 xbt_matrix_dump(C,"C:res",0,xbt_matrix_dump_display_double);
194 INFO1("Matrix size too big (%d>30) to be displayed here",DATA_MATRIX_SIZE);
197 amok_pm_group_shutdown ("pmm"); /* Ok, we're out of here */
199 for(i=0; i<SLAVE_COUNT; i++) {
200 gras_socket_close(socket[i]);
208 } /* end_of_master */
210 /* **********************************************************************
212 * **********************************************************************/
/* Callback registered by slave() for the "pmm_slave" message.
 * ctx:     message context; the sender's socket is taken from it and used
 *          as the destination of the final "result" message.
 * payload: points to the received s_pmm_assignment_t.
 * Opens client sockets to the peers listed in the assignment, then runs
 * PROC_MATRIX_SIZE steps in which blocks are exchanged through "dataB" and
 * "dataA" messages and combined into bC, and finally sends a "result"
 * message back to the master. */
214 static int pmm_worker_cb(gras_msg_cb_ctx_t ctx, void *payload) {
215 /* Recover my initial data and my position */
216 s_pmm_assignment_t assignment = *(s_pmm_assignment_t*)payload;
217 gras_socket_t master = gras_msg_cb_ctx_from(ctx);
/* bA/bB: blocks of A and B used in the current step; bC: block of the
 * product, created zero-filled. */
222 xbt_matrix_t bA=xbt_matrix_new(submatrix_size,submatrix_size,
223 sizeof(double),NULL);
224 xbt_matrix_t bB=xbt_matrix_new(submatrix_size,submatrix_size,
225 sizeof(double),NULL);
228 xbt_matrix_t mydataA,mydataB;
229 xbt_matrix_t bC=xbt_matrix_double_new_zeros(submatrix_size,submatrix_size);
233 gras_socket_t from; /* to exchange data with my neighbor */
235 /* sockets for broadcast to other slaves */
236 gras_socket_t socket_line[PROC_MATRIX_SIZE-1];
237 gras_socket_t socket_row[PROC_MATRIX_SIZE-1];
238 memset(socket_line,0,sizeof(socket_line));
239 memset(socket_row,0,sizeof(socket_row));
243 gras_os_sleep(1); /* wait for my pals */
245 myline = assignment.linepos;
246 myrow = assignment.rowpos;
247 mydataA = assignment.A;
248 mydataB = assignment.B;
250 INFO2("Receive my pos (%d,%d) and assignment",myline,myrow);
252 /* Get my neighborhood from the assignment message (skipping myself).
 * Each peer descriptor is freed as soon as its socket has been opened. */
253 for (i=0 ; i<PROC_MATRIX_SIZE-1 ; i++){
254 socket_line[i]=gras_socket_client(assignment.line[i]->name,
255 assignment.line[i]->port);
256 xbt_peer_free(assignment.line[i]);
258 for (i=0 ; i<PROC_MATRIX_SIZE-1 ; i++){
259 socket_row[i]=gras_socket_client(assignment.row[i]->name,
260 assignment.row[i]->port);
261 xbt_peer_free(assignment.row[i]);
264 for (step=0; step<PROC_MATRIX_SIZE;step++) {
266 /* a line broadcast: my block of B goes out through socket_row[], i.e.
 * to the peers the master listed in assignment.row */
268 INFO2("LINE: step(%d) = Myline(%d). Broadcast my data.",
270 for (l=0;l < PROC_MATRIX_SIZE-1 ;l++) {
271 INFO1("LINE: Send to %s",
272 gras_socket_peer_name(socket_row[l]));
273 gras_msg_send(socket_row[l], "dataB", &mydataB);
278 bB = xbt_matrix_new_sub(mydataB,
279 submatrix_size,submatrix_size,
284 gras_msg_wait(600,"dataB",&from,&bB);
286 RETHROW0("Can't get a data message from line : %s");
288 INFO3("LINE: step(%d) <> Myline(%d). Receive data from %s",step,myline,
289 gras_socket_peer_name(from));
/* a row broadcast: my block of A goes out through socket_line[]; the loop
 * runs l from 1 and indexes with l-1, covering the same PROC_MATRIX_SIZE-1
 * sockets as a 0-based loop */
294 INFO2("ROW: step(%d)=myrow(%d). Broadcast my data.",step,myrow);
295 for (l=1;l < PROC_MATRIX_SIZE ; l++) {
296 INFO1("ROW: Send to %s",
297 gras_socket_peer_name(socket_line[l-1]));
298 gras_msg_send(socket_line[l-1],"dataA", &mydataA);
301 bA = xbt_matrix_new_sub(mydataA,
302 submatrix_size,submatrix_size,
307 gras_msg_wait(1200,"dataA", &from,&bA);
309 RETHROW0("Can't get a data message from row : %s");
311 INFO3("ROW: step(%d)<>myrow(%d). Receive data from %s",step,myrow,
312 gras_socket_peer_name(from));
/* presumably accumulates the product bA*bB into bC -- confirm against
 * the xbt_matrix_double_addmult documentation */
314 xbt_matrix_double_addmult(bA,bB,bC);
318 /* send Result to master */
320 result.linepos=myline;
324 gras_msg_send(master, "result",&result);
326 RETHROW0("Failed to send answer to server: %s");
328 INFO2(">>>>>>>> Result sent to %s:%d <<<<<<<<",
329 gras_socket_peer_name(master),gras_socket_peer_port(master));
330 /* Free the allocated resources, and shut GRAS down */
336 xbt_matrix_free(mydataA);
337 xbt_matrix_free(mydataB);
338 /* FIXME: some are said to be unknown
339 gras_socket_close(master);
340 gras_socket_close(from);
341 for (l=0; l < PROC_MATRIX_SIZE-1; l++) {
343 gras_socket_close(socket_line[l]);
345 gras_socket_close(socket_row[l]);
351 int slave(int argc,char *argv[]) {
352 gras_socket_t mysock;
353 gras_socket_t master = NULL;
357 /* Init the GRAS's infrastructure */
358 gras_init(&argc, argv);
360 if (argc != 3 && argc !=2)
361 xbt_die("Usage: slave masterhost:masterport [rank]");
365 rank = atoi(argv[2]);
367 /* Register the known messages and my callback */
369 gras_cb_register("pmm_slave",pmm_worker_cb);
371 /* Create the connexions */
372 mysock = gras_socket_server_range(3000,9999,0,0);
373 INFO1("Sensor %d starting",rank);
377 master = gras_socket_client_from_string(argv[1]);
380 if (e.category != system_error)
387 /* Join and run the group */
388 amok_pm_group_join(master,"pmm",rank);
389 amok_pm_mainloop(600);
392 gras_socket_close(mysock);
393 // gras_socket_close(master); Unknown