Logo AND Algorithmique Numérique Distribuée

Public GIT Repository
ONGOING work on exceptions plus minor cleanups.
[simgrid.git] / src / surf / workstation.c
1 /*      $Id$     */
2
3 /* Copyright (c) 2004 Arnaud Legrand. All rights reserved.                  */
4
5 /* This program is free software; you can redistribute it and/or modify it
6  * under the terms of the license (GNU LGPL) which comes with this package. */
7
8 #include "xbt/ex.h"
9 #include "xbt/dict.h"
10 #include "workstation_private.h"
11 #include "cpu_private.h"
12 #include "network_private.h"
13
14 XBT_LOG_NEW_DEFAULT_SUBCATEGORY(workstation, surf,
15                                 "Logging specific to the SURF workstation module");
16
17 surf_workstation_resource_t surf_workstation_resource = NULL;
18
19 xbt_dict_t workstation_set = NULL;
20
21 static workstation_CLM03_t workstation_new(const char *name,
22                                      void *cpu, void *card)
23 {
24   workstation_CLM03_t workstation = xbt_new0(s_workstation_CLM03_t, 1);
25
26   workstation->resource = (surf_resource_t) surf_workstation_resource;
27   workstation->name = xbt_strdup(name);
28   workstation->cpu = cpu;
29   workstation->network_card = card;
30
31   return workstation;
32 }
33
34 static void workstation_free(void *workstation)
35 {
36   free(((workstation_CLM03_t)workstation)->name);
37   free(workstation);
38 }
39
40 static void create_workstations(void)
41 {
42   xbt_dict_cursor_t cursor = NULL;
43   char *name = NULL;
44   void *cpu = NULL;
45   void *nw_card = NULL;
46
47   xbt_dict_foreach(cpu_set, cursor, name, cpu) {
48     nw_card = xbt_dict_get_or_null(network_card_set, name);
49     xbt_assert1(nw_card,
50                 "No corresponding card found for %s",name);
51
52     xbt_dict_set(workstation_set, name,
53                  workstation_new(name, cpu, nw_card), workstation_free);
54   }
55 }
56
57 static void *name_service(const char *name)
58 {
59   return xbt_dict_get_or_null(workstation_set, name);
60 }
61
62 static const char *get_resource_name(void *resource_id)
63 {
64   return ((workstation_CLM03_t) resource_id)->name;
65 }
66
/* Installed as the resource_used callback, but not expected to be called:
 * it asserts unconditionally. The trailing return only provides a value
 * for the int return type. */
static int resource_used(void *resource_id)
{
  xbt_assert0(0, "Workstation is a virtual resource. I should not be there!");

  return 0;
}
73
74 static int parallel_action_free(surf_action_t action)
75 {
76   action->using--;
77   if(!action->using) {
78     xbt_swag_remove(action, action->state_set);
79     if(((surf_action_parallel_task_CSL05_t)action)->variable)
80       lmm_variable_free(maxmin_system, ((surf_action_parallel_task_CSL05_t)action)->variable);
81     free(action);
82     return 1;
83   }
84   return 0;
85 }
86
87 static void parallel_action_use(surf_action_t action)
88 {
89   action->using++;
90 }
91
92 static int action_free(surf_action_t action)
93 {
94   if(action->resource_type==(surf_resource_t)surf_network_resource) 
95     return surf_network_resource->common_public->action_free(action);
96   else if(action->resource_type==(surf_resource_t)surf_cpu_resource) 
97     return surf_cpu_resource->common_public->action_free(action);
98   else if(action->resource_type==(surf_resource_t)surf_workstation_resource)
99     return parallel_action_free(action);
100   else DIE_IMPOSSIBLE;
101   return 0;
102 }
103
104 static void action_use(surf_action_t action)
105 {
106   if(action->resource_type==(surf_resource_t)surf_network_resource) 
107     surf_network_resource->common_public->action_use(action);
108   else if(action->resource_type==(surf_resource_t)surf_cpu_resource) 
109     surf_cpu_resource->common_public->action_use(action);
110   else if(action->resource_type==(surf_resource_t)surf_workstation_resource)
111     return parallel_action_use(action);
112   else DIE_IMPOSSIBLE;
113   return;
114 }
115
116 static void action_cancel(surf_action_t action)
117 {
118   if(action->resource_type==(surf_resource_t)surf_network_resource) 
119     surf_network_resource->common_public->action_cancel(action);
120   else if(action->resource_type==(surf_resource_t)surf_cpu_resource) 
121     surf_cpu_resource->common_public->action_cancel(action);
122   else if(action->resource_type==(surf_resource_t)surf_workstation_resource)
123     return parallel_action_use(action);
124   else DIE_IMPOSSIBLE;
125   return;
126 }
127
128 static void action_recycle(surf_action_t action)
129 {
130   DIE_IMPOSSIBLE;
131   return;
132 }
133
134 static void action_change_state(surf_action_t action,
135                                 e_surf_action_state_t state)
136 {
137   if(action->resource_type==(surf_resource_t)surf_network_resource) 
138     surf_network_resource->common_public->action_change_state(action,state);
139   else if(action->resource_type==(surf_resource_t)surf_cpu_resource) 
140     surf_cpu_resource->common_public->action_change_state(action,state);
141   else if(action->resource_type==(surf_resource_t)surf_workstation_resource)
142     surf_action_change_state(action, state);
143   else DIE_IMPOSSIBLE;
144   return;
145 }
146
147 static double share_resources(double now)
148 {
149   s_surf_action_parallel_task_CSL05_t action;
150   return generic_maxmin_share_resources(surf_workstation_resource->common_public->
151                                         states.running_action_set,
152                                         xbt_swag_offset(action, variable));
153 }
154
155 static void update_actions_state(double now, double delta)
156 {
157   surf_action_parallel_task_CSL05_t action = NULL;
158   surf_action_parallel_task_CSL05_t next_action = NULL;
159   xbt_swag_t running_actions =
160       surf_workstation_resource->common_public->states.running_action_set;
161   /* FIXME: unused
162   xbt_swag_t failed_actions =
163       surf_workstation_resource->common_public->states.failed_action_set;
164   */
165
166   xbt_swag_foreach_safe(action, next_action, running_actions) {
167     surf_double_update(&(action->generic_action.remains),
168         lmm_variable_getvalue(action->variable) * delta);
169     if (action->generic_action.max_duration != NO_MAX_DURATION)
170       surf_double_update(&(action->generic_action.max_duration), delta);
171     if ((action->generic_action.remains <= 0) && 
172         (lmm_get_variable_weight(action->variable)>0)) {
173       action->generic_action.finish = surf_get_clock();
174       action_change_state((surf_action_t) action, SURF_ACTION_DONE);
175     } else if ((action->generic_action.max_duration != NO_MAX_DURATION) &&
176                (action->generic_action.max_duration <= 0)) {
177       action->generic_action.finish = surf_get_clock();
178       action_change_state((surf_action_t) action, SURF_ACTION_DONE);
179     } else {                    /* Need to check that none of the resource has failed */
180       lmm_constraint_t cnst = NULL;
181       int i = 0;
182       surf_resource_t resource = NULL;
183
184       while ((cnst =
185               lmm_get_cnst_from_var(maxmin_system, action->variable,
186                                     i++))) {
187         resource = (surf_resource_t) lmm_constraint_id(cnst);
188         if(resource== (surf_resource_t) surf_cpu_resource) {
189           cpu_Cas01_t cpu = lmm_constraint_id(cnst);
190           if (cpu->state_current == SURF_CPU_OFF) {
191             action->generic_action.finish = surf_get_clock();
192             action_change_state((surf_action_t) action, SURF_ACTION_FAILED);
193             break;
194           }
195         } else if (resource== (surf_resource_t) surf_network_resource) {
196           network_link_CM02_t nw_link = lmm_constraint_id(cnst);
197
198           if (nw_link->state_current == SURF_NETWORK_LINK_OFF) {
199             action->generic_action.finish = surf_get_clock();
200             action_change_state((surf_action_t) action, SURF_ACTION_FAILED);
201             break;
202           }
203         } 
204       }
205     }
206   }
207
208   return;
209 }
210
211 static void update_resource_state(void *id,
212                                   tmgr_trace_event_t event_type,
213                                   double value)
214 {
215   return;
216 }
217
218 static surf_action_t execute(void *workstation, double size)
219 {
220   return surf_cpu_resource->extension_public->
221       execute(((workstation_CLM03_t) workstation)->cpu, size);
222 }
223
224 static surf_action_t action_sleep(void *workstation, double duration)
225 {
226   return surf_cpu_resource->extension_public->
227       sleep(((workstation_CLM03_t) workstation)->cpu, duration);
228 }
229
230 static void action_suspend(surf_action_t action)
231 {
232   if(action->resource_type==(surf_resource_t)surf_network_resource) 
233     surf_network_resource->common_public->suspend(action);
234   else if(action->resource_type==(surf_resource_t)surf_cpu_resource) 
235     surf_cpu_resource->common_public->suspend(action);
236   else DIE_IMPOSSIBLE;
237 }
238
239 static void action_resume(surf_action_t action)
240 {
241   if(action->resource_type==(surf_resource_t)surf_network_resource)
242     surf_network_resource->common_public->resume(action);
243   else if(action->resource_type==(surf_resource_t)surf_cpu_resource)
244     surf_cpu_resource->common_public->resume(action);
245   else DIE_IMPOSSIBLE;
246 }
247
248 static int action_is_suspended(surf_action_t action)
249 {
250   if(action->resource_type==(surf_resource_t)surf_network_resource) 
251     return surf_network_resource->common_public->is_suspended(action);
252   if(action->resource_type==(surf_resource_t)surf_cpu_resource) 
253     return surf_cpu_resource->common_public->is_suspended(action);
254   DIE_IMPOSSIBLE;
255 }
256
257 static void action_set_max_duration(surf_action_t action, double duration)
258 {
259   if(action->resource_type==(surf_resource_t)surf_network_resource)
260     surf_network_resource->common_public->set_max_duration(action,duration);
261   else if(action->resource_type==(surf_resource_t)surf_cpu_resource) 
262     surf_cpu_resource->common_public->set_max_duration(action,duration);
263   else  DIE_IMPOSSIBLE;
264 }
265
266 static surf_action_t communicate(void *workstation_src,
267                                  void *workstation_dst, double size,
268                                  double rate)
269 {
270   return surf_network_resource->extension_public->
271       communicate(((workstation_CLM03_t) workstation_src)->network_card,
272                   ((workstation_CLM03_t) workstation_dst)->network_card, size, rate);
273 }
274
275 static e_surf_cpu_state_t get_state(void *workstation)
276 {
277   return surf_cpu_resource->extension_public->
278       get_state(((workstation_CLM03_t) workstation)->cpu);
279 }
280
281 static double get_speed(void *workstation, double load)
282 {
283   return surf_cpu_resource->extension_public->
284       get_speed(((workstation_CLM03_t) workstation)->cpu, load);
285 }
286
287 static surf_action_t execute_parallel_task (int workstation_nb,
288                                             void **workstation_list,
289                                             double *computation_amount,
290                                             double *communication_amount,
291                                             double amount,
292                                             double rate)
293 {
294   surf_action_parallel_task_CSL05_t action = NULL;
295   int i, j, k;
296   xbt_dict_t network_link_set = xbt_dict_new();
297   xbt_dict_cursor_t cursor = NULL;
298   char *name = NULL;
299   int nb_link = 0;
300   int nb_host = 0;
301   network_link_CM02_t link;
302
303   /* Compute the number of affected resources... */
304   for(i=0; i< workstation_nb; i++) {
305     for(j=0; j< workstation_nb; j++) {
306       network_card_CM02_t card_src = ((workstation_CLM03_t*)workstation_list)[i]->network_card;
307       network_card_CM02_t card_dst = ((workstation_CLM03_t*)workstation_list)[j]->network_card;
308       int route_size = ROUTE_SIZE(card_src->id, card_dst->id);
309       network_link_CM02_t *route = ROUTE(card_src->id, card_dst->id);
310       
311       if(communication_amount[i*workstation_nb+j]>0)
312         for(k=0; k< route_size; k++) {
313           xbt_dict_set(network_link_set, route[k]->name, route[k], NULL);
314         }
315     }
316   }
317
318   xbt_dict_foreach(network_link_set, cursor, name, link) {
319     nb_link++;
320   }
321
322   xbt_dict_free(&network_link_set);
323
324   for (i = 0; i<workstation_nb; i++)
325     if(computation_amount[i]>0) nb_host++;
326  
327   if(nb_link + workstation_nb == 0)
328     return NULL;
329
330   action = xbt_new0(s_surf_action_parallel_task_CSL05_t, 1);
331   action->generic_action.using = 1;
332   action->generic_action.cost = amount;
333   action->generic_action.remains = amount;
334   action->generic_action.max_duration = NO_MAX_DURATION;
335   action->generic_action.start = -1.0;
336   action->generic_action.finish = -1.0;
337   action->generic_action.resource_type =
338       (surf_resource_t) surf_workstation_resource;
339   action->suspended = 0;  /* Should be useless because of the
340                              calloc but it seems to help valgrind... */
341   action->generic_action.state_set =
342       surf_workstation_resource->common_public->states.running_action_set;
343
344   xbt_swag_insert(action, action->generic_action.state_set);
345   action->rate = rate;
346
347   if(action->rate>0)
348     action->variable = lmm_variable_new(maxmin_system, action, 1.0, -1.0,
349                                         nb_host + nb_link);
350   else   
351     action->variable = lmm_variable_new(maxmin_system, action, 1.0, action->rate,
352                                         nb_host + nb_link);
353
354   for (i = 0; i<workstation_nb; i++)
355     if(computation_amount[i]>0)
356       lmm_expand(maxmin_system, ((cpu_Cas01_t) ((workstation_CLM03_t) workstation_list[i])->cpu)->constraint, 
357                  action->variable, computation_amount[i]);
358
359   for (i=0; i<workstation_nb; i++) {
360     for(j=0; j< workstation_nb; j++) {
361       network_card_CM02_t card_src = ((workstation_CLM03_t*)workstation_list)[i]->network_card;
362       network_card_CM02_t card_dst = ((workstation_CLM03_t*)workstation_list)[j]->network_card;
363       int route_size = ROUTE_SIZE(card_src->id, card_dst->id);
364       network_link_CM02_t *route = ROUTE(card_src->id, card_dst->id);
365       
366       for(k=0; k< route_size; k++) {
367         if(communication_amount[i*workstation_nb+j]>0) {
368           lmm_expand_add(maxmin_system, route[k]->constraint, 
369                        action->variable, communication_amount[i*workstation_nb+j]);
370         }
371       }
372     }
373   }
374   
375   return (surf_action_t) action;
376 }
377
378 static void finalize(void)
379 {
380   xbt_dict_free(&workstation_set);
381   xbt_swag_free(surf_workstation_resource->common_public->states.ready_action_set);
382   xbt_swag_free(surf_workstation_resource->common_public->states.
383                 running_action_set);
384   xbt_swag_free(surf_workstation_resource->common_public->states.
385                 failed_action_set);
386   xbt_swag_free(surf_workstation_resource->common_public->states.done_action_set);
387
388   free(surf_workstation_resource->common_public);
389   free(surf_workstation_resource->common_private);
390   free(surf_workstation_resource->extension_public);
391
392   free(surf_workstation_resource);
393   surf_workstation_resource = NULL;
394 }
395
396 static void surf_workstation_resource_init_internal(void)
397 {
398   s_surf_action_t action;
399
400   surf_workstation_resource = xbt_new0(s_surf_workstation_resource_t, 1);
401
402   surf_workstation_resource->common_private =
403       xbt_new0(s_surf_resource_private_t, 1);
404   surf_workstation_resource->common_public =
405       xbt_new0(s_surf_resource_public_t, 1);
406 /*   surf_workstation_resource->extension_private = xbt_new0(s_surf_workstation_resource_extension_private_t,1); */
407   surf_workstation_resource->extension_public =
408       xbt_new0(s_surf_workstation_resource_extension_public_t, 1);
409
410   surf_workstation_resource->common_public->states.ready_action_set =
411       xbt_swag_new(xbt_swag_offset(action, state_hookup));
412   surf_workstation_resource->common_public->states.running_action_set =
413       xbt_swag_new(xbt_swag_offset(action, state_hookup));
414   surf_workstation_resource->common_public->states.failed_action_set =
415       xbt_swag_new(xbt_swag_offset(action, state_hookup));
416   surf_workstation_resource->common_public->states.done_action_set =
417       xbt_swag_new(xbt_swag_offset(action, state_hookup));
418
419   surf_workstation_resource->common_public->name_service = name_service;
420   surf_workstation_resource->common_public->get_resource_name =
421       get_resource_name;
422   surf_workstation_resource->common_public->action_get_state =
423       surf_action_get_state;
424   surf_workstation_resource->common_public->action_free = action_free;
425   surf_workstation_resource->common_public->action_use = action_use;
426   surf_workstation_resource->common_public->action_cancel = action_cancel;
427   surf_workstation_resource->common_public->action_recycle =
428       action_recycle;
429   surf_workstation_resource->common_public->action_change_state =
430       action_change_state;
431   surf_workstation_resource->common_public->action_set_data = surf_action_set_data;
432   surf_workstation_resource->common_public->name = "Workstation";
433
434   surf_workstation_resource->common_private->resource_used = resource_used;
435   surf_workstation_resource->common_private->share_resources =
436       share_resources;
437   surf_workstation_resource->common_private->update_actions_state =
438       update_actions_state;
439   surf_workstation_resource->common_private->update_resource_state =
440       update_resource_state;
441   surf_workstation_resource->common_private->finalize = finalize;
442
443   surf_workstation_resource->common_public->suspend = action_suspend;
444   surf_workstation_resource->common_public->resume = action_resume;
445   surf_workstation_resource->common_public->is_suspended = action_is_suspended;
446   surf_workstation_resource->common_public->set_max_duration = action_set_max_duration;
447
448   surf_workstation_resource->extension_public->execute = execute;
449   surf_workstation_resource->extension_public->sleep = action_sleep;
450   surf_workstation_resource->extension_public->get_state = get_state;
451   surf_workstation_resource->extension_public->get_speed = get_speed;
452   surf_workstation_resource->extension_public->communicate = communicate;
453   surf_workstation_resource->extension_public->execute_parallel_task = 
454     execute_parallel_task;
455
456   workstation_set = xbt_dict_new();
457
458   xbt_assert0(maxmin_system, "surf_init has to be called first!");
459 }
460
461 /********************************************************************/
462 /* The model used in MSG and presented at CCGrid03                  */
463 /********************************************************************/
464 /* @InProceedings{Casanova.CLM_03, */
465 /*   author = {Henri Casanova and Arnaud Legrand and Loris Marchal}, */
466 /*   title = {Scheduling Distributed Applications: the SimGrid Simulation Framework}, */
467 /*   booktitle = {Proceedings of the third IEEE International Symposium on Cluster Computing and the Grid (CCGrid'03)}, */
468 /*   publisher = {"IEEE Computer Society Press"}, */
469 /*   month = {may}, */
470 /*   year = {2003} */
471 /* } */
472 void surf_workstation_resource_init_CLM03(const char *filename)
473 {
474 /*   int i ; */
475 /*   surf_resource_t resource =  NULL; */
476
477   surf_workstation_resource_init_internal();
478   surf_cpu_resource_init_Cas01(filename);
479   surf_network_resource_init_CM02(filename);
480   create_workstations();
481   xbt_dynar_push(resource_list, &surf_workstation_resource);
482 /*   xbt_dynar_foreach(resource_list, i, resource) { */
483 /*     if(resource==surf_cpu_resource) { */
484 /*       xbt_dynar_remove_at(resource_list, i, NULL); */
485 /*       i--;  */
486 /*       continue; */
487 /*     } */
488 /*     if(resource==surf_network_resource) { */
489 /*       xbt_dynar_remove_at(resource_list, i, NULL); */
490 /*       i--;  */
491 /*       continue; */
492 /*     } */
493 /*   } */
494 }