Logo AND Algorithmique Numérique Distribuée

Public GIT Repository
Create the dummy cpu action at destination
[simgrid.git] / src / surf / vm_workstation.c
1 /* Copyright (c) 2004, 2005, 2006, 2007, 2008, 2009, 2010. The SimGrid Team.
2  * All rights reserved.                                                     */
3
4 /* This program is free software; you can redistribute it and/or modify it
5  * under the terms of the license (GNU LGPL) which comes with this package. */
6
7 #include "xbt/ex.h"
8 #include "xbt/dict.h"
9 #include "portable.h"
10 #include "surf_private.h"
11 #include "surf/surf_resource.h"
12 #include "simgrid/sg_config.h"
13 #include "vm_workstation_private.h"
14 #include "surf/cpu_cas01_private.h"
15 #include "surf/maxmin_private.h"
16
17 XBT_LOG_NEW_DEFAULT_SUBCATEGORY(surf_vm_workstation, surf,
18                                 "Logging specific to the SURF VM workstation module");
19
20
21 surf_model_t surf_vm_workstation_model = NULL;
22
23 /* ind means ''indirect'' that this is a reference on the whole dict_elm
24  * structure (i.e not on the surf_resource_private infos) */
25
26 static void vm_ws_create(const char *name, void *ind_phys_workstation)
27 {
28   workstation_CLM03_t sub_ws = surf_workstation_resource_priv(ind_phys_workstation);
29   const char *sub_ws_name = sub_ws->generic_resource.name;
30
31   /* The workstation_VM2013 struct inherits the workstation_CLM03 struct. We
32    * create a physical workstation resource, but specifying the size of
33    * s_workstation_VM2013_t and the vm workstation model object. */
34   workstation_CLM03_t ws = (workstation_CLM03_t) surf_resource_new(sizeof(s_workstation_VM2013_t),
35       surf_vm_workstation_model, name, NULL);
36
37   /* Currently, we assume a VM has no storage. */
38   ws->storage = NULL;
39
40   /* Currently, a VM uses the network resource of its physical host. In
41    * host_lib, this network resource object is refered from two different keys.
42    * When deregistering the reference that points the network resource object
43    * from the VM name, we have to make sure that the system does not call the
44    * free callback for the network resource object. The network resource object
45    * is still used by the physical machine. */
46   ws->net_elm = xbt_lib_get_or_null(host_lib, sub_ws_name, ROUTING_HOST_LEVEL);
47   xbt_lib_set(host_lib, name, ROUTING_HOST_LEVEL, ws->net_elm);
48
49   /* The SURF_WKS_LEVEL at host_lib saves workstation_CLM03 objects. Please
50    * note workstation_VM2013 objects, inheriting the workstation_CLM03
51    * structure, are also saved there. 
52    *
53    * If you want to get a workstation_VM2013 object from host_lib, see
54    * ws->generic_resouce.model->type first. If it is
55    * SURF_MODEL_TYPE_VM_WORKSTATION, you can cast ws to vm_ws. */
56   XBT_INFO("Create VM(%s)@PM(%s) with %ld mounted disks", name, sub_ws_name, xbt_dynar_length(ws->storage));
57   xbt_lib_set(host_lib, name, SURF_WKS_LEVEL, ws);
58
59
60   /* We initialize the VM-specific members. */
61   workstation_VM2013_t vm_ws = (workstation_VM2013_t) ws;
62   vm_ws->sub_ws = sub_ws;
63   vm_ws->current_state = SURF_VM_STATE_CREATED;
64
65
66
67   // //// CPU  RELATED STUFF ////
68   // Roughly, create a vcpu resource by using the values of the sub_cpu one.
69   cpu_Cas01_t sub_cpu = surf_cpu_resource_priv(ind_phys_workstation);
70
71   /* We can assume one core and cas01 cpu for the first step.
72    * Do xbt_lib_set(host_lib, name, SURF_CPU_LEVEL, cpu) if you get the resource. */
73   cpu_cas01_create_resource(name, // name
74       sub_cpu->power_peak,        // host->power_peak,
75       1,                          // host->power_scale,
76       NULL,                       // host->power_trace,
77       1,                          // host->core_amount,
78       SURF_RESOURCE_ON,           // host->initial_state,
79       NULL,                       // host->state_trace,
80       NULL,                       // host->properties,
81       surf_cpu_model_vm);
82
83
84
85   /* We create cpu_action corresponding to a VM process on the host operating system. */
86   /* FIXME: TODO: we have to peridocally input GUESTOS_NOISE to the system? how ? */
87   // vm_ws->cpu_action = surf_cpu_model_pm->extension.cpu.execute(ind_phys_workstation, GUESTOS_NOISE);
88   vm_ws->cpu_action = surf_cpu_model_pm->extension.cpu.execute(ind_phys_workstation, 0);
89
90
91   /* TODO:
92    * - check how network requests are scheduled between distinct processes competing for the same card.
93    */
94 }
95
96 /*
97  * Update the physical host of the given VM
98  */
99 static void vm_ws_migrate(void *ind_vm, void *ind_dst_pm)
100
101    /* ind_phys_workstation equals to smx_host_t */
102    workstation_VM2013_t ws_vm2013 = surf_workstation_resource_priv(ind_vm);
103    workstation_CLM03_t ws_clm03_dst = surf_workstation_resource_priv(ind_dst_pm);
104    const char *vm_name = ws_vm2013->ws.generic_resource.name;
105    const char *pm_name_src = ws_vm2013->sub_ws->generic_resource.name;
106    const char *pm_name_dst = ws_clm03_dst->generic_resource.name;
107
108    xbt_assert(ws_vm2013);
109    xbt_assert(ws_clm03_dst);
110
111    ws_vm2013->current_state = SURF_VM_STATE_MIGRATING;
112
113    /* do something */
114
115    /* update net_elm with that of the destination physical host */
116    void *old_net_elm = ws_vm2013->ws.net_elm;
117    void *new_net_elm = xbt_lib_get_or_null(host_lib, pm_name_dst, ROUTING_HOST_LEVEL);
118    xbt_assert(new_net_elm);
119
120    /* Unregister the current net_elm from host_lib. Do not call the free callback. */
121    xbt_lib_unset(host_lib, vm_name, ROUTING_HOST_LEVEL, 0);
122
123    /* Then, resister the new one. */
124    ws_vm2013->ws.net_elm = new_net_elm;
125    xbt_lib_set(host_lib, vm_name, ROUTING_HOST_LEVEL, ws_vm2013->ws.net_elm);
126
127    ws_vm2013->sub_ws = ws_clm03_dst;
128
129    /* Update vcpu's action for the new pm */
130    {
131 #if 0
132      XBT_INFO("cpu_action->remains %g", ws_vm2013->cpu_action->remains);
133      XBT_INFO("cost %f remains %f start %f finish %f", ws_vm2013->cpu_action->cost,
134          ws_vm2013->cpu_action->remains,
135          ws_vm2013->cpu_action->start,
136          ws_vm2013->cpu_action->finish
137          );
138      XBT_INFO("cpu_action state %d", surf_action_state_get(ws_vm2013->cpu_action));
139 #endif
140
141      /* create a cpu action bound to the pm model at the destination. */
142      surf_action_t new_cpu_action = surf_cpu_model_pm->extension.cpu.execute(ind_dst_pm, 0);
143
144      e_surf_action_state_t state = surf_action_state_get(ws_vm2013->cpu_action);
145      if (state != SURF_ACTION_DONE)
146        XBT_CRITICAL("FIXME: may need a proper handling, %d", state);
147      if (ws_vm2013->cpu_action->remains > 0)
148        XBT_CRITICAL("FIXME: need copy the state(?), %d", ws_vm2013->cpu_action->remains);
149
150      int ret = surf_cpu_model_pm->action_unref(ws_vm2013->cpu_action);
151      xbt_assert(ret == 1, "Bug: some resource still remains");
152
153      ws_vm2013->cpu_action = new_cpu_action;
154    }
155
156    XBT_DEBUG("migrate VM(%s): change net_elm (%p to %p)", vm_name, old_net_elm, new_net_elm);
157    XBT_DEBUG("migrate VM(%s): change PM (%s to %s)", vm_name, pm_name_src, pm_name_dst);
158
159    ws_vm2013->current_state = SURF_VM_STATE_RUNNING;
160 }
161
162 /*
163  * A physical host does not disapper in the current SimGrid code, but a VM may
164  * disapper during a simulation.
165  */
166 static void vm_ws_destroy(void *ind_vm_workstation)
167
168         /* ind_phys_workstation equals to smx_host_t */
169
170   /* Before clearing the entries in host_lib, we have to pick up resources. */
171         workstation_VM2013_t vm_ws = surf_workstation_resource_priv(ind_vm_workstation);
172   cpu_Cas01_t cpu = surf_cpu_resource_priv(ind_vm_workstation);
173         const char *name = vm_ws->ws.generic_resource.name;
174   XBT_INFO("%s", name);
175
176         xbt_assert(vm_ws);
177         xbt_assert(vm_ws->ws.generic_resource.model == surf_vm_workstation_model);
178
179
180   /* We deregister objects from host_lib, without invoking the freeing callback
181    * of each level.
182    *
183    * Do not call xbt_lib_remove() here. It deletes all levels of the key,
184    * including MSG_HOST_LEVEL and others. We should unregister only what we know.
185    */
186   xbt_lib_unset(host_lib, name, SURF_CPU_LEVEL, 0);
187   xbt_lib_unset(host_lib, name, ROUTING_HOST_LEVEL, 0);
188   xbt_lib_unset(host_lib, name, SURF_WKS_LEVEL, 0);
189
190   /* TODO: comment out when VM stroage is implemented. */
191   // xbt_lib_unset(host_lib, name, SURF_STORAGE_LEVEL, 0);
192
193
194   /* Free the cpu_action of the VM. */
195   int ret = surf_cpu_model_pm->action_unref(vm_ws->cpu_action);
196   xbt_assert(ret == 1, "Bug: some resource still remains");
197
198   /* Free the cpu resource of the VM. If using power_trace, we will have to
199    * free other objects than lmm_constraint. */
200   surf_model_t cpu_model = cpu->generic_resource.model;
201   lmm_constraint_free(cpu_model->model_private->maxmin_system, cpu->constraint);
202   surf_resource_free(cpu);
203
204   /* Free the network resource of the VM. */
205         // Nothing has to be done, because net_elmts is just a pointer on the physical one
206
207   /* Free the storage resource of the VM. */
208   // Not relevant yet
209
210         /* Free the workstation resource of the VM. */
211   surf_resource_free(vm_ws);
212 }
213
214 static int vm_ws_get_state(void *ind_vm_ws)
215 {
216         return ((workstation_VM2013_t) surf_workstation_resource_priv(ind_vm_ws))->current_state;
217 }
218
219 static void vm_ws_set_state(void *ind_vm_ws, int state)
220 {
221          ((workstation_VM2013_t) surf_workstation_resource_priv(ind_vm_ws))->current_state = state;
222 }
223
224 static void vm_ws_suspend(void *ind_vm_ws)
225 {
226   workstation_VM2013_t vm_ws = surf_workstation_resource_priv(ind_vm_ws);
227
228   XBT_INFO("vm %p suspend", ind_vm_ws);
229   surf_action_suspend(vm_ws->cpu_action);
230
231   vm_ws->current_state = SURF_VM_STATE_SUSPENDED;
232 }
233
234 static void vm_ws_resume(void *ind_vm_ws)
235 {
236   workstation_VM2013_t vm_ws = surf_workstation_resource_priv(ind_vm_ws);
237
238   surf_action_resume(vm_ws->cpu_action);
239
240   vm_ws->current_state = SURF_VM_STATE_RUNNING;
241 }
242
243 static void vm_ws_save(void *ind_vm_ws)
244 {
245   workstation_VM2013_t vm_ws = surf_workstation_resource_priv(ind_vm_ws);
246
247   vm_ws->current_state = SURF_VM_STATE_SAVING;
248
249   /* FIXME: do something here */
250   surf_action_suspend(vm_ws->cpu_action);
251
252   vm_ws->current_state = SURF_VM_STATE_SAVED;
253 }
254
255 static void vm_ws_restore(void *ind_vm_ws)
256 {
257   workstation_VM2013_t vm_ws = surf_workstation_resource_priv(ind_vm_ws);
258
259   vm_ws->current_state = SURF_VM_STATE_RESTORING;
260
261   /* FIXME: do something here */
262   surf_action_resume(vm_ws->cpu_action);
263
264   vm_ws->current_state = SURF_VM_STATE_RUNNING;
265 }
266
267
268 static double get_solved_value(surf_action_t cpu_action)
269 {
270   int found = 0;
271   /* NOTE: Do not use surf_workstation_model's maxmin_system. It is not used. */
272   lmm_system_t pm_system = surf_cpu_model_pm->model_private->maxmin_system;
273   lmm_variable_t var = NULL;
274
275   xbt_swag_foreach(var, &pm_system->variable_set) {
276     XBT_DEBUG("var id %p id_int %d double %f", var->id, var->id_int, var->value);
277     if (var->id == cpu_action) {
278       found = 1;
279       break;
280     }
281   }
282
283   if (found)
284     return var->value;
285
286   XBT_CRITICAL("bug: cannot found the solved variable of the action %p", cpu_action);
287   DIE_IMPOSSIBLE;
288   return -1; /* NOT REACHED */
289 }
290
291
292
/* Virtualization is not free: in the real world, the processes running on the
 * guest operating system together get a smaller CPU share than the share the
 * VM process itself obtains on the host operating system. This factor scales
 * the share solved at the physical layer before it is used as the bound of
 * the VM's cpu constraint. */
const double virt_overhead = 0.95;
298
299 static double vm_ws_share_resources(surf_model_t workstation_model, double now)
300 {
301   /* TODO: udpate action's cost with the total cost of processes on the VM. */
302
303
304   /* 0. Make sure that we already calculated the resource share at the physical
305    * machine layer. */
306   {
307     unsigned int index_of_pm_ws_model = xbt_dynar_search(model_list_invoke, &surf_workstation_model);
308     unsigned int index_of_vm_ws_model = xbt_dynar_search(model_list_invoke, &surf_vm_workstation_model);
309     xbt_assert((index_of_pm_ws_model < index_of_vm_ws_model), "Cannot assume surf_workstation_model comes before");
310  
311     /* Another option is that we call sub_ws->share_resource() here. The
312      * share_resource() function has no side-effect. We can call it here to
313      * ensure that. */
314   }
315
316
317   /* 1. Now we know how many resource should be assigned to each virtual
318    * machine. We update constraints of the virtual machine layer.
319    *
320    *
321    * If we have two virtual machine (VM1 and VM2) on a physical machine (PM1).
322    *     X1 + X2 = C       (Equation 1)
323    * where
324    *    the resource share of VM1: X1
325    *    the resource share of VM2: X2
326    *    the capacity of PM1: C
327    *
328    * Then, if we have two process (P1 and P2) on VM1.
329    *     X1_1 + X1_2 = X1  (Equation 2)
330    * where
331    *    the resource share of P1: X1_1
332    *    the resource share of P2: X1_2
333    *    the capacity of VM1: X1
334    *
335    * Equation 1 was solved in the physical machine layer.
336    * Equation 2 is solved in the virtual machine layer (here).
337    * X1 must be passed to the virtual machine laye as a constraint value.
338    *
339    **/
340
341   /* iterate for all hosts including virtual machines */
342   xbt_lib_cursor_t cursor;
343   char *key;
344   void **ind_host;
345   xbt_lib_foreach(host_lib, cursor, key, ind_host) {
346     workstation_CLM03_t ws_clm03 = ind_host[SURF_WKS_LEVEL];
347     cpu_Cas01_t cpu_cas01 = ind_host[SURF_CPU_LEVEL];
348
349     if (!ws_clm03)
350       continue;
351     /* skip if it is not a virtual machine */
352     if (ws_clm03->generic_resource.model != surf_vm_workstation_model)
353       continue;
354     xbt_assert(cpu_cas01, "cpu-less workstation");
355
356     /* It is a virtual machine, so we can cast it to workstation_VM2013_t */
357     workstation_VM2013_t ws_vm2013 = (workstation_VM2013_t) ws_clm03;
358
359     double solved_value = get_solved_value(ws_vm2013->cpu_action);
360     XBT_DEBUG("assign %f to vm %s @ pm %s", solved_value,
361         ws_clm03->generic_resource.name, ws_vm2013->sub_ws->generic_resource.name);
362
363     // TODO: check lmm_update_constraint_bound() works fine instead of the below manual substitution.
364     // cpu_cas01->constraint->bound = solved_value;
365     surf_model_t cpu_model = cpu_cas01->generic_resource.model;
366     xbt_assert(cpu_model == surf_cpu_model_vm);
367     lmm_system_t vcpu_system = cpu_model->model_private->maxmin_system;
368     lmm_update_constraint_bound(vcpu_system, cpu_cas01->constraint, virt_overhead * solved_value);
369   }
370
371
372   /* 2. Calculate resource share at the virtual machine layer. */
373   double ret = ws_share_resources(workstation_model, now);
374
375
376   /* FIXME: 3. do we have to re-initialize our cpu_action object? */
377 #if 1
378   /* iterate for all hosts including virtual machines */
379   xbt_lib_foreach(host_lib, cursor, key, ind_host) {
380     workstation_CLM03_t ws_clm03 = ind_host[SURF_WKS_LEVEL];
381
382     /* skip if it is not a virtual machine */
383     if (!ws_clm03)
384       continue;
385     if (ws_clm03->generic_resource.model != surf_vm_workstation_model)
386       continue;
387
388     /* It is a virtual machine, so we can cast it to workstation_VM2013_t */
389     workstation_VM2013_t ws_vm2013 = (workstation_VM2013_t) ws_clm03;
390     {
391       void *ind_sub_host = xbt_lib_get_elm_or_null(host_lib, ws_vm2013->sub_ws->generic_resource.name);
392       XBT_INFO("cost %f remains %f start %f finish %f", ws_vm2013->cpu_action->cost,
393           ws_vm2013->cpu_action->remains,
394           ws_vm2013->cpu_action->start,
395           ws_vm2013->cpu_action->finish
396           );
397
398 #if 0
399       surf_cpu_model_pm->action_unref(ws_vm2013->cpu_action);
400       /* FIXME: this means busy loop? */
401       // ws_vm2013->cpu_action = surf_cpu_model_pm->extension.cpu.execute(ind_sub_host, GUESTOS_NOISE);
402       ws_vm2013->cpu_action = surf_cpu_model_pm->extension.cpu.execute(ind_sub_host, 0);
403 #endif
404
405     }
406   }
407 #endif
408
409
410   return ret;
411 }
412
413
414 /*
415  * A surf level object will be useless in the upper layer. Returing the
416  * dict_elm of the host.
417  **/
418 static void *vm_ws_get_pm(void *ind_vm_ws)
419 {
420         workstation_VM2013_t vm_ws = surf_workstation_resource_priv(ind_vm_ws);
421   const char *sub_ws_name = vm_ws->sub_ws->generic_resource.name;
422
423   return xbt_lib_get_elm_or_null(host_lib, sub_ws_name);
424 }
425
426
427
428 /* Adding a task to a VM updates the VCPU task on its physical machine. */
429 surf_action_t vm_ws_execute(void *workstation, double size)
430 {
431   surf_resource_t ws = ((surf_resource_t) surf_workstation_resource_priv(workstation));
432
433   xbt_assert(ws->model->type == SURF_MODEL_TYPE_VM_WORKSTATION);
434   workstation_VM2013_t vm_ws = (workstation_VM2013_t) ws;
435
436   double old_cost = vm_ws->cpu_action->cost;
437   double new_cost = old_cost + size;
438
439   XBT_INFO("VM(%s)@PM(%s): update dummy action's cost (%f -> %f)",
440       ws->name, vm_ws->sub_ws->generic_resource.name,
441       old_cost, new_cost);
442
443   vm_ws->cpu_action->cost = new_cost;
444
445   return ws_execute(workstation, size);
446 }
447
448 static void vm_ws_action_cancel(surf_action_t action)
449 {
450   XBT_CRITICAL("FIXME: Not yet implemented. Reduce dummy action's cost by %f", action->cost);
451
452   ws_action_cancel(action);
453 }
454
455
456 static void surf_vm_workstation_model_init_internal(void)
457 {
458   surf_model_t model = surf_model_init();
459
460   model->name = "Virtual Workstation";
461   model->type = SURF_MODEL_TYPE_VM_WORKSTATION;
462
463   model->action_unref     = ws_action_unref;
464   model->action_cancel    = vm_ws_action_cancel;
465   // model->action_state_set = ws_action_state_set;
466
467
468   model->model_private->share_resources       = vm_ws_share_resources;
469   model->model_private->resource_used         = ws_resource_used;
470   model->model_private->update_actions_state  = ws_update_actions_state;
471   model->model_private->update_resource_state = ws_update_resource_state;
472   model->model_private->finalize              = ws_finalize;
473
474
475   /* operation for an action, not for VM it self */
476   model->suspend          = ws_action_suspend;
477   model->resume           = ws_action_resume;
478 //   model->is_suspended     = ws_action_is_suspended;
479 //   model->set_max_duration = ws_action_set_max_duration;
480   model->set_priority     = ws_action_set_priority;
481 // #ifdef HAVE_TRACING
482 //   model->set_category     = ws_action_set_category;
483 // #endif
484 //   model->get_remains      = ws_action_get_remains;
485 // #ifdef HAVE_LATENCY_BOUND_TRACKING
486 //   model->get_latency_limited = ws_get_latency_limited;
487 // #endif
488
489
490
491
492
493
494
495   xbt_assert(surf_cpu_model_vm);
496   model->extension.workstation.cpu_model = surf_cpu_model_vm;
497
498   model->extension.workstation.execute   = vm_ws_execute;
499   model->extension.workstation.sleep     = ws_action_sleep;
500   model->extension.workstation.get_state = ws_get_state;
501   // model->extension.workstation.get_speed = ws_get_speed;
502   // model->extension.workstation.get_available_speed = ws_get_available_speed;
503
504   // model->extension.workstation.communicate           = ws_communicate;
505   // model->extension.workstation.get_route             = ws_get_route;
506   // model->extension.workstation.execute_parallel_task = ws_execute_parallel_task;
507   // model->extension.workstation.get_link_bandwidth    = ws_get_link_bandwidth;
508   // model->extension.workstation.get_link_latency      = ws_get_link_latency;
509   // model->extension.workstation.link_shared           = ws_link_shared;
510   // model->extension.workstation.get_properties        = ws_get_properties;
511
512   // model->extension.workstation.open   = ws_action_open;
513   // model->extension.workstation.close  = ws_action_close;
514   // model->extension.workstation.read   = ws_action_read;
515   // model->extension.workstation.write  = ws_action_write;
516   // model->extension.workstation.stat   = ws_action_stat;
517   // model->extension.workstation.unlink = ws_action_unlink;
518   // model->extension.workstation.ls     = ws_action_ls;
519
520
521   model->extension.vm_workstation.create        = vm_ws_create;
522   model->extension.vm_workstation.set_state     = vm_ws_set_state;
523   model->extension.vm_workstation.get_state     = vm_ws_get_state;
524   model->extension.vm_workstation.migrate       = vm_ws_migrate;
525   model->extension.vm_workstation.destroy       = vm_ws_destroy;
526   model->extension.vm_workstation.suspend       = vm_ws_suspend;
527   model->extension.vm_workstation.resume        = vm_ws_resume;
528   model->extension.vm_workstation.save          = vm_ws_save;
529   model->extension.vm_workstation.restore       = vm_ws_restore;
530   model->extension.vm_workstation.get_pm        = vm_ws_get_pm;
531
532   model->extension.workstation.set_params    = ws_set_params;
533   model->extension.workstation.get_params    = ws_get_params;
534
535   surf_vm_workstation_model = model;
536 }
537
538 void surf_vm_workstation_model_init(void)
539 {
540   surf_vm_workstation_model_init_internal();
541   xbt_dynar_push(model_list, &surf_vm_workstation_model);
542   xbt_dynar_push(model_list_invoke, &surf_vm_workstation_model);
543 }