1 /* Copyright (c) 2004, 2005, 2006, 2007, 2008, 2009, 2010. The SimGrid Team.
2 * All rights reserved. */
4 /* This program is free software; you can redistribute it and/or modify it
5 * under the terms of the license (GNU LGPL) which comes with this package. */
10 #include "surf_private.h"
11 #include "surf/surf_resource.h"
12 #include "simgrid/sg_config.h"
13 #include "vm_workstation_private.h"
14 #include "cpu_cas01_private.h"
15 #include "maxmin_private.h"
/* Declare the log subcategory surf_vm_workstation as a child of the surf
 * category and make it the default one for this file. */
17 XBT_LOG_NEW_DEFAULT_SUBCATEGORY(surf_vm_workstation, surf,
18 "Logging specific to the SURF VM workstation module");
/* The VM workstation model object. It stays NULL until
 * surf_vm_workstation_model_init_internal() assigns it. */
21 surf_model_t surf_vm_workstation_model = NULL;
23 /* ind means ''indirect'' that this is a reference on the whole dict_elm
24 * structure (i.e not on the surf_resource_private infos) */
/* Create the VM workstation `name` on top of a physical workstation.
 *
 * name: key under which the VM is registered in host_lib.
 * ind_phys_workstation: host_lib element of the physical machine that hosts
 * the VM.
 *
 * The function allocates a workstation resource sized for
 * s_workstation_VM2013_t, registers the network element of the physical host
 * under the VM name as well, registers the VM at SURF_WKS_LEVEL, initializes
 * the VM-specific members (sub_ws, current_state), creates a single-core vcpu
 * that takes its peak power from the physical cpu, and starts a zero-cost cpu
 * action on the physical host that stands for the VM. */
26 static void vm_ws_create(const char *name, void *ind_phys_workstation)
28 workstation_CLM03_t sub_ws = surf_workstation_resource_priv(ind_phys_workstation);
29 const char *sub_ws_name = sub_ws->generic_resource.name;
31 /* The workstation_VM2013 struct inherits the workstation_CLM03 struct. We
32 * create a physical workstation resource, but specifying the size of
33 * s_workstation_VM2013_t and the vm workstation model object. */
34 workstation_CLM03_t ws = (workstation_CLM03_t) surf_resource_new(sizeof(s_workstation_VM2013_t),
35 surf_vm_workstation_model, name, NULL);
37 /* Currently, we assume a VM has no storage. */
40 /* Currently, a VM uses the network resource of its physical host. In
41 * host_lib, this network resource object is referred from two different keys.
42 * When deregistering the reference that points the network resource object
43 * from the VM name, we have to make sure that the system does not call the
44 * free callback for the network resource object. The network resource object
45 * is still used by the physical machine. */
46 ws->net_elm = xbt_lib_get_or_null(host_lib, sub_ws_name, ROUTING_HOST_LEVEL);
47 xbt_lib_set(host_lib, name, ROUTING_HOST_LEVEL, ws->net_elm);
49 /* The SURF_WKS_LEVEL at host_lib saves workstation_CLM03 objects. Please
50 * note workstation_VM2013 objects, inheriting the workstation_CLM03
51 * structure, are also saved there.
53 * If you want to get a workstation_VM2013 object from host_lib, see
54 * ws->generic_resource.model->type first. If it is
55 * SURF_MODEL_TYPE_VM_WORKSTATION, you can cast ws to vm_ws. */
/* NOTE(review): %ld is used for the result of xbt_dynar_length(); confirm
 * that the return type of that function matches a signed long. */
56 XBT_INFO("Create VM(%s)@PM(%s) with %ld mounted disks", name, sub_ws_name, xbt_dynar_length(ws->storage));
57 xbt_lib_set(host_lib, name, SURF_WKS_LEVEL, ws);
60 /* We initialize the VM-specific members. */
61 workstation_VM2013_t vm_ws = (workstation_VM2013_t) ws;
62 vm_ws->sub_ws = sub_ws;
63 vm_ws->current_state = SURF_VM_STATE_CREATED;
67 // //// CPU RELATED STUFF ////
68 // Roughly, create a vcpu resource by using the values of the sub_cpu one.
69 cpu_Cas01_t sub_cpu = surf_cpu_resource_priv(ind_phys_workstation);
71 /* We can assume one core and cas01 cpu for the first step.
72 * Do xbt_lib_set(host_lib, name, SURF_CPU_LEVEL, cpu) if you get the resource. */
73 cpu_cas01_create_resource(name, // name
74 sub_cpu->power_peak, // host->power_peak,
75 1, // host->power_scale,
76 NULL, // host->power_trace,
77 1, // host->core_amount,
78 SURF_RESOURCE_ON, // host->initial_state,
79 NULL, // host->state_trace,
80 NULL, // host->properties,
85 /* We create cpu_action corresponding to a VM process on the host operating system. */
86 /* FIXME: TODO: we have to periodically input GUESTOS_NOISE to the system? how ? */
87 // vm_ws->cpu_action = surf_cpu_model_pm->extension.cpu.execute(ind_phys_workstation, GUESTOS_NOISE);
/* The action is created with a cost of 0; vm_ws_execute() later adds the size
 * of each task to that cost. */
88 vm_ws->cpu_action = surf_cpu_model_pm->extension.cpu.execute(ind_phys_workstation, 0);
92 /* - check how network requests are scheduled between distinct processes competing for the same card. */
97 /* Update the physical host of the given VM. */
/* Migrate a VM to another physical machine.
 *
 * ind_vm: host_lib element of the VM to move.
 * ind_dst_pm: host_lib element of the destination physical machine.
 *
 * The ROUTING_HOST_LEVEL entry of the VM is switched to the network element
 * of the destination, sub_ws is pointed at the destination workstation, and
 * the cpu action that represents the VM is unreferenced and replaced by a new
 * zero-cost action on the destination.
 *
 * NOTE(review): ws_vm2013 and ws_clm03_dst are dereferenced to fetch the
 * names before the two xbt_assert() calls check them, so these assertions
 * cannot protect those accesses. */
99 static void vm_ws_migrate(void *ind_vm, void *ind_dst_pm)
101 /* ind_phys_workstation equals to smx_host_t */
102 workstation_VM2013_t ws_vm2013 = surf_workstation_resource_priv(ind_vm);
103 workstation_CLM03_t ws_clm03_dst = surf_workstation_resource_priv(ind_dst_pm);
104 const char *vm_name = ws_vm2013->ws.generic_resource.name;
105 const char *pm_name_src = ws_vm2013->sub_ws->generic_resource.name;
106 const char *pm_name_dst = ws_clm03_dst->generic_resource.name;
108 xbt_assert(ws_vm2013);
109 xbt_assert(ws_clm03_dst);
113 /* update net_elm with that of the destination physical host */
114 void *old_net_elm = ws_vm2013->ws.net_elm;
115 void *new_net_elm = xbt_lib_get_or_null(host_lib, pm_name_dst, ROUTING_HOST_LEVEL);
116 xbt_assert(new_net_elm);
118 /* Unregister the current net_elm from host_lib. Do not call the free callback. */
119 xbt_lib_unset(host_lib, vm_name, ROUTING_HOST_LEVEL, 0);
121 /* Then, register the new one. */
122 ws_vm2013->ws.net_elm = new_net_elm;
123 xbt_lib_set(host_lib, vm_name, ROUTING_HOST_LEVEL, ws_vm2013->ws.net_elm);
125 ws_vm2013->sub_ws = ws_clm03_dst;
127 /* Update vcpu's action for the new pm */
130 XBT_INFO("cpu_action->remains %g", ws_vm2013->cpu_action->remains);
131 XBT_INFO("cost %f remains %f start %f finish %f", ws_vm2013->cpu_action->cost,
132 ws_vm2013->cpu_action->remains,
133 ws_vm2013->cpu_action->start,
134 ws_vm2013->cpu_action->finish
136 XBT_INFO("cpu_action state %d", surf_action_state_get(ws_vm2013->cpu_action));
139 /* create a cpu action bound to the pm model at the destination. */
140 surf_action_t new_cpu_action = surf_cpu_model_pm->extension.cpu.execute(ind_dst_pm, 0);
/* The state and the remaining work of the old action are only reported here;
 * nothing is copied over to the new action. */
142 e_surf_action_state_t state = surf_action_state_get(ws_vm2013->cpu_action);
143 if (state != SURF_ACTION_DONE)
144 XBT_CRITICAL("FIXME: may need a proper handling, %d", state);
145 if (ws_vm2013->cpu_action->remains > 0)
146 XBT_CRITICAL("FIXME: need copy the state(?), %f", ws_vm2013->cpu_action->remains);
/* Drop the action on the source host. The call is asserted to return 1. */
148 int ret = surf_cpu_model_pm->action_unref(ws_vm2013->cpu_action);
149 xbt_assert(ret == 1, "Bug: some resource still remains");
151 ws_vm2013->cpu_action = new_cpu_action;
154 XBT_DEBUG("migrate VM(%s): change net_elm (%p to %p)", vm_name, old_net_elm, new_net_elm);
155 XBT_DEBUG("migrate VM(%s): change PM (%s to %s)", vm_name, pm_name_src, pm_name_dst);
159 /* A physical host does not disappear in the current SimGrid code, but a VM may
160 * disappear during a simulation. */
/* Destroy a VM workstation.
 *
 * ind_vm_workstation: host_lib element of the VM.
 *
 * The workstation and cpu objects of the VM are fetched first. The SURF_CPU,
 * ROUTING_HOST and SURF_WKS entries of the VM are then unset in host_lib, the
 * cpu action that represents the VM is unreferenced, the lmm constraints of
 * the vcpu are freed, and finally the cpu and workstation resources are
 * freed.
 *
 * NOTE(review): the block comment located just above the three
 * xbt_lib_unset() calls has no visible terminator. Verify that these calls
 * are really compiled and not swallowed by that comment. */
162 static void vm_ws_destroy(void *ind_vm_workstation)
164 /* ind_phys_workstation equals to smx_host_t */
166 /* Before clearing the entries in host_lib, we have to pick up resources. */
167 workstation_VM2013_t vm_ws = surf_workstation_resource_priv(ind_vm_workstation);
168 cpu_Cas01_t cpu = surf_cpu_resource_priv(ind_vm_workstation);
169 const char *name = vm_ws->ws.generic_resource.name;
/* Only resources that belong to the VM workstation model are accepted. */
172 xbt_assert(vm_ws->ws.generic_resource.model == surf_vm_workstation_model);
175 /* We deregister objects from host_lib, without invoking the freeing callback
178 * Do not call xbt_lib_remove() here. It deletes all levels of the key,
179 * including MSG_HOST_LEVEL and others. We should unregister only what we know.
181 xbt_lib_unset(host_lib, name, SURF_CPU_LEVEL, 0);
182 xbt_lib_unset(host_lib, name, ROUTING_HOST_LEVEL, 0);
183 xbt_lib_unset(host_lib, name, SURF_WKS_LEVEL, 0);
185 /* TODO: comment out when VM stroage is implemented. */
186 // xbt_lib_unset(host_lib, name, SURF_STORAGE_LEVEL, 0);
189 /* Free the cpu_action of the VM. */
190 int ret = surf_cpu_model_pm->action_unref(vm_ws->cpu_action);
191 xbt_assert(ret == 1, "Bug: some resource still remains");
193 /* Free the cpu resource of the VM. If using power_trace, we will have to
194 * free other objects than lmm_constraint. */
195 surf_model_t cpu_model = cpu->generic_resource.model;
196 lmm_constraint_free(cpu_model->model_private->maxmin_system, cpu->constraint);
/* One constraint per core is released as well, then the array that held
 * them. */
199 for (i = 0; i < cpu->core; i++) {
200 void *cnst_id = cpu->constraint_core[i]->id;
201 lmm_constraint_free(cpu_model->model_private->maxmin_system, cpu->constraint_core[i]);
205 xbt_free(cpu->constraint_core);
208 surf_resource_free(cpu);
210 /* Free the network resource of the VM. */
211 // Nothing has to be done, because net_elmts is just a pointer on the physical one
213 /* Free the storage resource of the VM. */
216 /* Free the workstation resource of the VM. */
217 surf_resource_free(vm_ws);
/* Return the current_state member of the VM referenced by ind_vm_ws. */
220 static int vm_ws_get_state(void *ind_vm_ws)
222 return ((workstation_VM2013_t) surf_workstation_resource_priv(ind_vm_ws))->current_state;
/* Store `state` in the current_state member of the VM referenced by
 * ind_vm_ws. The value is written as is; no check is done here. */
225 static void vm_ws_set_state(void *ind_vm_ws, int state)
227 ((workstation_VM2013_t) surf_workstation_resource_priv(ind_vm_ws))->current_state = state;
/* Suspend the VM referenced by ind_vm_ws: the cpu action that represents the
 * VM is suspended and the state becomes SURF_VM_STATE_SUSPENDED. */
230 static void vm_ws_suspend(void *ind_vm_ws)
232 workstation_VM2013_t vm_ws = surf_workstation_resource_priv(ind_vm_ws);
234 surf_action_suspend(vm_ws->cpu_action);
236 vm_ws->current_state = SURF_VM_STATE_SUSPENDED;
/* Resume the VM referenced by ind_vm_ws: the cpu action that represents the
 * VM is resumed and the state becomes SURF_VM_STATE_RUNNING. */
239 static void vm_ws_resume(void *ind_vm_ws)
241 workstation_VM2013_t vm_ws = surf_workstation_resource_priv(ind_vm_ws);
243 surf_action_resume(vm_ws->cpu_action);
245 vm_ws->current_state = SURF_VM_STATE_RUNNING;
/* Save the VM referenced by ind_vm_ws. The state goes to
 * SURF_VM_STATE_SAVING, the cpu action of the VM is suspended, and the state
 * then goes to SURF_VM_STATE_SAVED. Both state changes happen within this one
 * call; no saving work is modeled yet (see the FIXME). */
248 static void vm_ws_save(void *ind_vm_ws)
250 workstation_VM2013_t vm_ws = surf_workstation_resource_priv(ind_vm_ws);
252 vm_ws->current_state = SURF_VM_STATE_SAVING;
254 /* FIXME: do something here */
255 surf_action_suspend(vm_ws->cpu_action);
257 vm_ws->current_state = SURF_VM_STATE_SAVED;
/* Restore the VM referenced by ind_vm_ws. The state goes to
 * SURF_VM_STATE_RESTORING, the cpu action of the VM is resumed, and the state
 * then goes to SURF_VM_STATE_RUNNING. Both state changes happen within this
 * one call; no restoring work is modeled yet (see the FIXME). */
260 static void vm_ws_restore(void *ind_vm_ws)
262 workstation_VM2013_t vm_ws = surf_workstation_resource_priv(ind_vm_ws);
264 vm_ws->current_state = SURF_VM_STATE_RESTORING;
266 /* FIXME: do something here */
267 surf_action_resume(vm_ws->cpu_action);
269 vm_ws->current_state = SURF_VM_STATE_RUNNING;
/* Fetch the lmm variable attached to cpu_action. The action is accessed
 * through its surf_action_lmm_t view to reach the variable member.
 * NOTE(review): presumably the share that the solver assigned to this
 * variable is what gets returned - confirm against the return statement. */
272 static double get_solved_value(surf_action_t cpu_action)
274 lmm_variable_t var = ((surf_action_lmm_t) cpu_action)->variable;
279 /* In the real world, processes on the guest operating system will be somewhat
280 * degraded due to virtualization overhead. The total CPU share that these
281 * processes get is smaller than that of the VM process gets on a host
282 * operating system. */
283 // const double virt_overhead = 0.95;
/* Factor applied to the solved share of a VM in vm_ws_share_resources(). The
 * value 1 leaves the share unchanged, i.e. no overhead is modeled. */
284 const double virt_overhead = 1;
/* Share-resources callback of the VM workstation model.
 *
 * workstation_model: model handed over unchanged to ws_share_resources().
 * now: value handed over unchanged to ws_share_resources().
 *
 * For every VM found in host_lib, the bound of the vcpu constraint is set to
 * virt_overhead times the value solved for the cpu action of that VM on its
 * physical host. ws_share_resources() is then run for this layer. After
 * that, the cpu action of every VM is unreferenced and replaced by a fresh
 * zero-cost action on its physical host.
 *
 * NOTE(review): presumably the value obtained from ws_share_resources() is
 * what gets returned - confirm.
 * NOTE(review): the block comments of steps 0 and 1 below have no visible
 * terminator. Verify that the xbt_dynar_search() and xbt_assert() lines of
 * step 0 are really compiled and not swallowed by these comments. */
286 static double vm_ws_share_resources(surf_model_t workstation_model, double now)
288 /* TODO: update action's cost with the total cost of processes on the VM. */
291 /* 0. Make sure that we already calculated the resource share at the physical
294 unsigned int index_of_pm_ws_model = xbt_dynar_search(model_list_invoke, &surf_workstation_model);
295 unsigned int index_of_vm_ws_model = xbt_dynar_search(model_list_invoke, &surf_vm_workstation_model);
296 xbt_assert((index_of_pm_ws_model < index_of_vm_ws_model), "Cannot assume surf_workstation_model comes before");
298 /* Another option is that we call sub_ws->share_resource() here. The
299 * share_resource() function has no side-effect. We can call it here to
304 /* 1. Now we know how many resource should be assigned to each virtual
305 * machine. We update constraints of the virtual machine layer.
308 * If we have two virtual machine (VM1 and VM2) on a physical machine (PM1).
309 * X1 + X2 = C (Equation 1)
311 * the resource share of VM1: X1
312 * the resource share of VM2: X2
313 * the capacity of PM1: C
315 * Then, if we have two process (P1 and P2) on VM1.
316 * X1_1 + X1_2 = X1 (Equation 2)
318 * the resource share of P1: X1_1
319 * the resource share of P2: X1_2
320 * the capacity of VM1: X1
322 * Equation 1 was solved in the physical machine layer.
323 * Equation 2 is solved in the virtual machine layer (here).
324 * X1 must be passed to the virtual machine laye as a constraint value.
328 /* iterate for all hosts including virtual machines */
329 xbt_lib_cursor_t cursor;
332 xbt_lib_foreach(host_lib, cursor, key, ind_host) {
333 workstation_CLM03_t ws_clm03 = ind_host[SURF_WKS_LEVEL];
334 cpu_Cas01_t cpu_cas01 = ind_host[SURF_CPU_LEVEL];
338 /* skip if it is not a virtual machine */
339 if (ws_clm03->generic_resource.model != surf_vm_workstation_model)
341 xbt_assert(cpu_cas01, "cpu-less workstation");
343 /* It is a virtual machine, so we can cast it to workstation_VM2013_t */
344 workstation_VM2013_t ws_vm2013 = (workstation_VM2013_t) ws_clm03;
346 double solved_value = get_solved_value(ws_vm2013->cpu_action);
347 XBT_DEBUG("assign %f to vm %s @ pm %s", solved_value,
348 ws_clm03->generic_resource.name, ws_vm2013->sub_ws->generic_resource.name);
350 // TODO: check lmm_update_constraint_bound() works fine instead of the below manual substitution.
351 // cpu_cas01->constraint->bound = solved_value;
/* The vcpu must belong to the VM cpu model; the bound is updated in the
 * maxmin system of that model. */
352 surf_model_t cpu_model = cpu_cas01->generic_resource.model;
353 xbt_assert(cpu_model == surf_cpu_model_vm);
354 lmm_system_t vcpu_system = cpu_model->model_private->maxmin_system;
355 lmm_update_constraint_bound(vcpu_system, cpu_cas01->constraint, virt_overhead * solved_value);
359 /* 2. Calculate resource share at the virtual machine layer. */
360 double ret = ws_share_resources(workstation_model, now);
363 /* FIXME: 3. do we have to re-initialize our cpu_action object? */
365 /* iterate for all hosts including virtual machines */
366 xbt_lib_foreach(host_lib, cursor, key, ind_host) {
367 workstation_CLM03_t ws_clm03 = ind_host[SURF_WKS_LEVEL];
369 /* skip if it is not a virtual machine */
372 if (ws_clm03->generic_resource.model != surf_vm_workstation_model)
375 /* It is a virtual machine, so we can cast it to workstation_VM2013_t */
378 workstation_VM2013_t ws_vm2013 = (workstation_VM2013_t) ws_clm03;
379 XBT_INFO("cost %f remains %f start %f finish %f", ws_vm2013->cpu_action->cost,
380 ws_vm2013->cpu_action->remains,
381 ws_vm2013->cpu_action->start,
382 ws_vm2013->cpu_action->finish
/* Replace the action of the VM by a fresh zero-cost one created on the
 * physical host that is looked up by the name of sub_ws. */
386 void *ind_sub_host = xbt_lib_get_elm_or_null(host_lib, ws_vm2013->sub_ws->generic_resource.name);
387 surf_cpu_model_pm->action_unref(ws_vm2013->cpu_action);
388 /* FIXME: this means busy loop? */
389 // ws_vm2013->cpu_action = surf_cpu_model_pm->extension.cpu.execute(ind_sub_host, GUESTOS_NOISE);
390 ws_vm2013->cpu_action = surf_cpu_model_pm->extension.cpu.execute(ind_sub_host, 0);
403 /* A surf level object will be useless in the upper layer. Returning the
404 * dict_elm of the host. */
/* Return the host_lib element of the physical machine that currently hosts
 * the VM referenced by ind_vm_ws. The element is looked up in host_lib by the
 * name of the sub_ws member of the VM. */
406 static void *vm_ws_get_pm(void *ind_vm_ws)
408 workstation_VM2013_t vm_ws = surf_workstation_resource_priv(ind_vm_ws);
409 const char *sub_ws_name = vm_ws->sub_ws->generic_resource.name;
411 return xbt_lib_get_elm_or_null(host_lib, sub_ws_name);
415 /* Adding a task to a VM updates the VCPU task on its physical machine. */
/* workstation: host_lib element of the VM that runs the task.
 * size: amount of work of the task.
 *
 * The resource must belong to a model of type SURF_MODEL_TYPE_VM_WORKSTATION
 * (asserted). `size` is added to the cost of the cpu action that represents
 * the VM, and the task itself is created by ws_execute(), whose result is
 * returned. */
416 static surf_action_t vm_ws_execute(void *workstation, double size)
418 surf_resource_t ws = ((surf_resource_t) surf_workstation_resource_priv(workstation));
420 xbt_assert(ws->model->type == SURF_MODEL_TYPE_VM_WORKSTATION);
421 workstation_VM2013_t vm_ws = (workstation_VM2013_t) ws;
423 double old_cost = vm_ws->cpu_action->cost;
424 double new_cost = old_cost + size;
426 XBT_DEBUG("VM(%s)@PM(%s): update dummy action's cost (%f -> %f)",
427 ws->name, vm_ws->sub_ws->generic_resource.name,
430 vm_ws->cpu_action->cost = new_cost;
432 return ws_execute(workstation, size);
/* Cancel an action of the VM workstation model by delegating to
 * ws_action_cancel(). The cost of the dummy cpu action of the VM is not
 * reduced here: that part is not implemented, and a critical message that
 * says so is logged on every call. */
435 static void vm_ws_action_cancel(surf_action_t action)
437 XBT_CRITICAL("FIXME: Not yet implemented. Reduce dummy action's cost by %f", action->cost);
439 ws_action_cancel(action);
443 /* Now we can set bound for each task by using MSG_task_set_bound. But, it does
444 * not work for the dummy CPU action of a VM. Here, we add the set_bound
445 * function for the dummy CPU action. */
/* vm: host_lib element of the VM.
 * bound: value handed over to surf_action_set_bound() for the cpu action that
 * represents the VM.
 * The resource must belong to a model of type SURF_MODEL_TYPE_VM_WORKSTATION
 * (asserted). */
446 static void vm_ws_set_vm_bound(void *vm, double bound)
448 surf_resource_t ws = ((surf_resource_t) surf_workstation_resource_priv(vm));
449 xbt_assert(ws->model->type == SURF_MODEL_TYPE_VM_WORKSTATION);
450 workstation_VM2013_t vm_ws = (workstation_VM2013_t) ws;
452 surf_action_set_bound(vm_ws->cpu_action, bound);
456 /* set the affinity of a VM to the CPU cores of a PM */
/* vm: host_lib element of the VM.
 * pm: handed over unchanged to the set_affinity function of the physical cpu
 * model.
 * mask: handed over unchanged as well; presumably a bit mask of cores -
 * confirm against the physical cpu model.
 * The resource must belong to a model of type SURF_MODEL_TYPE_VM_WORKSTATION
 * (asserted). The affinity is applied to the cpu action that represents the
 * VM. */
457 static void vm_ws_set_vm_affinity(void *vm, void *pm, unsigned long mask)
459 surf_resource_t ws = ((surf_resource_t) surf_workstation_resource_priv(vm));
460 xbt_assert(ws->model->type == SURF_MODEL_TYPE_VM_WORKSTATION);
461 workstation_VM2013_t vm_ws = (workstation_VM2013_t) ws;
463 surf_cpu_model_pm->set_affinity(vm_ws->cpu_action, pm, mask);
/* Build the VM workstation model and publish it in
 * surf_vm_workstation_model.
 *
 * A model is obtained from surf_model_init() and its callbacks are filled in.
 * Most generic callbacks reuse the ws_* functions; share_resources,
 * action_cancel, the workstation execute hook and the whole vm_workstation
 * extension use the vm_ws_* functions of this file. surf_cpu_model_vm must
 * already be set when this function runs (asserted). */
467 static void surf_vm_workstation_model_init_internal(void)
469 surf_model_t model = surf_model_init();
471 model->name = "Virtual Workstation";
472 model->type = SURF_MODEL_TYPE_VM_WORKSTATION;
474 model->action_unref = ws_action_unref;
475 model->action_cancel = vm_ws_action_cancel;
476 // model->action_state_set = ws_action_state_set;
/* Only share_resources is specific to the VM layer among these hooks. */
479 model->model_private->share_resources = vm_ws_share_resources;
480 model->model_private->resource_used = ws_resource_used;
481 model->model_private->update_actions_state = ws_update_actions_state;
482 model->model_private->update_resource_state = ws_update_resource_state;
483 model->model_private->finalize = ws_finalize;
486 /* operation for an action, not for VM it self */
487 model->suspend = ws_action_suspend;
488 model->resume = ws_action_resume;
489 // model->is_suspended = ws_action_is_suspended;
490 // model->set_max_duration = ws_action_set_max_duration;
491 model->set_priority = ws_action_set_priority;
492 model->set_bound = ws_action_set_bound;
493 model->set_affinity = ws_action_set_affinity;
494 // #ifdef HAVE_TRACING
495 // model->set_category = ws_action_set_category;
497 model->get_remains = ws_action_get_remains;
498 // #ifdef HAVE_LATENCY_BOUND_TRACKING
499 // model->get_latency_limited = ws_get_latency_limited;
/* The VM layer uses the VM cpu model, which has to exist at this point. */
508 xbt_assert(surf_cpu_model_vm);
509 model->extension.workstation.cpu_model = surf_cpu_model_vm;
511 model->extension.workstation.execute = vm_ws_execute;
512 model->extension.workstation.sleep = ws_action_sleep;
513 model->extension.workstation.get_state = ws_get_state;
514 model->extension.workstation.get_speed = ws_get_speed;
515 // model->extension.workstation.get_available_speed = ws_get_available_speed;
517 // model->extension.workstation.communicate = ws_communicate;
518 // model->extension.workstation.get_route = ws_get_route;
519 // model->extension.workstation.execute_parallel_task = ws_execute_parallel_task;
520 // model->extension.workstation.get_link_bandwidth = ws_get_link_bandwidth;
521 // model->extension.workstation.get_link_latency = ws_get_link_latency;
522 // model->extension.workstation.link_shared = ws_link_shared;
523 // model->extension.workstation.get_properties = ws_get_properties;
525 // model->extension.workstation.open = ws_action_open;
526 // model->extension.workstation.close = ws_action_close;
527 // model->extension.workstation.read = ws_action_read;
528 // model->extension.workstation.write = ws_action_write;
529 // model->extension.workstation.stat = ws_action_stat;
530 // model->extension.workstation.unlink = ws_action_unlink;
531 // model->extension.workstation.ls = ws_action_ls;
/* Operations on the VM itself. */
534 model->extension.vm_workstation.create = vm_ws_create;
535 model->extension.vm_workstation.set_state = vm_ws_set_state;
536 model->extension.vm_workstation.get_state = vm_ws_get_state;
537 model->extension.vm_workstation.migrate = vm_ws_migrate;
538 model->extension.vm_workstation.destroy = vm_ws_destroy;
539 model->extension.vm_workstation.suspend = vm_ws_suspend;
540 model->extension.vm_workstation.resume = vm_ws_resume;
541 model->extension.vm_workstation.save = vm_ws_save;
542 model->extension.vm_workstation.restore = vm_ws_restore;
543 model->extension.vm_workstation.get_pm = vm_ws_get_pm;
544 model->extension.vm_workstation.set_vm_bound = vm_ws_set_vm_bound;
545 model->extension.vm_workstation.set_vm_affinity = vm_ws_set_vm_affinity;
547 model->extension.workstation.set_params = ws_set_params;
548 model->extension.workstation.get_params = ws_get_params;
/* Publish the fully initialized model. */
550 surf_vm_workstation_model = model;
/* Public entry point: build the VM workstation model and append it to both
 * model_list and model_list_invoke. vm_ws_share_resources() relies on the
 * position of this model in model_list_invoke relative to
 * surf_workstation_model. */
553 void surf_vm_workstation_model_init(void)
555 surf_vm_workstation_model_init_internal();
556 xbt_dynar_push(model_list, &surf_vm_workstation_model);
557 xbt_dynar_push(model_list_invoke, &surf_vm_workstation_model);