X-Git-Url: http://info.iut-bm.univ-fcomte.fr/pub/gitweb/simgrid.git/blobdiff_plain/0afad4b7e2215154531cd6b2933af898ec6b781d..dc9b8feaddd53842f6204f4f24409b2382393fa9:/src/plugins/vm/VmLiveMigration.cpp diff --git a/src/plugins/vm/VmLiveMigration.cpp b/src/plugins/vm/VmLiveMigration.cpp index f0ec4ec59e..825284fcf3 100644 --- a/src/plugins/vm/VmLiveMigration.cpp +++ b/src/plugins/vm/VmLiveMigration.cpp @@ -1,20 +1,25 @@ -/* Copyright (c) 2013-2017. The SimGrid Team. All rights reserved. */ +/* Copyright (c) 2013-2019. The SimGrid Team. All rights reserved. */ /* This program is free software; you can redistribute it and/or modify it * under the terms of the license (GNU LGPL) which comes with this package. */ -#include -#include -#include -#include -#include -#include -#include +#include "src/plugins/vm/VmLiveMigration.hpp" +#include "simgrid/Exception.hpp" +#include "src/instr/instr_private.hpp" +#include "src/plugins/vm/VirtualMachineImpl.hpp" +#include "src/plugins/vm/VmHostExt.hpp" XBT_LOG_NEW_DEFAULT_CATEGORY(vm_live_migration, "S4U virtual machines live migration"); namespace simgrid { namespace vm { +simgrid::xbt::Extension VmMigrationExt::EXTENSION_ID; + +void VmMigrationExt::ensureVmMigrationExtInstalled() +{ + if (not EXTENSION_ID.valid()) + EXTENSION_ID = simgrid::s4u::Host::extension_create(); +} void MigrationRx::operator()() { @@ -22,7 +27,7 @@ void MigrationRx::operator()() bool received_finalize = false; std::string finalize_task_name = - std::string("__mig_stage3:") + vm_->getCname() + "(" + src_pm_->getCname() + "-" + dst_pm_->getCname() + ")"; + std::string("__mig_stage3:") + vm_->get_cname() + "(" + src_pm_->get_cname() + "-" + dst_pm_->get_cname() + ")"; while (not received_finalize) { std::string* payload = static_cast(mbox->get()); @@ -38,40 +43,38 @@ void MigrationRx::operator()() /* Update the vm location */ /* precopy migration makes the VM temporally paused */ - xbt_assert(vm_->getState() == SURF_VM_STATE_SUSPENDED); + xbt_assert(vm_->get_state() == s4u::VirtualMachine::state::SUSPENDED); /* Update the vm location and resume it */ - vm_->setPm(dst_pm_); + vm_->set_pm(dst_pm_); vm_->resume(); // Now the VM is running on the new host (the migration is completed) (even if the SRC crash) - vm_->pimpl_vm_->isMigrating = false; - XBT_DEBUG("VM(%s) moved from PM(%s) to PM(%s)", vm_->getCname(), src_pm_->getCname(), dst_pm_->getCname()); + vm_->get_impl()->is_migrating_ = false; + XBT_DEBUG("VM(%s) moved from PM(%s) to PM(%s)", vm_->get_cname(), src_pm_->get_cname(), dst_pm_->get_cname()); - if (TRACE_msg_vm_is_enabled()) { + if (TRACE_vm_is_enabled()) { static long long int counter = 0; std::string key = std::to_string(counter); counter++; // start link - container_t msg = simgrid::instr::Container::byName(vm_->getName()); - simgrid::instr::Container::getRoot()->getLink("MSG_VM_LINK")->startEvent(msg, "M", key); + container_t msg = simgrid::instr::Container::by_name(vm_->get_name()); + simgrid::instr::Container::get_root()->get_link("VM_LINK")->start_event(msg, "M", key); // destroy existing container of this vm - container_t existing_container = simgrid::instr::Container::byName(vm_->getName()); - existing_container->removeFromParent(); - delete existing_container; + simgrid::instr::Container::by_name(vm_->get_name())->remove_from_parent(); // create new container on the new_host location - new simgrid::instr::Container(vm_->getCname(), "MSG_VM", simgrid::instr::Container::byName(dst_pm_->getName())); + new simgrid::instr::Container(vm_->get_name(), "VM", simgrid::instr::Container::by_name(dst_pm_->get_name())); // end link - msg = simgrid::instr::Container::byName(vm_->getName()); - simgrid::instr::Container::getRoot()->getLink("MSG_VM_LINK")->endEvent(msg, "M", key); + msg = simgrid::instr::Container::by_name(vm_->get_name()); + simgrid::instr::Container::get_root()->get_link("VM_LINK")->end_event(msg, "M", key); } // Inform the SRC that the migration has been correctly performed std::string* payload = new std::string("__mig_stage4:"); - *payload = *payload + vm_->getCname() + "(" + src_pm_->getCname() + "-" + dst_pm_->getCname() + ")"; + *payload = *payload + vm_->get_cname() + "(" + src_pm_->get_cname() + "-" + dst_pm_->get_cname() + ")"; mbox_ctl->put(payload, 0); @@ -93,26 +96,27 @@ sg_size_t MigrationTx::sendMigrationData(sg_size_t size, int stage, int stage2_r { sg_size_t sent = size; std::string* msg = new std::string("__mig_stage"); - *msg = *msg + std::to_string(stage) + ":" + vm_->getCname() + "(" + src_pm_->getCname() + "-" + dst_pm_->getCname() + - ")"; + *msg = *msg + std::to_string(stage) + ":" + vm_->get_cname() + "(" + src_pm_->get_cname() + "-" + + dst_pm_->get_cname() + ")"; - double clock_sta = s4u::Engine::getClock(); + double clock_sta = s4u::Engine::get_clock(); s4u::Activity* comm = nullptr; try { if (mig_speed > 0) - comm = mbox->put_init(msg, size)->setRate(mig_speed)->wait(timeout); + comm = mbox->put_init(msg, size)->set_rate(mig_speed)->wait_for(timeout); else - comm = mbox->put_async(msg, size)->wait(); + comm = mbox->put_async(msg, size)->wait_for(timeout); } catch (xbt_ex& e) { if (comm) { - sg_size_t remaining = static_cast(comm->getRemains()); + sg_size_t remaining = static_cast(comm->get_remaining()); XBT_VERB("timeout (%lf s) in sending_migration_data, remaining %llu bytes of %llu", timeout, remaining, size); sent -= remaining; } + delete msg; } - double clock_end = s4u::Engine::getClock(); + double clock_end = s4u::Engine::get_clock(); double duration = clock_end - clock_sta; double actual_speed = size / duration; @@ -130,8 +134,8 @@ void MigrationTx::operator()() { XBT_DEBUG("mig: tx_start"); - double host_speed = vm_->getPm()->getSpeed(); - const sg_size_t ramsize = vm_->getRamsize(); + double host_speed = vm_->get_pm()->get_speed(); + const sg_size_t ramsize = vm_->get_ramsize(); const double dp_rate = host_speed ? (sg_vm_get_migration_speed(vm_) * sg_vm_get_dirty_page_intensity(vm_)) / host_speed : 1; const sg_size_t dp_cap = sg_vm_get_working_set_memory(vm_); @@ -142,7 +146,11 @@ void MigrationTx::operator()() bool skip_stage2 = false; size_t remaining_size = ramsize; - size_t threshold = 0.0; + + double clock_prev_send; + double clock_post_send; + double bandwidth; + size_t threshold; /* check parameters */ if (ramsize == 0) @@ -158,7 +166,7 @@ void MigrationTx::operator()() sg_vm_start_dirty_page_tracking(vm_); double computed_during_stage1 = 0; - double clock_prev_send = s4u::Engine::getClock(); + clock_prev_send = s4u::Engine::get_clock(); try { /* At stage 1, we do not need timeout. We have to send all the memory pages even though the duration of this @@ -181,7 +189,7 @@ void MigrationTx::operator()() return; } - double clock_post_send = s4u::Engine::getClock(); + clock_post_send = s4u::Engine::get_clock(); mig_timeout -= (clock_post_send - clock_prev_send); if (mig_timeout < 0) { XBT_VERB("The duration of stage 1 exceeds the timeout value, skip stage 2"); @@ -189,8 +197,8 @@ void MigrationTx::operator()() } /* estimate bandwidth */ - double bandwidth = ramsize / (clock_post_send - clock_prev_send); - threshold = bandwidth * max_downtime; + bandwidth = ramsize / (clock_post_send - clock_prev_send); + threshold = bandwidth * max_downtime; XBT_DEBUG("actual bandwidth %f (MB/s), threshold %zu", bandwidth / 1024 / 1024, threshold); /* Stage2: send update pages iteratively until the size of remaining states becomes smaller than threshold value. */ @@ -217,8 +225,8 @@ void MigrationTx::operator()() if (remaining_size < threshold) break; - sg_size_t sent = 0; - double clock_prev_send = s4u::Engine::getClock(); + sg_size_t sent = 0; + clock_prev_send = s4u::Engine::get_clock(); try { XBT_DEBUG("Stage 2, gonna send %llu", updated_size); sent = sendMigrationData(updated_size, 2, stage2_round, mig_speed, mig_timeout); @@ -229,12 +237,12 @@ void MigrationTx::operator()() sg_vm_stop_dirty_page_tracking(vm_); return; } - double clock_post_send = s4u::Engine::getClock(); + clock_post_send = s4u::Engine::get_clock(); if (sent == updated_size) { /* timeout did not happen */ - double bandwidth = updated_size / (clock_post_send - clock_prev_send); - threshold = bandwidth * max_downtime; + bandwidth = updated_size / (clock_post_send - clock_prev_send); + threshold = bandwidth * max_downtime; XBT_DEBUG("actual bandwidth %f, threshold %zu", bandwidth / 1024 / 1024, threshold); remaining_size -= sent; stage2_round += 1; @@ -279,41 +287,82 @@ void MigrationTx::operator()() } } -SG_BEGIN_DECL() +static void onVirtualMachineShutdown(simgrid::s4u::VirtualMachine& vm) +{ + if (vm.get_impl()->is_migrating_) { + vm.extension()->rx_->kill(); + vm.extension()->tx_->kill(); + vm.extension()->issuer_->kill(); + vm.get_impl()->is_migrating_ = false; + } +} + +void sg_vm_live_migration_plugin_init() +{ + sg_vm_dirty_page_tracking_init(); + simgrid::vm::VmMigrationExt::ensureVmMigrationExtInstalled(); + simgrid::s4u::VirtualMachine::on_shutdown.connect(&onVirtualMachineShutdown); +} + +simgrid::s4u::VirtualMachine* sg_vm_create_migratable(simgrid::s4u::Host* pm, const char* name, int coreAmount, + int ramsize, int mig_netspeed, int dp_intensity) +{ + simgrid::vm::VmHostExt::ensureVmExtInstalled(); + + /* For the moment, intensity_rate is the percentage against the migration bandwidth */ + + sg_vm_t vm = new simgrid::s4u::VirtualMachine(name, pm, coreAmount, static_cast(ramsize) * 1024 * 1024); + sg_vm_set_dirty_page_intensity(vm, dp_intensity / 100.0); + sg_vm_set_working_set_memory(vm, vm->get_ramsize() * 0.9); // assume working set memory is 90% of ramsize + sg_vm_set_migration_speed(vm, mig_netspeed * 1024 * 1024.0); + + XBT_DEBUG("migspeed : %f intensity mem : %d", mig_netspeed * 1024 * 1024.0, dp_intensity); + + return vm; +} + +int sg_vm_is_migrating(simgrid::s4u::VirtualMachine* vm) +{ + return vm->get_impl()->is_migrating_; +} + void sg_vm_migrate(simgrid::s4u::VirtualMachine* vm, simgrid::s4u::Host* dst_pm) { - simgrid::s4u::Host* src_pm = vm->getPm(); + simgrid::s4u::Host* src_pm = vm->get_pm(); - if (src_pm->isOff()) - THROWF(vm_error, 0, "Cannot migrate VM '%s' from host '%s', which is offline.", vm->getCname(), src_pm->getCname()); - if (dst_pm->isOff()) - THROWF(vm_error, 0, "Cannot migrate VM '%s' to host '%s', which is offline.", vm->getCname(), dst_pm->getCname()); - if (vm->getState() != SURF_VM_STATE_RUNNING) - THROWF(vm_error, 0, "Cannot migrate VM '%s' that is not running yet.", vm->getCname()); - if (vm->isMigrating()) - THROWF(vm_error, 0, "Cannot migrate VM '%s' that is already migrating.", vm->getCname()); + if (not src_pm->is_on()) + THROWF(vm_error, 0, "Cannot migrate VM '%s' from host '%s', which is offline.", vm->get_cname(), + src_pm->get_cname()); + if (not dst_pm->is_on()) + THROWF(vm_error, 0, "Cannot migrate VM '%s' to host '%s', which is offline.", vm->get_cname(), dst_pm->get_cname()); + if (vm->get_state() != simgrid::s4u::VirtualMachine::state::RUNNING) + THROWF(vm_error, 0, "Cannot migrate VM '%s' that is not running yet.", vm->get_cname()); + if (vm->get_impl()->is_migrating_) + THROWF(vm_error, 0, "Cannot migrate VM '%s' that is already migrating.", vm->get_cname()); - vm->pimpl_vm_->isMigrating = true; + vm->get_impl()->is_migrating_ = true; + simgrid::s4u::VirtualMachine::on_migration_start(*vm); std::string rx_name = - std::string("__pr_mig_rx:") + vm->getCname() + "(" + src_pm->getCname() + "-" + dst_pm->getCname() + ")"; + std::string("__pr_mig_rx:") + vm->get_cname() + "(" + src_pm->get_cname() + "-" + dst_pm->get_cname() + ")"; std::string tx_name = - std::string("__pr_mig_tx:") + vm->getCname() + "(" + src_pm->getCname() + "-" + dst_pm->getCname() + ")"; + std::string("__pr_mig_tx:") + vm->get_cname() + "(" + src_pm->get_cname() + "-" + dst_pm->get_cname() + ")"; simgrid::s4u::ActorPtr rx = - simgrid::s4u::Actor::createActor(rx_name.c_str(), dst_pm, simgrid::vm::MigrationRx(vm, dst_pm)); + simgrid::s4u::Actor::create(rx_name.c_str(), dst_pm, simgrid::vm::MigrationRx(vm, dst_pm)); simgrid::s4u::ActorPtr tx = - simgrid::s4u::Actor::createActor(tx_name.c_str(), src_pm, simgrid::vm::MigrationTx(vm, dst_pm)); + simgrid::s4u::Actor::create(tx_name.c_str(), src_pm, simgrid::vm::MigrationTx(vm, dst_pm)); + + vm->extension_set(new simgrid::vm::VmMigrationExt(simgrid::s4u::Actor::self(), rx, tx)); /* wait until the migration have finished or on error has occurred */ XBT_DEBUG("wait for reception of the final ACK (i.e. migration has been correctly performed"); - simgrid::s4u::MailboxPtr mbox_ctl = simgrid::s4u::Mailbox::byName( - std::string("__mbox_mig_ctl:") + vm->getCname() + "(" + src_pm->getCname() + "-" + dst_pm->getCname() + ")"); + simgrid::s4u::MailboxPtr mbox_ctl = simgrid::s4u::Mailbox::by_name( + std::string("__mbox_mig_ctl:") + vm->get_cname() + "(" + src_pm->get_cname() + "-" + dst_pm->get_cname() + ")"); delete static_cast(mbox_ctl->get()); - tx->join(); rx->join(); - vm->pimpl_vm_->isMigrating = false; -} + vm->get_impl()->is_migrating_ = false; + simgrid::s4u::VirtualMachine::on_migration_end(*vm); }