X-Git-Url: http://info.iut-bm.univ-fcomte.fr/pub/gitweb/simgrid.git/blobdiff_plain/0b12f8c2c1c67c98251c9e523725c74ac172c0f6..b372d23d3d8818b4547ef207f43b45709298a002:/src/plugins/host_dvfs.cpp diff --git a/src/plugins/host_dvfs.cpp b/src/plugins/host_dvfs.cpp index da093ade75..4378b2b5ee 100644 --- a/src/plugins/host_dvfs.cpp +++ b/src/plugins/host_dvfs.cpp @@ -1,32 +1,59 @@ -/* Copyright (c) 2010-2018. The SimGrid Team. All rights reserved. */ +/* Copyright (c) 2010-2020. The SimGrid Team. All rights reserved. */ /* This program is free software; you can redistribute it and/or modify it * under the terms of the license (GNU LGPL) which comes with this package. */ #include "simgrid/plugins/dvfs.h" #include "simgrid/plugins/load.h" +#include "simgrid/s4u/Engine.hpp" +#include "src/internal_config.h" // HAVE_SMPI +#include "src/kernel/activity/ExecImpl.hpp" #include "src/plugins/vm/VirtualMachineImpl.hpp" +#if HAVE_SMPI +#include "src/smpi/plugins/ampi/ampi.hpp" +#endif #include #include +#if HAVE_SMPI +#include "src/smpi/include/smpi_request.hpp" +#endif SIMGRID_REGISTER_PLUGIN(host_dvfs, "Dvfs support", &sg_host_dvfs_plugin_init) -static simgrid::config::Flag cfg_sampling_rate("plugin/dvfs/sampling-rate", {"plugin/dvfs/sampling_rate"}, - "How often should the dvfs plugin check whether the frequency needs to be changed?", 0.1, - [](double val){if (val != 0.1) sg_host_dvfs_plugin_init();}); +static simgrid::config::Flag + cfg_sampling_rate("plugin/dvfs/sampling-rate", + "How often should the dvfs plugin check whether the frequency needs to be changed?", 0.1, + [](double val) { + if (val != 0.1) + sg_host_dvfs_plugin_init(); + }); static simgrid::config::Flag cfg_governor("plugin/dvfs/governor", - "Which Governor should be used that adapts the CPU frequency?", "performance", - - std::map({ - {"conservative", "TODO: Doc"}, - {"ondemand", "TODO: Doc"}, - {"performance", "TODO: Doc"}, - {"powersave", "TODO: Doc"}, - }), - - [](std::string val){if (val != "performance") sg_host_dvfs_plugin_init();}); + "Which Governor should be used that adapts the CPU frequency?", + "performance", + + std::map>({ +#if HAVE_SMPI + {"adagio", "TODO: Doc"}, +#endif + {"conservative", "TODO: Doc"}, {"ondemand", "TODO: Doc"}, + {"performance", "TODO: Doc"}, {"powersave", "TODO: Doc"}, + }), + + [](const std::string& val) { + if (val != "performance") + sg_host_dvfs_plugin_init(); + }); + +static simgrid::config::Flag + cfg_min_pstate("plugin/dvfs/min-pstate", + "Which pstate is the minimum (and hence fastest) pstate for this governor?", 0); + +static const int max_pstate_not_limited = -1; +static simgrid::config::Flag + cfg_max_pstate("plugin/dvfs/max-pstate", + "Which pstate is the maximum (and hence slowest) pstate for this governor?", max_pstate_not_limited); /** @addtogroup SURF_plugin_load @@ -60,31 +87,49 @@ namespace dvfs { * global configuration */ class Governor { - -private: simgrid::s4u::Host* const host_; double sampling_rate_; + int min_pstate = cfg_min_pstate; //< Never use a pstate less than this one + int max_pstate = cfg_max_pstate; //< Never use a pstate larger than this one public: - - explicit Governor(simgrid::s4u::Host* ptr) : host_(ptr) { init(); } + explicit Governor(simgrid::s4u::Host* ptr) + : host_(ptr) + { + if (cfg_max_pstate == max_pstate_not_limited) + max_pstate = host_->get_pstate_count() - 1; + init(); + } virtual ~Governor() = default; - virtual std::string get_name() = 0; + virtual std::string get_name() const = 0; simgrid::s4u::Host* get_host() const { return host_; } + int get_min_pstate() const { return min_pstate; } + int get_max_pstate() const { return max_pstate; } void init() { const char* local_sampling_rate_config = host_->get_property(cfg_sampling_rate.get_name()); - double global_sampling_rate_config = cfg_sampling_rate; if (local_sampling_rate_config != nullptr) { sampling_rate_ = std::stod(local_sampling_rate_config); } else { - sampling_rate_ = global_sampling_rate_config; + sampling_rate_ = cfg_sampling_rate; + } + const char* local_min_pstate_config = host_->get_property(cfg_min_pstate.get_name()); + if (local_min_pstate_config != nullptr) { + min_pstate = std::stoi(local_min_pstate_config); + } + + const char* local_max_pstate_config = host_->get_property(cfg_max_pstate.get_name()); + if (local_max_pstate_config != nullptr) { + max_pstate = std::stod(local_max_pstate_config); } + xbt_assert(max_pstate <= host_->get_pstate_count() - 1, "Value for max_pstate too large!"); + xbt_assert(min_pstate <= max_pstate, "min_pstate is larger than max_pstate!"); + xbt_assert(0 <= min_pstate, "min_pstate is negative!"); } virtual void update() = 0; - double get_sampling_rate() { return sampling_rate_; } + double get_sampling_rate() const { return sampling_rate_; } }; /** @@ -99,10 +144,10 @@ public: */ class Performance : public Governor { public: - explicit Performance(simgrid::s4u::Host* ptr) : Governor(ptr) {} - std::string get_name() override { return "Performance"; } + using Governor::Governor; + std::string get_name() const override { return "Performance"; } - void update() override { get_host()->set_pstate(0); } + void update() override { get_host()->set_pstate(get_min_pstate()); } }; /** @@ -117,10 +162,10 @@ public: */ class Powersave : public Governor { public: - explicit Powersave(simgrid::s4u::Host* ptr) : Governor(ptr) {} - std::string get_name() override { return "Powersave"; } + using Governor::Governor; + std::string get_name() const override { return "Powersave"; } - void update() override { get_host()->set_pstate(get_host()->get_pstate_count() - 1); } + void update() override { get_host()->set_pstate(get_max_pstate()); } }; /** @@ -140,8 +185,8 @@ class OnDemand : public Governor { double freq_up_threshold_ = 0.80; public: - explicit OnDemand(simgrid::s4u::Host* ptr) : Governor(ptr) {} - std::string get_name() override { return "OnDemand"; } + using Governor::Governor; + std::string get_name() const override { return "OnDemand"; } void update() override { @@ -149,8 +194,8 @@ public: sg_host_load_reset(get_host()); // Only consider the period between two calls to this method! if (load > freq_up_threshold_) { - get_host()->set_pstate(0); /* Run at max. performance! */ - XBT_INFO("Load: %f > threshold: %f --> changed to pstate %i", load, freq_up_threshold_, 0); + get_host()->set_pstate(get_min_pstate()); /* Run at max. performance! */ + XBT_INFO("Load: %f > threshold: %f --> changed to pstate %i", load, freq_up_threshold_, get_min_pstate()); } else { /* The actual implementation uses a formula here: (See Kernel file cpufreq_ondemand.c:158) * @@ -159,10 +204,11 @@ public: * So they assume that frequency increases by 100 MHz. We will just use * lowest_pstate - load*pstatesCount() */ - int max_pstate = get_host()->get_pstate_count() - 1; // Load is now < freq_up_threshold; exclude pstate 0 (the fastest) // because pstate 0 can only be selected if load > freq_up_threshold_ - int new_pstate = max_pstate - load * (max_pstate + 1); + int new_pstate = get_max_pstate() - load * (get_max_pstate() + 1); + if (new_pstate < get_min_pstate()) + new_pstate = get_min_pstate(); get_host()->set_pstate(new_pstate); XBT_DEBUG("Load: %f < threshold: %f --> changed to pstate %i", load, freq_up_threshold_, new_pstate); @@ -177,9 +223,9 @@ public: * * > The CPUfreq governor "conservative", much like the "ondemand" * > governor, sets the CPU frequency depending on the current usage. It - * > differs in behaviour in that it gracefully increases and decreases the + * > differs in behavior in that it gracefully increases and decreases the * > CPU speed rather than jumping to max speed the moment there is any load - * > on the CPU. This behaviour is more suitable in a battery powered + * > on the CPU. This behavior is more suitable in a battery powered * > environment. */ class Conservative : public Governor { @@ -187,17 +233,17 @@ class Conservative : public Governor { double freq_down_threshold_ = .2; public: - explicit Conservative(simgrid::s4u::Host* ptr) : Governor(ptr) {} - virtual std::string get_name() override { return "Conservative"; } + using Governor::Governor; + std::string get_name() const override { return "Conservative"; } - virtual void update() override + void update() override { double load = get_host()->get_core_count() * sg_host_get_avg_load(get_host()); int pstate = get_host()->get_pstate(); sg_host_load_reset(get_host()); // Only consider the period between two calls to this method! if (load > freq_up_threshold_) { - if (pstate != 0) { + if (pstate != get_min_pstate()) { get_host()->set_pstate(pstate - 1); XBT_INFO("Load: %f > threshold: %f -> increasing performance to pstate %d", load, freq_up_threshold_, pstate - 1); @@ -206,8 +252,7 @@ public: freq_up_threshold_, pstate); } } else if (load < freq_down_threshold_) { - int max_pstate = get_host()->get_pstate_count() - 1; - if (pstate != max_pstate) { // Are we in the slowest pstate already? + if (pstate != get_max_pstate()) { // Are we in the slowest pstate already? get_host()->set_pstate(pstate + 1); XBT_INFO("Load: %f < threshold: %f -> slowing down to pstate %d", load, freq_down_threshold_, pstate + 1); } else { @@ -218,6 +263,102 @@ public: } }; +#if HAVE_SMPI +class Adagio : public Governor { +private: + int best_pstate = 0; + double start_time = 0; + double comp_counter = 0; + double comp_timer = 0; + + std::vector> rates; // Each host + all frequencies of that host + + unsigned int task_id = 0; + bool iteration_running = false; /*< Are we currently between iteration_in and iteration_out calls? */ + +public: + explicit Adagio(simgrid::s4u::Host* ptr) + : Governor(ptr), rates(100, std::vector(ptr->get_pstate_count(), 0.0)) + { + simgrid::smpi::plugin::ampi::on_iteration_in.connect([this](simgrid::s4u::Actor const& actor) { + // Every instance of this class subscribes to this event, so one per host + // This means that for any actor, all 'hosts' are normally notified of these + // changes, even those who don't currently run the actor 'proc_id'. + // -> Let's check if this signal call is for us! + if (get_host() == actor.get_host()) { + iteration_running = true; + } + }); + simgrid::smpi::plugin::ampi::on_iteration_out.connect([this](simgrid::s4u::Actor const& actor) { + if (get_host() == actor.get_host()) { + iteration_running = false; + task_id = 0; + } + }); + simgrid::s4u::Exec::on_start.connect([this](simgrid::s4u::Exec const& activity) { + if (activity.get_host() == get_host()) + pre_task(); + }); + simgrid::s4u::Exec::on_completion.connect([this](simgrid::s4u::Exec const& activity) { + // For more than one host (not yet supported), we can access the host via + // simcalls_.front()->issuer->get_iface()->get_host() + if (activity.get_host() == get_host() && iteration_running) { + comp_timer += activity.get_finish_time() - activity.get_start_time(); + } + }); + // FIXME I think that this fires at the same time for all hosts, so when the src sends something, + // the dst will be notified even though it didn't even arrive at the recv yet + simgrid::s4u::Link::on_communicate.connect([this](const kernel::resource::NetworkAction& act) { + if ((get_host() == &act.get_src() || get_host() == &act.get_dst()) && iteration_running) { + post_task(); + } + }); + } + + std::string get_name() const override { return "Adagio"; } + + void pre_task() + { + sg_host_load_reset(get_host()); + comp_counter = sg_host_get_computed_flops(get_host()); // Should be 0 because of the reset + comp_timer = 0; + start_time = simgrid::s4u::Engine::get_clock(); + if (rates.size() <= task_id) + rates.resize(task_id + 5, std::vector(get_host()->get_pstate_count(), 0.0)); + if (rates[task_id][best_pstate] == 0) + best_pstate = 0; + get_host()->set_pstate(best_pstate); // Load our schedule + XBT_DEBUG("Set pstate to %i", best_pstate); + } + + void post_task() + { + double computed_flops = sg_host_get_computed_flops(get_host()) - comp_counter; + double target_time = (simgrid::s4u::Engine::get_clock() - start_time); + target_time = target_time * 99.0 / 100.0; // FIXME We account for t_copy arbitrarily with 1% + // -- this needs to be fixed + + bool is_initialized = rates[task_id][best_pstate] != 0; + rates[task_id][best_pstate] = computed_flops / comp_timer; + if (not is_initialized) { + for (int i = 1; i < get_host()->get_pstate_count(); i++) { + rates[task_id][i] = rates[task_id][0] * (get_host()->get_pstate_speed(i) / get_host()->get_speed()); + } + } + + for (int pstate = get_host()->get_pstate_count() - 1; pstate >= 0; pstate--) { + if (computed_flops / rates[task_id][pstate] <= target_time) { + // We just found the pstate we want to use! + best_pstate = pstate; + break; + } + } + task_id++; + } + + void update() override {} +}; +#endif } // namespace dvfs } // namespace plugin } // namespace simgrid @@ -249,28 +390,29 @@ static void on_host_added(simgrid::s4u::Host& host) boost::algorithm::to_lower(dvfs_governor); } - auto governor = [&dvfs_governor, &daemon_proc]() { + auto governor = [&dvfs_governor, &daemon_proc]() -> std::unique_ptr { if (dvfs_governor == "conservative") { - return std::unique_ptr( - new simgrid::plugin::dvfs::Conservative(daemon_proc->get_host())); + return std::make_unique(daemon_proc->get_host()); } else if (dvfs_governor == "ondemand") { - return std::unique_ptr( - new simgrid::plugin::dvfs::OnDemand(daemon_proc->get_host())); - } else if (dvfs_governor == "performance") { - return std::unique_ptr( - new simgrid::plugin::dvfs::Performance(daemon_proc->get_host())); + return std::make_unique(daemon_proc->get_host()); + } +#if HAVE_SMPI + else if (dvfs_governor == "adagio") { + return std::make_unique(daemon_proc->get_host()); + } +#endif + else if (dvfs_governor == "performance") { + return std::make_unique(daemon_proc->get_host()); } else if (dvfs_governor == "powersave") { - return std::unique_ptr( - new simgrid::plugin::dvfs::Powersave(daemon_proc->get_host())); + return std::make_unique(daemon_proc->get_host()); } else { XBT_CRITICAL("No governor specified for host %s, falling back to Performance", daemon_proc->get_host()->get_cname()); - return std::unique_ptr( - new simgrid::plugin::dvfs::Performance(daemon_proc->get_host())); + return std::make_unique(daemon_proc->get_host()); } }(); - while (1) { + while (true) { // Sleep *before* updating; important for startup (i.e., t = 0). // In the beginning, we want to go with the pstates specified in the platform file // (so we sleep first) @@ -290,7 +432,7 @@ static void on_host_added(simgrid::s4u::Host& host) /* **************************** Public interface *************************** */ -/** @ingroup SURF_plugin_load +/** * @brief Initializes the HostDvfs plugin * @details The HostDvfs plugin provides an API to get the current load of each host. */