1 /* Copyright (c) 2010-2020. The SimGrid Team. All rights reserved. */
3 /* This program is free software; you can redistribute it and/or modify it
4 * under the terms of the license (GNU LGPL) which comes with this package. */
6 #include "simgrid/plugins/load.h"
7 #include "src/include/surf/surf.hpp"
8 #include "src/kernel/activity/ExecImpl.hpp"
9 #include "src/plugins/vm/VirtualMachineImpl.hpp"
10 #include <simgrid/s4u.hpp>
12 // Makes sure that this plugin can be activated from the command line with ``--cfg=plugin:host_load``
13 SIMGRID_REGISTER_PLUGIN(host_load, "Cpu load", &sg_host_load_plugin_init)
15 /** @defgroup plugin_host_load Simple plugin that monitors the current load for each host.
18 In addition, this constitutes a good introductory example on how to write a plugin.
19 It attaches an extension to each host to store some data, and places callbacks in the following signals:
21 - :cpp:member:`simgrid::s4u::Host::on_creation`: Attach a new extension to the newly created host.
22 - :cpp:member:`simgrid::s4u::Exec::on_start`: Make note that a new execution started, increasing the load.
23 - :cpp:member:`simgrid::s4u::Exec::on_completion`: Make note that an execution completed, decreasing the load.
24 - :cpp:member:`simgrid::s4u::Host::on_state_change`: Do what is appropriate when the host gets suspended, turned off
26 - :cpp:member:`simgrid::s4u::Host::on_speed_change`: Do what is appropriate when the DVFS is modified.
28 Note that extensions are automatically destroyed when the host gets destroyed.
32 XBT_LOG_NEW_DEFAULT_SUBCATEGORY(surf_plugin_load, surf, "Logging specific to the HostLoad plugin");
// Placeholder stored as the "remaining cost" of an activity when add_activity() registers it.
// update() compares against it and replaces it with the action's cost the first time it sees the activity running.
37 static const double activity_uninitialized_remaining_cost = -1;
39 /** This class stores the extra data needed by this plugin about a given host
41 * It is stored as an extension of s4u::Host. Such extensions are retrieved by type as follows:
44 * simgrid::s4u::Host* this_host = ???;
45 * this_extension = this_host->extension<HostLoad>();
48 * If no extension of that type was ever attached to the inspected object, the ``extension<X>()`` template returns
51 * Please refer to the implementation of ``sg_host_load_plugin_init()`` to see how the extension objects are attached to
52 * hosts at initialization time.
// Handle identifying this extension type on hosts; it is assigned in sg_host_load_plugin_init().
56 static simgrid::xbt::Extension<simgrid::s4u::Host, HostLoad> EXTENSION_ID;
// Builds the extension for one host: both time stamps start at surf_get_clock(), and the speed and
// load are sampled from the host right away.
// NOTE(review): the initializers below dereference host_, so host_ must be initialized from ptr before
// them; that initializer is not visible in this view -- confirm.
58 explicit HostLoad(simgrid::s4u::Host* ptr)
60 , last_updated_(surf_get_clock())
61 , last_reset_(surf_get_clock())
62 , current_speed_(host_->get_speed())
63 , current_flops_(host_->get_load())
66 ~HostLoad() = default;
// Construction from a Host reference or temporary is rejected at compile time; only a pointer is accepted.
68 explicit HostLoad(simgrid::s4u::Host& ptr) = delete;
69 explicit HostLoad(simgrid::s4u::Host&& ptr) = delete;
// Instantaneous load of the host as a ratio; defined out of line.
71 double get_current_load();
72 /** Get the the average load since last reset(), as a ratio
74 * That's the ratio (amount of flops that were actually computed) / (amount of flops that could have been computed at full speed)
76 double get_average_load() { update(); return (theor_max_flops_ == 0) ? 0 : computed_flops_ / theor_max_flops_; };
77 /** Amount of flops computed since last reset() */
78 double get_computed_flops() { update(); return computed_flops_; }
79 /** Return idle time since last reset() */
80 double get_idle_time() { update(); return idle_time_; }
81 /** Return idle time over the whole simulation */
82 double get_total_idle_time() { update(); return total_idle_time_; }
// Starts tracking an execution on this host; called from the Exec::on_start callback.
84 void add_activity(simgrid::kernel::activity::ExecImpl* activity);
// Host this extension describes; every query about speed, load and core count goes through it.
88 simgrid::s4u::Host* host_ = nullptr;
89 /* Stores all currently ongoing activities (computations) on this machine */
90 std::map<simgrid::kernel::activity::ExecImpl*, /* cost still remaining*/ double> current_activities;
// Clock value that update() measures the elapsed period against; set by the constructor and by reset().
91 double last_updated_ = 0;
// Clock value of the last reset(); also set by the constructor.
92 double last_reset_ = 0;
94 * current_speed each core is running at; we need to store this as the speed
95 * will already have changed once we get notified
97 double current_speed_ = 0;
99 * How many flops are currently used by all the processes running on this
102 double current_flops_ = 0;
// Flops accumulated by update(); reported by get_computed_flops() and used as numerator of get_average_load().
103 double computed_flops_ = 0;
// Time accumulated by update() over periods where the host load was 0.
104 double idle_time_ = 0;
105 double total_idle_time_ = 0; /* This is updated but never gets reset */
// Flops the host could have computed at full speed; denominator of get_average_load().
106 double theor_max_flops_ = 0;
109 // Create the static field that the extension mechanism needs; it is assigned in sg_host_load_plugin_init()
110 simgrid::xbt::Extension<simgrid::s4u::Host, HostLoad> HostLoad::EXTENSION_ID;
112 void HostLoad::add_activity(simgrid::kernel::activity::ExecImpl* activity)
114 current_activities.insert({activity, activity_uninitialized_remaining_cost});
// Brings the counters up to date with the current clock: first accounts the flops done by the tracked
// activities, then accumulates idle time and theoretical capacity for the period since the last update.
117 void HostLoad::update()
119 double now = surf_get_clock();
121 // This loop updates the flops that the host executed for the ongoing computations
122 auto iter = begin(current_activities);
123 while (iter != end(current_activities)) {
124 auto& activity = iter->first; // Just an alias
125 auto& remaining_cost_after_last_update = iter->second; // Just an alias
126 auto& action = activity->surf_action_;
// Keep a copy of the position: it is the one handed to erase() below.
// NOTE(review): no statement advancing `iter` is visible in this view -- confirm it is stepped before the erase.
127 auto current_iter = iter;
// Activity still running and not finishing at this very instant: account what it computed since the last update.
130 if (action != nullptr && action->get_finish_time() != now && activity->state_ == kernel::activity::State::RUNNING) {
// First time this activity is seen running: replace the placeholder with the action's cost.
131 if (remaining_cost_after_last_update == activity_uninitialized_remaining_cost) {
132 remaining_cost_after_last_update = action->get_cost();
134 double computed_flops_since_last_update = remaining_cost_after_last_update - /*remaining now*/activity->get_remaining();
135 computed_flops_ += computed_flops_since_last_update;
136 remaining_cost_after_last_update = activity->get_remaining();
// Finished activity: what was still recorded as remaining is counted as computed, then tracking stops.
// NOTE(review): if the entry still holds the placeholder (-1) here, that value is what gets added -- confirm
// this cannot happen.
137 } else if (activity->state_ == kernel::activity::State::DONE) {
138 computed_flops_ += remaining_cost_after_last_update;
139 current_activities.erase(current_iter);
143 /* Current flop per second computed by the cpu; current_flops = k * pstate_speed_in_flops, k @in {0, 1, ..., cores-1}
144 * designates number of active cores; will be 0 if CPU is currently idle */
145 current_flops_ = host_->get_load();
// No load at all: the whole period since the last update is counted as idle, in both idle counters.
147 if (current_flops_ == 0) {
148 idle_time_ += (now - last_updated_);
149 total_idle_time_ += (now - last_updated_);
150 XBT_DEBUG("[%s]: Currently idle -> Added %f seconds to idle time (totaling %fs)", host_->get_cname(), (now - last_updated_), idle_time_);
// Capacity of the elapsed period uses the speed stored at the previous update, because the host speed may
// already have changed by the time this runs; the stored speed is refreshed afterwards.
// NOTE(review): no statement refreshing last_updated_ is visible in this view -- confirm it is set to `now`.
153 theor_max_flops_ += current_speed_ * host_->get_core_count() * (now - last_updated_);
154 current_speed_ = host_->get_speed();
158 /** @brief Get the current load as a ratio = achieved_flops / (core_current_speed * core_amount)
160 * You may also want to check simgrid::s4u::Host::get_load() that simply returns
161 * the achieved flop rate (in flops per seconds), ie the load that a new action arriving on
162 * that host would suffer.
164 * Please note that this function only returns an instantaneous load that may be deceiving
165 * in some scenarios. For example, imagine that an activity terminates at time t, and that
166 * another activity is created on the same host at the exact same timestamp. The load was
167 * never 0 on the simulated machine since the time did not advance between the two events.
168 * But still, if you call this function between the two events (in the simulator course), it
169 * returns 0 although there is no time (in the simulated time) where this value is valid.
171 double HostLoad::get_current_load()
173 // We don't need to call update() here because it is called every time an action terminates or starts
174 return current_flops_ / (host_->get_speed() * host_->get_core_count());
178 * Resets the counters
180 void HostLoad::reset()
// Restart both time stamps from the current clock.
182 last_updated_ = surf_get_clock();
183 last_reset_ = surf_get_clock();
// NOTE(review): the accessors document idle time and computed flops as "since last reset()", but no statement
// clearing them is visible in this view -- confirm they are zeroed here as well.
186 theor_max_flops_ = 0;
// Re-sample the host so that the next update() starts from its present load and speed.
187 current_flops_ = host_->get_load();
188 current_speed_ = host_->get_speed();
190 } // namespace plugin
191 } // namespace simgrid
193 using simgrid::plugin::HostLoad;
195 /* **************************** events callback *************************** */
196 /* This callback is fired either when the host changes its state (on/off) or its speed
197 * (because the user changed the pstate, or because of external trace events) */
198 static void on_host_change(simgrid::s4u::Host const& host)
// NOTE(review): the statement controlled by this test is not visible in this view; per its comment it should
// leave the function for virtual machines -- confirm.
200 if (dynamic_cast<simgrid::s4u::VirtualMachine const*>(&host)) // Ignore virtual machines
// Refresh the counters of the host that changed.
203 host.extension<HostLoad>()->update();
206 /* **************************** Public interface *************************** */
208 /** @brief Initializes the HostLoad plugin
209 * @ingroup plugin_host_load
// Registers the HostLoad extension, attaches one to the hosts that already exist, and connects the
// callbacks that keep the per-host counters up to date.
211 void sg_host_load_plugin_init()
// NOTE(review): the statement controlled by this test is not visible in this view -- confirm it returns early.
213 if (HostLoad::EXTENSION_ID.valid()) // Don't do the job twice
216 // First register our extension of Hosts properly
217 HostLoad::EXTENSION_ID = simgrid::s4u::Host::extension_create<HostLoad>();
219 // If SimGrid is already initialized, we need to attach an extension to each existing host
220 if (simgrid::s4u::Engine::is_initialized()) {
221 simgrid::s4u::Engine* e = simgrid::s4u::Engine::get_instance();
222 for (auto& host : e->get_all_hosts()) {
// The object is handed over to the host; per the plugin documentation, extensions are destroyed with their host.
223 host->extension_set(new HostLoad(host));
227 // Make sure that every future host also gets an extension (in case the platform is not loaded yet)
228 simgrid::s4u::Host::on_creation.connect([](simgrid::s4u::Host& host) {
// NOTE(review): the statement controlled by this test is not visible in this view -- confirm it skips the VM.
229 if (dynamic_cast<simgrid::s4u::VirtualMachine*>(&host)) // Ignore virtual machines
231 host.extension_set(new HostLoad(&host));
// When an execution starts on a single host: start tracking it, then refresh that host's counters.
234 simgrid::s4u::Exec::on_start.connect([](simgrid::s4u::Actor const&, simgrid::s4u::Exec const& activity) {
235 if (activity.get_host_number() == 1) { // We only run on one host
236 simgrid::s4u::Host* host = activity.get_host();
// NOTE(review): `vm` is not used by any line visible here; presumably the host is redirected to the machine
// running the VM before the assertion -- confirm.
237 const simgrid::s4u::VirtualMachine* vm = dynamic_cast<simgrid::s4u::VirtualMachine*>(host);
240 xbt_assert(host != nullptr);
241 host->extension<HostLoad>()->add_activity(static_cast<simgrid::kernel::activity::ExecImpl*>(activity.get_impl()));
242 host->extension<HostLoad>()->update(); // If the system was idle until now, we need to update *before*
243 // this computation starts running so we can keep track of the
244 // idle time. (Communication operations don't trigger this hook!)
246 else { // This runs on multiple hosts
247 XBT_WARN("HostLoad plugin currently does not support executions on several hosts");
// When an execution completes on a single host: refresh that host's counters so the finished activity is accounted.
250 simgrid::s4u::Exec::on_completion.connect([](simgrid::s4u::Actor const&, simgrid::s4u::Exec const& activity) {
251 if (activity.get_host_number() == 1) { // We only run on one host
252 simgrid::s4u::Host* host = activity.get_host();
// NOTE(review): same remark as in the on_start callback -- `vm` is unused in the visible lines.
253 const simgrid::s4u::VirtualMachine* vm = dynamic_cast<simgrid::s4u::VirtualMachine*>(host);
256 xbt_assert(host != nullptr);
257 host->extension<HostLoad>()->update();
259 else { // This runs on multiple hosts
260 XBT_WARN("HostLoad plugin currently does not support executions on several hosts");
// State changes and speed changes both refresh the counters through on_host_change.
263 simgrid::s4u::Host::on_state_change.connect(&on_host_change);
264 simgrid::s4u::Host::on_speed_change.connect(&on_host_change);
267 /** @brief Returns the current load of that host, as a ratio = achieved_flops / (core_current_speed * core_amount)
268 * @ingroup plugin_host_load
270 double sg_host_get_current_load(const_sg_host_t host)
272 xbt_assert(HostLoad::EXTENSION_ID.valid(), "Please sg_host_load_plugin_init() to initialize this plugin.");
274 return host->extension<HostLoad>()->get_current_load();
277 /** @brief Returns the current load of that host
278 * @ingroup plugin_host_load
280 double sg_host_get_avg_load(const_sg_host_t host)
282 xbt_assert(HostLoad::EXTENSION_ID.valid(), "Please sg_host_load_plugin_init() to initialize this plugin.");
284 return host->extension<HostLoad>()->get_average_load();
287 /** @brief Returns the time this host was idle since the last reset
288 * @ingroup plugin_host_load
290 double sg_host_get_idle_time(const_sg_host_t host)
292 xbt_assert(HostLoad::EXTENSION_ID.valid(), "Please sg_host_load_plugin_init() to initialize this plugin.");
294 return host->extension<HostLoad>()->get_idle_time();
297 /** @brief Returns the time this host was idle since the beginning of the simulation
298 * @ingroup plugin_host_load
300 double sg_host_get_total_idle_time(const_sg_host_t host)
302 xbt_assert(HostLoad::EXTENSION_ID.valid(), "Please sg_host_load_plugin_init() to initialize this plugin.");
304 return host->extension<HostLoad>()->get_total_idle_time();
307 /** @brief Returns the amount of flops computed by that host since the last reset
308 * @ingroup plugin_host_load
310 double sg_host_get_computed_flops(const_sg_host_t host)
312 xbt_assert(HostLoad::EXTENSION_ID.valid(), "Please sg_host_load_plugin_init() to initialize this plugin.");
314 return host->extension<HostLoad>()->get_computed_flops();
317 /** @brief Resets the idle time and flops amount of that host
318 * @ingroup plugin_host_load
320 void sg_host_load_reset(const_sg_host_t host)
322 xbt_assert(HostLoad::EXTENSION_ID.valid(), "Please sg_host_load_plugin_init() to initialize this plugin.");
324 host->extension<HostLoad>()->reset();