src/mc/explo/UdporChecker.cpp

   1 /* Copyright (c) 2016-2023. The SimGrid Team. All rights reserved.          */
   2
   3 /* This program is free software; you can redistribute it and/or modify it
   4  * under the terms of the license (GNU LGPL) which comes with this package. */
   5
   6 #include "src/mc/explo/UdporChecker.hpp"
   7 #include "src/mc/api/State.hpp"
   8 #include "src/mc/explo/udpor/Comb.hpp"
   9 #include "src/mc/explo/udpor/ExtensionSetCalculator.hpp"
  10 #include "src/mc/explo/udpor/History.hpp"
  11 #include "src/mc/explo/udpor/maximal_subsets_iterator.hpp"
  12
  13 #include <numeric>
  14 #include <xbt/asserts.h>
  15 #include <xbt/log.h>
  16 #include <xbt/string.hpp>
  17
  18 XBT_LOG_NEW_DEFAULT_SUBCATEGORY(mc_udpor, mc, "Logging specific to verification using UDPOR");
  19
  20 namespace simgrid::mc::udpor {
  21
  22 UdporChecker::UdporChecker(const std::vector<char*>& args) : Exploration(args, true) {}
  23
  24 void UdporChecker::run()
  25 {
  26   XBT_INFO("Starting a UDPOR exploration");
  27   state_stack.clear();
  28   state_stack.push_back(get_current_state());
  29   explore(Configuration(), EventSet(), EventSet(), EventSet());
  30   XBT_INFO("UDPOR exploration terminated -- model checking completed");
  31 }
  32
  33 void UdporChecker::explore(const Configuration& C, EventSet D, EventSet A, EventSet prev_exC)
  34 {
  35   auto& stateC   = *state_stack.back();
  36   auto exC       = compute_exC(C, stateC, prev_exC);
  37   const auto enC = compute_enC(C, exC);
  38   XBT_DEBUG("explore(C, D, A) with:\n"
  39             "C\t := %s \n"
  40             "D\t := %s \n"
  41             "A\t := %s \n"
  42             "ex(C)\t := %s \n"
  43             "en(C)\t := %s \n",
  44             C.to_string().c_str(), D.to_string().c_str(), A.to_string().c_str(), exC.to_string().c_str(),
  45             enC.to_string().c_str());
  46   XBT_DEBUG("ex(C) has %zu elements, of which %zu are in en(C)", exC.size(), enC.size());
  47
  48   // If enC is a subset of D, intuitively
  49   // there aren't any enabled transitions
  50   // which are "worth" exploring since their
  51   // exploration would lead to a so-called
  52   // "sleep-set blocked" trace.
  53   if (enC.is_subset_of(D)) {
  54     XBT_DEBUG("en(C) is a subset of the sleep set D (size %zu); if we "
  55               "kept exploring, we'd hit a sleep-set blocked trace",
  56               D.size());
  57     XBT_DEBUG("The current configuration has %zu elements", C.get_events().size());
  58
  59     // When `en(C)` is empty, intuitively this means that there
  60     // are no enabled transitions that can be executed from the
  61     // state reached by `C` (denoted `state(C)`), i.e. by some
  62     // execution of the transitions in C obeying the causality
  63     // relation. Here, then, we may be in a deadlock (the other
  64     // possibility is that we've finished running everything, and
  65     // we wouldn't be in deadlock then)
  66     if (enC.empty()) {
  67       XBT_VERB("**************************");
  68       XBT_VERB("*** TRACE INVESTIGATED ***");
  69       XBT_VERB("**************************");
  70       XBT_VERB("Execution sequence:");
  71       for (auto const& s : get_textual_trace())
  72         XBT_VERB("  %s", s.c_str());
  73       get_remote_app().check_deadlock();
  74     }
  75
  76     return;
  77   }
  78   UnfoldingEvent* e = select_next_unfolding_event(A, enC);
  79   xbt_assert(e != nullptr, "\n\n****** INVARIANT VIOLATION ******\n"
  80                            "UDPOR guarantees that an event will be chosen at each point in\n"
  81                            "the search, yet no events were actually chosen\n"
  82                            "*********************************\n\n");
  83   XBT_DEBUG("Selected event `%s` (%zu dependencies) to extend the configuration", e->to_string().c_str(),
  84             e->get_immediate_causes().size());
  85
  86   // Ce := C + {e}
  87   Configuration Ce = C;
  88   Ce.add_event(e);
  89
  90   A.remove(e);
  91   exC.remove(e);
  92
  93   // Explore(C + {e}, D, A \ {e})
  94
  95   // Move the application into stateCe (i.e. `state(C + {e})`) and make note of that state
  96   move_to_stateCe(&stateC, e);
  97   state_stack.push_back(record_current_state());
  98
  99   explore(Ce, D, std::move(A), std::move(exC));
 100
 101   // Prepare to move the application back one state.
 102   // We need only remove the state from the stack here: if we perform
 103   // another `Explore()` after computing an alternative, at that
 104   // point we'll actually create a fresh RemoteProcess
 105   state_stack.pop_back();
 106
 107   // D <-- D + {e}
 108   D.insert(e);
 109
 110   XBT_DEBUG("Checking for the existence of an alternative...");
 111   if (auto J = C.compute_alternative_to(D, this->unfolding); J.has_value()) {
 112     // Before searching the "right half", we need to make
 113     // sure the program actually reflects the fact
 114     // that we are searching again from `state(C)`. While the
 115     // stack of states is properly adjusted to represent
 116     // `state(C)` all together, the RemoteApp is currently sitting
 117     // at some *future* state with resepct to `state(C)` since the
 118     // recursive calls have moved it there.
 119     restore_program_state_with_current_stack();
 120
 121     // Explore(C, D + {e}, J \ C)
 122     auto J_minus_C = J.value().get_events().subtracting(C.get_events());
 123
 124     XBT_DEBUG("Alternative detected! The alternative is:\n"
 125               "J\t := %s \n"
 126               "J / C := %s\n"
 127               "UDPOR is going to explore it...",
 128               J.value().to_string().c_str(), J_minus_C.to_string().c_str());
 129     explore(C, D, std::move(J_minus_C), std::move(prev_exC));
 130   } else {
 131     XBT_DEBUG("No alternative detected with:\n"
 132               "C\t := %s \n"
 133               "D\t := %s \n"
 134               "A\t := %s \n",
 135               C.to_string().c_str(), D.to_string().c_str(), A.to_string().c_str());
 136   }
 137
 138   // D <-- D - {e}
 139   D.remove(e);
 140
 141   // Remove(e, C, D)
 142   clean_up_explore(e, C, D);
 143 }
 144
 145 EventSet UdporChecker::compute_exC(const Configuration& C, const State& stateC, const EventSet& prev_exC)
 146 {
 147   // See eqs. 5.7 of section 5.2 of [3]
 148   // C = C' + {e_cur}, i.e. C' = C - {e_cur}
 149   //
 150   // Then
 151   //
 152   // ex(C) = ex(C' + {e_cur}) = ex(C') / {e_cur} +
 153   //    U{<a, K> : K is maximal, `a` depends on all of K, `a` enabled at config(K) }
 154   const UnfoldingEvent* e_cur = C.get_latest_event();
 155   EventSet exC                = prev_exC;
 156   exC.remove(e_cur);
 157
 158   // IMPORTANT NOTE: In order to have deterministic results, we need to process
 159   // the actors in a deterministic manner so that events are discovered by
 160   // UDPOR in a deterministic order. The processing done here always processes
 161   // actors in a consistent order since `std::map` is by-default ordered using
 162   // `std::less<Key>` (see the return type of `State::get_actors_list()`)
 163   for (const auto& [aid, actor_state] : stateC.get_actors_list()) {
 164     for (const auto& transition : actor_state.get_enabled_transitions()) {
 165       XBT_DEBUG("\t Considering partial extension for %s", transition->to_string().c_str());
 166       EventSet extension = ExtensionSetCalculator::partially_extend(C, &unfolding, transition);
 167       exC.form_union(extension);
 168     }
 169   }
 170   return exC;
 171 }
 172
 173 EventSet UdporChecker::compute_enC(const Configuration& C, const EventSet& exC) const
 174 {
 175   EventSet enC;
 176   for (const auto* e : exC) {
 177     if (C.is_compatible_with(e)) {
 178       enC.insert(e);
 179     }
 180   }
 181   return enC;
 182 }
 183
 184 void UdporChecker::move_to_stateCe(State* state, UnfoldingEvent* e)
 185 {
 186   const aid_t next_actor = e->get_transition()->aid_;
 187
 188   // TODO: Add the trace if possible for reporting a bug
 189   xbt_assert(next_actor >= 0, "\n\n****** INVARIANT VIOLATION ******\n"
 190                               "In reaching this execution path, UDPOR ensures that at least one\n"
 191                               "one transition of the state of an visited event is enabled, yet no\n"
 192                               "state was actually enabled. Please report this as a bug.\n"
 193                               "*********************************\n\n");
 194   auto latest_transition_by_next_actor = state->execute_next(next_actor, get_remote_app());
 195
 196   // The transition that is associated with the event was just
 197   // executed, so it's possible that the new version of the transition
 198   // (i.e. the one after execution) has *more* information than
 199   // that which existed *prior* to execution.
 200   //
 201   //
 202   // ------- !!!!! UDPOR INVARIANT !!!!! -------
 203   //
 204   // At this point, we are leveraging the fact that
 205   // UDPOR will not contain more than one copy of any
 206   // transition executed by any actor for any
 207   // particular step taken by that actor. That is,
 208   // if transition `i` of the `j`th actor is contained in the
 209   // configuration `C` currently under consideration
 210   // by UDPOR, then only one and only one copy exists in `C`
 211   //
 212   // This means that we can referesh the transitions associated
 213   // with each event lazily, i.e. only after we have chosen the
 214   // event to continue our execution.
 215   e->set_transition(std::move(latest_transition_by_next_actor));
 216 }
 217
 218 void UdporChecker::restore_program_state_with_current_stack()
 219 {
 220   XBT_DEBUG("Restoring state using the current stack");
 221   get_remote_app().restore_initial_state();
 222
 223   /* Traverse the stack from the state at position start and re-execute the transitions */
 224   for (const std::unique_ptr<State>& state : state_stack) {
 225     if (state == state_stack.back()) /* If we are arrived on the target state, don't replay the outgoing transition */
 226       break;
 227     state->get_transition_out()->replay(get_remote_app());
 228   }
 229 }
 230
 231 std::unique_ptr<State> UdporChecker::record_current_state()
 232 {
 233   auto next_state = this->get_current_state();
 234
 235   // In UDPOR, we care about all enabled transitions in a given state
 236   next_state->consider_all();
 237
 238   return next_state;
 239 }
 240
 241 UnfoldingEvent* UdporChecker::select_next_unfolding_event(const EventSet& A, const EventSet& enC)
 242 {
 243   if (enC.empty()) {
 244     throw std::invalid_argument("There are no unfolding events to select. "
 245                                 "Are you sure that you checked that en(C) was not "
 246                                 "empty before attempting to select an event from it?");
 247   }
 248
 249   // UDPOR's exploration is non-deterministic (as is DPOR's)
 250   // in the sense that at any given point there may
 251   // be multiple paths that can be followed. The correctness and optimality
 252   // of the algorithm remains unaffected by the route taken by UDPOR when
 253   // given multiple choices; but to ensure that SimGrid itself has deterministic
 254   // behavior on all platforms, we always pick events with lower id's
 255   // to ensure we explore the unfolding deterministically.
 256   if (A.empty()) {
 257     const auto min_event = std::min_element(enC.begin(), enC.end(),
 258                                             [](const auto e1, const auto e2) { return e1->get_id() < e2->get_id(); });
 259     return const_cast<UnfoldingEvent*>(*min_event);
 260   } else {
 261     const auto intersection = A.make_intersection(enC);
 262     const auto min_event    = std::min_element(intersection.begin(), intersection.end(),
 263                                                [](const auto e1, const auto e2) { return e1->get_id() < e2->get_id(); });
 264     return const_cast<UnfoldingEvent*>(*min_event);
 265   }
 266 }
 267
 268 void UdporChecker::clean_up_explore(const UnfoldingEvent* e, const Configuration& C, const EventSet& D)
 269 {
 270   // The "clean-up set" conceptually represents
 271   // those events which will no longer be considered
 272   // by UDPOR during its exploration. The concept is
 273   // introduced to avoid modification during iteration
 274   // over the current unfolding to determine who needs to
 275   // be removed. Since sets are unordered, it's quite possible
 276   // that e.g. two events `e` and `e'` such that `e < e'`
 277   // which are determined eligible for removal are removed
 278   // in the order `e` and then `e'`. Determining that `e'`
 279   // needs to be removed requires that its history be in
 280   // tact to e.g. compute the conflicts with the event.
 281   //
 282   // Thus, we compute the set and remove all of the events
 283   // at once in lieu of removing events while iterating over them.
 284   // We can hypothesize that processing the events in reverse
 285   // topological order would prevent any issues concerning
 286   // the order in which are processed
 287   EventSet clean_up_set;
 288
 289   // Q_(C, D, U) = C u D u U (complicated expression)
 290   // See page 9 of "Unfolding-based Partial Order Reduction"
 291
 292   // "C u D" portion
 293   const EventSet C_union_D = C.get_events().make_union(D);
 294
 295   // "U (complicated expression)" portion
 296   const EventSet conflict_union = std::accumulate(
 297       C_union_D.begin(), C_union_D.end(), EventSet(), [&](const EventSet acc, const UnfoldingEvent* e_prime) {
 298         return acc.make_union(unfolding.get_immediate_conflicts_of(e_prime));
 299       });
 300
 301   const EventSet Q_CDU = C_union_D.make_union(conflict_union.get_local_config());
 302
 303   XBT_DEBUG("Computed Q_CDU as '%s'", Q_CDU.to_string().c_str());
 304
 305   // Move {e} \ Q_CDU from U to G
 306   if (not Q_CDU.contains(e)) {
 307     XBT_DEBUG("Moving %s from U to G...", e->to_string().c_str());
 308     clean_up_set.insert(e);
 309   }
 310
 311   // foreach ê in #ⁱ_U(e)
 312   for (const auto* e_hat : this->unfolding.get_immediate_conflicts_of(e)) {
 313     // Move [ê] \ Q_CDU from U to G
 314     const EventSet to_remove = e_hat->get_local_config().subtracting(Q_CDU);
 315     XBT_DEBUG("Moving {%s} from U to G...", to_remove.to_string().c_str());
 316     clean_up_set.form_union(to_remove);
 317   }
 318
 319   // TODO: We still perhaps need to
 320   // figure out how to deal with the fact that the previous
 321   // extension sets computed for past configurations
 322   // contain events that may be removed from `U`. Perhaps
 323   // it would be best to keep them around forever (they
 324   // are moved to `G` after all and can be discarded at will,
 325   // which means they may never have to be removed at all).
 326   //
 327   // Of course, the benefit of moving them into the set `G`
 328   // is that the computation for immediate conflicts becomes
 329   // more efficient (we have to search all of `U` for such conflicts,
 330   // and there would be no reason to search those events
 331   // that UDPOR has marked as no longer being important)
 332   // For now, there appear to be no "obvious" issues (although
 333   // UDPOR's behavior is often far from obvious...)
 334   this->unfolding.mark_finished(clean_up_set);
 335 }
 336
 337 RecordTrace UdporChecker::get_record_trace()
 338 {
 339   RecordTrace res;
 340   for (auto const& state : state_stack)
 341     res.push_back(state->get_transition_out().get());
 342   return res;
 343 }
 344
 345 } // namespace simgrid::mc::udpor
 346
 347 namespace simgrid::mc {
 348
 349 Exploration* create_udpor_checker(const std::vector<char*>& args)
 350 {
 351   return new simgrid::mc::udpor::UdporChecker(args);
 352 }
 353
 354 } // namespace simgrid::mc