1 /* Copyright (c) 2013-2021. The SimGrid Team. All rights reserved. */
3 /* This program is free software; you can redistribute it and/or modify it
4 * under the terms of the license (GNU LGPL) which comes with this package. */
7 #include "src/kernel/resource/profile/Event.hpp"
8 #include "src/kernel/resource/profile/Profile.hpp"
9 #include "src/surf/surf_interface.hpp"
10 #include "surf/surf.hpp"
/* Tolerance used by CpuTiTmgr::integrate() and CpuTiTmgr::solve() below to treat tiny differences as zero. */
15 constexpr double EPSILON = 0.000000001;
/* Logging sub-category "cpu_ti" (child of "cpu") used by the XBT_DEBUG/XBT_VERB/XBT_CRITICAL calls in this file. */
17 XBT_LOG_NEW_DEFAULT_SUBCATEGORY(cpu_ti, cpu, "CPU resource, Trace Integration model");
/**
 * Builds the two parallel lookup tables of an integrated profile. For every event of @p profile the current
 * (time, integral) pair is appended to time_points_ / integral_, then one closing pair is appended after the
 * loop, so both tables end up with event_list.size() + 1 entries.
 * @param profile Profile whose event_list is walked; each event adds date_ * value_ to the running integral
 *                (date_ is presumably the duration of the event rather than an absolute date -- TODO confirm).
 */
27 CpuTiProfile::CpuTiProfile(const profile::Profile* profile)
/* one slot per event plus the closing point pushed after the loop */
31 unsigned nb_points = profile->event_list.size() + 1;
32 time_points_.reserve(nb_points);
33 integral_.reserve(nb_points);
34 for (auto const& val : profile->event_list) {
/* record the state reached *before* this event is accounted for */
35 time_points_.push_back(time);
36 integral_.push_back(integral);
38 integral += val.date_ * val.value_;
/* closing point: end of the last event */
40 time_points_.push_back(time);
41 integral_.push_back(integral);
45 * @brief Integrate trace
47 * Wrapper around surf_cpu_integrate_trace_simple() to get
50 * @param a Begin of interval
51 * @param b End of interval
52 * @return the integrated value. An invalid interval (a < 0 or a > b) aborts through xbt_die().
/**
 * Integrates the speed trace over [a, b].
 *  - a < 0 or a > b aborts through xbt_die().
 *  - A FIXED trace yields (b - a) * value_.
 *  - Otherwise the interval is cut at multiples of last_time_ (the trace period): a partial first chunk,
 *    a number of whole periods each worth total_, and a partial last chunk.
 */
54 double CpuTiTmgr::integrate(double a, double b) const
56 if ((a < 0.0) || (a > b)) {
57 xbt_die("Error, invalid integration interval [%.2f,%.2f]. "
58 "You probably have a task executing with negative computation amount. Check your code.", a, b);
/* (nearly) empty interval is special-cased; NOTE(review): the taken branch is not visible here, presumably returns 0 */
60 if (fabs(a - b) < EPSILON)
63 if (type_ == Type::FIXED) {
64 return (b - a) * value_;
/* a_index: index of the first period boundary strictly after a (bumped by one when a sits on a boundary) */
68 if (fabs(ceil(a / last_time_) - a / last_time_) < EPSILON)
69 a_index = 1 + ceil(a / last_time_);
71 a_index = ceil(a / last_time_);
/* b_index: index of the last period boundary at or before b */
72 double b_index = floor(b / last_time_);
74 if (a_index > b_index) { /* Same chunk */
75 return profile_->integrate_simple(a - (a_index - 1) * last_time_, b - b_index * last_time_);
/* from a (folded into its period) to the end of that period */
78 double first_chunk = profile_->integrate_simple(a - (a_index - 1) * last_time_, last_time_);
/* whole periods lying between the two boundaries */
79 double middle_chunk = (b_index - a_index) * total_;
/* from the start of b's period to b */
80 double last_chunk = profile_->integrate_simple(0.0, b - b_index * last_time_);
82 XBT_DEBUG("first_chunk=%.2f middle_chunk=%.2f last_chunk=%.2f\n", first_chunk, middle_chunk, last_chunk);
84 return (first_chunk + middle_chunk + last_chunk);
88 * @brief Auxiliary function to compute the integral between a and b.
89 * It simply computes the integrals at point a and b and returns the difference between them.
90 * @param a Initial point
91 * @param b Final point
93 double CpuTiProfile::integrate_simple(double a, double b) const
/* integral over [a, b] = F(b) - F(a), F being the cumulative integral given by integrate_simple_point() */
95 return integrate_simple_point(b) - integrate_simple_point(a);
99 * @brief Auxiliary function to compute the integral at point a.
/**
 * Cumulative integral of the profile from its origin up to @p a: the tabulated integral at the last time
 * point not after a, plus a linear interpolation inside the segment that contains a.
 */
102 double CpuTiProfile::integrate_simple_point(double a) const
/* index of the last tabulated time point that is <= a */
106 int ind = binary_search(time_points_, a);
107 integral += integral_[ind];
/* NOTE(review): integral_[ind + 1] / time_points_[ind + 1] are read here; verify ind can never be the last index */
109 XBT_DEBUG("a %f ind %d integral %f ind + 1 %f ind %f time +1 %f time %f", a, ind, integral, integral_[ind + 1],
110 integral_[ind], time_points_[ind + 1], time_points_[ind]);
/* a_aux is adjusted against the tabulated time with the surf precision (exact semantics of double_update()
 * are defined elsewhere -- TODO confirm); the line below then adds slope * (a - time_points_[ind]) */
111 double_update(&a_aux, time_points_[ind], sg_maxmin_precision * sg_surf_precision);
114 ((integral_[ind + 1] - integral_[ind]) / (time_points_[ind + 1] - time_points_[ind])) * (a - time_points_[ind]);
115 XBT_DEBUG("Integral a %f = %f", a, integral);
121 * @brief Computes the time needed to execute "amount" on cpu.
123 * Here, amount can span multiple trace periods
125 * @param a Initial time
126 * @param amount Amount to be executed
/**
 * Returns the date at which `amount` of work started at date `a` is completed.
 *  - a / amount lying in (-EPSILON, 0) are special-cased first; any remaining negative value is reported
 *    with XBT_CRITICAL.
 *  - amount < EPSILON is special-cased (the taken branch is not visible here).
 *  - FIXED trace: a + amount / value_.
 *  - Otherwise the problem is reduced to a single period: `quotient` whole periods are set aside, the
 *    remainder is solved from `reduced_a` (a folded into its period), and the result is mapped back.
 */
129 double CpuTiTmgr::solve(double a, double amount) const
131 /* Fix very small negative numbers */
132 if ((a < 0.0) && (a > -EPSILON)) {
135 if ((amount < 0.0) && (amount > -EPSILON)) {
140 if ((a < 0.0) || (amount < 0.0)) {
141 XBT_CRITICAL ("Error, invalid parameters [a = %.2f, amount = %.2f]. "
142 "You probably have a task executing with negative computation amount. Check your code.", a, amount);
146 /* At this point, a and amount are positive */
147 if (amount < EPSILON)
150 /* Is the trace fixed ? */
151 if (type_ == Type::FIXED) {
152 return (a + (amount / value_));
155 XBT_DEBUG("amount %f total %f", amount, total_);
156 /* Reduce the problem to one where amount <= trace_total */
157 double quotient = floor(amount / total_);
/* fractional part of amount / total_, scaled back to an amount */
158 double reduced_amount = (total_) * ((amount / total_) - floor(amount / total_));
/* NOTE(review): the period count is truncated to int here but kept as double on the final return line;
 * for a / last_time_ beyond INT_MAX the two would disagree -- confirm whether the cast is needed */
159 double reduced_a = a - (last_time_) * static_cast<int>(floor(a / last_time_));
161 XBT_DEBUG("Quotient: %g reduced_amount: %f reduced_a: %f", quotient, reduced_amount, reduced_a);
163 /* Now solve for new_amount which is <= trace_total */
165 XBT_DEBUG("Solve integral: [%.2f, amount=%.2f]", reduced_a, reduced_amount);
/* work available between reduced_a and the end of the current period */
166 double amount_till_end = integrate(reduced_a, last_time_);
/* enough work left in this period: solve inside it; otherwise spill the rest into the next period */
168 if (amount_till_end > reduced_amount) {
169 reduced_b = profile_->solve_simple(reduced_a, reduced_amount);
171 reduced_b = last_time_ + profile_->solve_simple(0.0, reduced_amount - amount_till_end);
174 /* Re-map to the original b and amount */
175 return last_time_ * floor(a / last_time_) + (quotient * last_time_) + reduced_b;
179 * @brief Auxiliary function to solve integral.
180 * It returns the date when the requested amount of flops is available
181 * @param a Initial point
182 * @param amount Amount of flops
183 * @return The date when amount is available.
185 double CpuTiProfile::solve_simple(double a, double amount) const
/* cumulative integral already reached at a; the target is integral_a + amount */
187 double integral_a = integrate_simple_point(a);
/* segment of the integral table in which the target value falls */
188 int ind = binary_search(integral_, integral_a + amount);
189 double time = time_points_[ind];
/* invert the linear interpolation: missing amount divided by the slope of segment [ind, ind + 1] */
190 time += (integral_a + amount - integral_[ind]) /
191 ((integral_[ind + 1] - integral_[ind]) / (time_points_[ind + 1] - time_points_[ind]));
197 * @brief Auxiliary function to update the CPU speed scale.
199 * This function uses the trace structure to return the speed scale at the determined time a.
201 * @return CPU speed scale
203 double CpuTiTmgr::get_power_scale(double a) const
/* fold a into a single period of length last_time_ */
205 double reduced_a = a - floor(a / last_time_) * last_time_;
/* index of the last tabulated time point <= reduced_a */
206 int point = CpuTiProfile::binary_search(profile_->time_points_, reduced_a);
/* the event at the same index in the raw profile is the one active at that time (copied by value) */
207 kernel::profile::DatedValue val = speed_profile_->event_list.at(point);
212 * @brief Creates a new integration trace from a speed profile
214 * @param speed_profile CPU availability profile (may be null, in which case the trace is constant)
215 * @param value Percentage of CPU speed available (used when the trace is constant)
216 * @return Integration trace structure
/**
 * Three cases are distinguished on @p speed_profile:
 *  - null: no availability trace, the manager describes a constant @p value;
 *  - exactly one event: constant trace whose value_ is that event's value_;
 *  - otherwise: DYNAMIC trace; last_time_ is the sum of all event date_ fields (the period), profile_ holds
 *    the integrated tables and total_ is the integral over one whole period.
 */
218 CpuTiTmgr::CpuTiTmgr(kernel::profile::Profile* speed_profile, double value) : speed_profile_(speed_profile)
220 double total_time = 0.0;
221 profile_.reset(nullptr);
223 /* no availability file, fixed trace */
224 if (not speed_profile) {
226 XBT_DEBUG("No availability trace. Constant value = %f", value);
230 /* only one point available, fixed trace */
231 if (speed_profile->event_list.size() == 1) {
232 value_ = speed_profile->event_list.front().value_;
236 type_ = Type::DYNAMIC;
238 /* count the total time of trace file */
239 for (auto const& val : speed_profile->event_list)
240 total_time += val.date_;
242 profile_ = std::make_unique<CpuTiProfile>(speed_profile);
243 last_time_ = total_time;
/* integral over one full period, reused by integrate() and solve() for whole periods */
244 total_ = profile_->integrate_simple(0, total_time);
246 XBT_DEBUG("Total integral %f, last_time %f ", total_, last_time_);
250 * @brief Binary search in array.
251 * It returns the last point of the interval in which "a" is.
253 * @param a Value to search
254 * @return Index of point
256 int CpuTiProfile::binary_search(const std::vector<double>& array, double a)
/* std::upper_bound requires `array` to be sorted ascending; it yields the first element > a, so stepping
 * back by one gives the index of the last element <= a */
260 auto pos = std::upper_bound(begin(array), end(array), a);
261 return std::distance(begin(array), pos) - 1;
/** Allocates the two global CPU models (surf_cpu_model_pm and surf_cpu_model_vm) after asserting that neither exists yet. */
268 void CpuTiModel::create_pm_vm_models()
270 xbt_assert(surf_cpu_model_pm == nullptr, "CPU model already initialized. This should not happen.");
271 xbt_assert(surf_cpu_model_vm == nullptr, "CPU model already initialized. This should not happen.");
/* two distinct CpuTiModel instances: each one has its own action heap and modified-CPU list */
273 surf_cpu_model_pm = new CpuTiModel();
274 surf_cpu_model_vm = new CpuTiModel();
/** Creates a model using the FULL update algorithm and registers it in the global all_existing_models list. */
277 CpuTiModel::CpuTiModel() : CpuModel(Model::UpdateAlgo::FULL)
279 all_existing_models.push_back(this);
/**
 * Clears the global surf_cpu_model_pm pointer.
 * NOTE(review): create_pm_vm_models() allocates two instances, yet destroying either one resets the pm
 * pointer and nothing visible here resets surf_cpu_model_vm -- confirm this is intended.
 */
282 CpuTiModel::~CpuTiModel()
284 surf_cpu_model_pm = nullptr;
/** Allocates a CpuTi attached to this model; the caller receives a raw pointer to the new object. */
287 Cpu* CpuTiModel::create_cpu(s4u::Host* host, const std::vector<double>& speed_per_pstate, int core)
289 return new CpuTi(this, host, speed_per_pstate, core);
/**
 * Refreshes the finish time of the actions of every CPU flagged as modified, then returns the delay between
 * @p now and the earliest date in the action heap.
 * @return that delay, or -1 when the action heap is empty.
 */
292 double CpuTiModel::next_occurring_event(double now)
294 double min_action_duration = -1;
296 /* iterates over modified cpus to update share resources */
297 for (auto it = std::begin(modified_cpus_); it != std::end(modified_cpus_);) {
299 ++it; // increment iterator here since the following call to ti.update_actions_finish_time() may invalidate it
300 cpu.update_actions_finish_time(now);
303 /* get the min next event if heap not empty */
304 if (not get_action_heap().empty())
305 min_action_duration = get_action_heap().top_date() - now;
307 XBT_DEBUG("Share resources, min next event date: %f", min_action_duration);
309 return min_action_duration;
/**
 * Pops from the action heap every action whose date equals @p now (within sg_surf_precision), marks it
 * FINISHED, and brings the remaining amounts of its CPU up to date. The delta argument is unused.
 */
312 void CpuTiModel::update_actions_state(double now, double /*delta*/)
314 while (not get_action_heap().empty() && double_equals(get_action_heap().top_date(), now, sg_surf_precision)) {
315 auto* action = static_cast<CpuTiAction*>(get_action_heap().pop());
316 XBT_DEBUG("Action %p: finish", action);
317 action->finish(Action::State::FINISHED);
318 /* update remaining amount of all actions */
319 action->cpu_->update_remaining_amount(surf_get_clock());
/**
 * Creates a single-core CPU (asserted) whose peak speed is the first entry of @p speed_per_pstate and whose
 * integrated trace starts as a constant one (null profile, scale 1).
 */
326 CpuTi::CpuTi(CpuTiModel* model, s4u::Host* host, const std::vector<double>& speed_per_pstate, int core)
327 : Cpu(model, host, speed_per_pstate, core)
329 xbt_assert(core == 1, "Multi-core not handled by this model yet");
331 speed_.peak = speed_per_pstate.front();
332 XBT_DEBUG("CPU create: peak=%f", speed_.peak);
/* owned raw pointer: replaced in set_speed_profile() / apply_event(), each of which deletes the old one first */
334 speed_integrated_trace_ = new CpuTiTmgr(nullptr, 1 /*scale*/);
340 delete speed_integrated_trace_;
/**
 * Replaces the integrated trace of this CPU with one built from @p profile and the current speed_.scale.
 * When the profile has more than one event and its last event has a (near) zero date_, an extra event is
 * scheduled on a freshly allocated Profile and stored in speed_.event.
 */
343 void CpuTi::set_speed_profile(kernel::profile::Profile* profile)
345 delete speed_integrated_trace_;
346 speed_integrated_trace_ = new CpuTiTmgr(profile, speed_.scale);
348 /* add a fake trace event if periodicity == 0 */
349 if (profile && profile->event_list.size() > 1) {
350 kernel::profile::DatedValue val = profile->event_list.back();
351 if (val.date_ < 1e-12) {
/* NOTE(review): nothing visible here releases `prof`; confirm who owns it after schedule() */
352 auto* prof = new kernel::profile::Profile();
353 speed_.event = prof->schedule(&profile::future_evt_set, this);
/**
 * Reacts to a profile event bound to this CPU.
 *  - Speed event: actions are brought up to date, the integrated trace is replaced by a constant one built
 *    from @p value, speed_.scale takes that value and the event is released.
 *  - State event: the host is turned on or off (the condition choosing between the two is not visible
 *    here); on turn-off every INITED / STARTED / IGNORED action gets the current date as finish time, is
 *    marked FAILED and is removed from the action heap. The event is then released.
 *  - Any other event aborts through xbt_die().
 */
358 void CpuTi::apply_event(kernel::profile::Event* event, double value)
360 if (event == speed_.event) {
361 XBT_DEBUG("Speed changed in trace! New fixed value: %f", value);
363 /* update remaining of actions and put in modified cpu list */
364 update_remaining_amount(surf_get_clock());
/* from now on the speed is constant: swap the integrated trace for a fixed one */
368 delete speed_integrated_trace_;
369 speed_integrated_trace_ = new CpuTiTmgr(value);
371 speed_.scale = value;
372 tmgr_trace_event_unref(&speed_.event);
374 } else if (event == state_event_) {
377 XBT_VERB("Restart actors on host %s", get_host()->get_cname());
378 get_host()->turn_on();
381 get_host()->turn_off();
382 double date = surf_get_clock();
384 /* put all action running on cpu to failed */
385 for (CpuTiAction& action : action_set_) {
386 if (action.get_state() == Action::State::INITED || action.get_state() == Action::State::STARTED ||
387 action.get_state() == Action::State::IGNORED) {
388 action.set_finish_time(date);
389 action.set_state(Action::State::FAILED);
390 get_model()->get_action_heap().remove(&action);
394 tmgr_trace_event_unref(&state_event_);
397 xbt_die("Unknown event!\n");
401 /** Update the actions that are running on this CPU (which was modified recently) */
/*
 * Two passes over action_set_:
 *  1. accumulate sum_priority_ as the sum of 1 / sharing_penalty over the started, running actions that
 *     have a positive penalty;
 *  2. for each started action, compute its finish time through the integrated trace and (re)insert it in
 *     the action heap at min(finish time, start + max_duration), or remove it from the heap when neither
 *     applies.
 * NOTE(review): both passes test membership against surf_cpu_model_pm->get_started_action_set(), while
 * update_remaining_amount() tests against get_model()->get_started_action_set(). For a CPU owned by the
 * other model created in create_pm_vm_models() the two differ -- this looks like it should be get_model();
 * confirm.
 */
402 void CpuTi::update_actions_finish_time(double now)
404 /* update remaining amount of actions */
405 update_remaining_amount(now);
407 /* Compute the sum of priorities for the actions running on that CPU */
409 for (CpuTiAction const& action : action_set_) {
410 /* action not running, skip it */
411 if (action.get_state_set() != surf_cpu_model_pm->get_started_action_set())
414 /* bogus priority, skip it */
415 if (action.get_sharing_penalty() <= 0)
418 /* action suspended, skip it */
419 if (not action.is_running())
422 sum_priority_ += 1.0 / action.get_sharing_penalty();
425 for (CpuTiAction& action : action_set_) {
/* -1 doubles as "no date": it is compared against NO_MAX_DURATION further down */
426 double min_finish = -1;
427 /* action not running, skip it */
428 if (action.get_state_set() != surf_cpu_model_pm->get_started_action_set())
431 /* verify if the action is really running on cpu */
432 if (action.is_running() && action.get_sharing_penalty() > 0) {
433 /* total area needed to finish the action. Used in trace integration */
434 double total_area = (action.get_remains() * sum_priority_ * action.get_sharing_penalty()) / speed_.peak;
436 action.set_finish_time(speed_integrated_trace_->solve(now, total_area));
437 /* verify which event will happen before (max_duration or finish time) */
438 if (action.get_max_duration() != NO_MAX_DURATION &&
439 action.get_start_time() + action.get_max_duration() < action.get_finish_time())
440 min_finish = action.get_start_time() + action.get_max_duration();
442 min_finish = action.get_finish_time();
444 /* put the max duration time on heap */
445 if (action.get_max_duration() != NO_MAX_DURATION)
446 min_finish = action.get_start_time() + action.get_max_duration();
448 /* add in action heap */
449 if (min_finish != NO_MAX_DURATION)
450 get_model()->get_action_heap().update(&action, min_finish, ActionHeap::Type::unset);
452 get_model()->get_action_heap().remove(&action);
454 XBT_DEBUG("Update finish time: Cpu(%s) Action: %p, Start Time: %f Finish Time: %f Max duration %f", get_cname(),
455 &action, action.get_start_time(), action.get_finish_time(), action.get_max_duration());
457 /* remove from modified cpu */
/** A CPU counts as used as soon as action_set_ holds at least one action, whatever the state of that action. */
461 bool CpuTi::is_used() const
463 return not action_set_.empty();
/** Refreshes speed_.scale from the integrated trace at the current simulated clock, then defers to Cpu::get_speed_ratio(). */
466 double CpuTi::get_speed_ratio()
/* side effect: this getter overwrites speed_.scale on every call */
468 speed_.scale = speed_integrated_trace_->get_power_scale(surf_get_clock());
469 return Cpu::get_speed_ratio();
472 /** @brief Update the remaining amount of actions */
/*
 * Charges to every eligible action its share of the work delivered by the CPU between last_update_ and
 * `now`. The delivered work is the trace integral over that interval times the peak speed; an action's
 * share is that work divided by (sum_priority_ * its sharing penalty). Actions that are not started, have
 * a non-positive penalty, are suspended, start at or after `now`, or already finished are left untouched.
 * sum_priority_ is the value last computed by update_actions_finish_time().
 */
473 void CpuTi::update_remaining_amount(double now)
475 /* already up to date */
476 if (last_update_ >= now)
479 /* compute the integration area */
480 double area_total = speed_integrated_trace_->integrate(last_update_, now) * speed_.peak;
481 XBT_DEBUG("Flops total: %f, Last update %f", area_total, last_update_);
482 for (CpuTiAction& action : action_set_) {
483 /* action not running, skip it */
484 if (action.get_state_set() != get_model()->get_started_action_set())
487 /* bogus priority, skip it */
488 if (action.get_sharing_penalty() <= 0)
491 /* action suspended, skip it */
492 if (not action.is_running())
495 /* action does not need an update */
496 if (action.get_start_time() >= now)
499 /* skip actions that are finishing now */
500 if (action.get_finish_time() >= 0 && action.get_finish_time() <= now)
503 /* update remaining */
504 action.update_remains(area_total / (sum_priority_ * action.get_sharing_penalty()));
505 XBT_DEBUG("Update remaining action(%p) remaining %f", &action, action.get_remains_no_update());
/** Creates an execution action of cost @p size on this CPU and appends it to action_set_. */
510 CpuAction* CpuTi::execution_start(double size)
512 XBT_IN("(%s,%g)", get_cname(), size);
513 auto* action = new CpuTiAction(this, size);
515 action_set_.push_back(*action); // Actually start the action
/**
 * Models a sleep as an action of cost 1.0 flagged SLEEPING whose max duration is @p duration; with
 * NO_MAX_DURATION the action is additionally put in the IGNORED state. The action is appended to
 * action_set_.
 */
521 CpuAction* CpuTi::sleep(double duration)
/* the duration is raised to at least sg_surf_precision (any guard on this statement is not visible here) */
524 duration = std::max(duration, sg_surf_precision);
526 XBT_IN("(%s,%g)", get_cname(), duration);
527 auto* action = new CpuTiAction(this, 1.0);
529 action->set_max_duration(duration);
530 action->set_suspend_state(Action::SuspendStates::SLEEPING);
531 if (duration == NO_MAX_DURATION)
532 action->set_state(Action::State::IGNORED);
534 action_set_.push_back(*action);
/**
 * Adds this CPU to, or removes it from, the modified_cpus_ list of its model. Both operations are guarded
 * by cpu_ti_hook.is_linked(), so repeating a call is harmless. Presumably the insertion is the
 * `modified == true` branch -- the selecting condition is not visible here.
 */
540 void CpuTi::set_modified(bool modified)
/* get_model() returns the base type; the list lives in CpuTiModel */
542 CpuTiList& modified_cpus = static_cast<CpuTiModel*>(get_model())->modified_cpus_;
544 if (not cpu_ti_hook.is_linked()) {
545 modified_cpus.push_back(*this);
548 if (cpu_ti_hook.is_linked())
549 xbt::intrusive_erase(modified_cpus, *this);
/**
 * Creates an action of the given cost on @p cpu; the third CpuAction argument is true when the CPU is off.
 * The CPU is flagged as modified so that finish times get recomputed.
 */
557 CpuTiAction::CpuTiAction(CpuTi* cpu, double cost) : CpuAction(cpu->get_model(), cost, not cpu->is_on()), cpu_(cpu)
559 cpu_->set_modified(true);
/** Unlinks the action from its CPU's action_set_ (if linked) and from the action heap, then flags the CPU as modified. */
561 CpuTiAction::~CpuTiAction()
563 /* remove from action_set */
564 if (action_ti_hook.is_linked())
565 xbt::intrusive_erase(cpu_->action_set_, *this);
566 /* remove from heap */
567 get_model()->get_action_heap().remove(this);
568 cpu_->set_modified(true);
/** Delegates to CpuAction::set_state(), then flags the CPU as modified since the set of running actions may have changed. */
571 void CpuTiAction::set_state(Action::State state)
573 CpuAction::set_state(state);
574 cpu_->set_modified(true);
/** Cancels the action: it becomes FAILED, leaves the action heap, and its CPU is flagged as modified. */
577 void CpuTiAction::cancel()
579 this->set_state(Action::State::FAILED);
580 get_model()->get_action_heap().remove(this);
581 cpu_->set_modified(true);
/**
 * Marks the action SUSPENDED, removes it from the action heap and flags the CPU as modified.
 * (Any guard around these statements is not visible here.)
 */
584 void CpuTiAction::suspend()
586 XBT_IN("(%p)", this);
588 set_suspend_state(Action::SuspendStates::SUSPENDED);
589 get_model()->get_action_heap().remove(this);
590 cpu_->set_modified(true);
/** Puts a suspended action back to RUNNING and flags the CPU as modified; does nothing to an action that is not suspended. */
595 void CpuTiAction::resume()
597 XBT_IN("(%p)", this);
598 if (is_suspended()) {
599 set_suspend_state(Action::SuspendStates::RUNNING);
600 cpu_->set_modified(true);
/**
 * Stores the new max duration, then re-inserts the action in the heap at the earlier of
 * (start time + max duration) and the current finish time, or at the finish time alone (the condition
 * choosing between the two assignments is not visible here).
 */
605 void CpuTiAction::set_max_duration(double duration)
609 XBT_IN("(%p,%g)", this, duration);
611 Action::set_max_duration(duration);
614 min_finish = (get_start_time() + get_max_duration()) < get_finish_time() ? (get_start_time() + get_max_duration())
617 min_finish = get_finish_time();
619 /* add in action heap */
620 get_model()->get_action_heap().update(this, min_finish, ActionHeap::Type::unset);
/** Stores the new sharing penalty and flags the CPU as modified so that the shares are recomputed. */
625 void CpuTiAction::set_sharing_penalty(double sharing_penalty)
627 XBT_IN("(%p,%g)", this, sharing_penalty);
628 set_sharing_penalty_no_update(sharing_penalty);
629 cpu_->set_modified(true);
/** Brings the CPU's actions up to date at the current simulated clock before returning the remaining amount of this action. */
633 double CpuTiAction::get_remains()
635 XBT_IN("(%p)", this);
/* lazy update: remaining amounts are only refreshed on demand */
636 cpu_->update_remaining_amount(surf_get_clock());
638 return get_remains_no_update();
641 } // namespace resource
642 } // namespace kernel
643 } // namespace simgrid