// Copyright 2016 Ismael Jimenez Martinez. All rights reserved.
// Copyright 2017 Roman Lebedev. All rights reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include "benchmark/benchmark.h"

#include <algorithm>
#include <cmath>
#include <map>
#include <numeric>
#include <string>
#include <vector>

#include "check.h"
#include "statistics.h"

namespace benchmark {
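
// Returns the sum of all samples in the vector.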
auto StatisticsSum = [](const std::vector<double>& v) {
  return std::accumulate(v.begin(), v.end(), 0.0);
};
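
// Returns the arithmetic mean of the samples, or 0.0 for an empty vector.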
double StatisticsMean(const std::vector<double>& v) {
  if (v.empty()) return 0.0;
  return StatisticsSum(v) * (1.0 / v.size());
}
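
// Returns the median without fully sorting the samples: std::nth_element is
// used on a local copy. For an even number of samples the two middle values
// are averaged, e.g. {1, 2, 3, 4} yields 2.5. For fewer than three samples
// the mean is returned, which is identical to the median for one or two
// samples.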
double StatisticsMedian(const std::vector<double>& v) {
  if (v.size() < 3) return StatisticsMean(v);
  std::vector<double> copy(v);

  auto center = copy.begin() + v.size() / 2;
  std::nth_element(copy.begin(), center, copy.end());

  // Did we have an odd number of samples? If yes, then center is the median.
  // If no, then we are looking for the average between center and the value
  // before it.
  if (v.size() % 2 == 1) return *center;
  auto center2 = copy.begin() + v.size() / 2 - 1;
  std::nth_element(copy.begin(), center2, copy.end());
  return (*center + *center2) / 2.0;
}

// Return the sum of the squares of this sample set.
auto SumSquares = [](const std::vector<double>& v) {
  return std::inner_product(v.begin(), v.end(), v.begin(), 0.0);
};

auto Sqr = [](const double dat) { return dat * dat; };
auto Sqrt = [](const double dat) {
  // Avoid NaN due to imprecision in the calculations
  if (dat < 0.0) return 0.0;
  return std::sqrt(dat);
};
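
// Returns the sample standard deviation,
// sqrt(n / (n - 1) * (mean of squares - square of mean)),
// i.e. with Bessel's correction applied. Yields 0.0 for fewer than two
// samples, where a sample standard deviation is not defined.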
double StatisticsStdDev(const std::vector<double>& v) {
  const auto mean = StatisticsMean(v);
  if (v.empty()) return mean;

  // Sample standard deviation is undefined for n = 1
  if (v.size() == 1) return 0.0;

  const double avg_squares = SumSquares(v) * (1.0 / v.size());
  return Sqrt(v.size() / (v.size() - 1.0) * (avg_squares - Sqr(mean)));
}
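
// Computes one aggregate Run per registered statistic (typically mean, median
// and stddev) over the given repetitions of a single benchmark. Returns an
// empty vector when fewer than two repetitions completed without error, since
// there is nothing meaningful to aggregate in that case.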
std::vector<BenchmarkReporter::Run> ComputeStats(
    const std::vector<BenchmarkReporter::Run>& reports) {
  typedef BenchmarkReporter::Run Run;
  std::vector<Run> results;
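
  // Runs that ended with an error are not included in the aggregates.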
  auto error_count =
      std::count_if(reports.begin(), reports.end(),
                    [](Run const& run) { return run.error_occurred; });

  if (reports.size() - error_count < 2) {
    // We don't report aggregated data if fewer than two runs completed
    // without error.
    return results;
  }

  // Accumulators.
  std::vector<double> real_accumulated_time_stat;
  std::vector<double> cpu_accumulated_time_stat;

  real_accumulated_time_stat.reserve(reports.size());
  cpu_accumulated_time_stat.reserve(reports.size());

  // All repetitions should be run with the same number of iterations so we
  // can take this information from the first benchmark.
  int64_t const run_iterations = reports.front().iterations;
  // create stats for user counters
  struct CounterStat {
    Counter c;
    std::vector<double> s;
  };
  std::map<std::string, CounterStat> counter_stats;
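  // First pass: discover every user counter name and check that its flags
  // are consistent across all repetitions.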
  for (Run const& r : reports) {
    for (auto const& cnt : r.counters) {
      auto it = counter_stats.find(cnt.first);
      if (it == counter_stats.end()) {
        counter_stats.insert({cnt.first, {cnt.second, std::vector<double>{}}});
        it = counter_stats.find(cnt.first);
        it->second.s.reserve(reports.size());
      } else {
        CHECK_EQ(counter_stats[cnt.first].c.flags, cnt.second.flags);
      }
    }
  }

  // Populate the accumulators.
  for (Run const& run : reports) {
    CHECK_EQ(reports[0].benchmark_name(), run.benchmark_name());
    CHECK_EQ(run_iterations, run.iterations);
    if (run.error_occurred) continue;
    real_accumulated_time_stat.emplace_back(run.real_accumulated_time);
    cpu_accumulated_time_stat.emplace_back(run.cpu_accumulated_time);
    // user counters
    for (auto const& cnt : run.counters) {
      auto it = counter_stats.find(cnt.first);
      CHECK_NE(it, counter_stats.end());
      it->second.s.emplace_back(cnt.second);
    }
  }

  // Only add the label if it is the same for all runs.
  std::string report_label = reports[0].report_label;
  for (std::size_t i = 1; i < reports.size(); i++) {
    if (reports[i].report_label != report_label) {
      report_label = "";
      break;
    }
  }
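
  // When reporting, the aggregated times get divided by data.iterations (the
  // number of repetitions, set below) rather than by run_iterations, so they
  // are rescaled by this factor; see also the comment where it is applied.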
  const double iteration_rescale_factor =
      double(reports.size()) / double(run_iterations);

  for (const auto& Stat : *reports[0].statistics) {
    // Get the data from the accumulator to BenchmarkReporter::Run's.
    Run data;
    data.run_name = reports[0].benchmark_name();
    data.run_type = BenchmarkReporter::Run::RT_Aggregate;
    data.aggregate_name = Stat.name_;
    data.report_label = report_label;

    // It is incorrect to say that an aggregate is computed over
    // run's iterations, because those iterations already got averaged.
    // Similarly, if there are N repetitions with 1 iteration each,
    // an aggregate will be computed over N measurements, not 1.
    // Thus it is best to simply use the count of separate reports.
    data.iterations = reports.size();

    data.real_accumulated_time = Stat.compute_(real_accumulated_time_stat);
    data.cpu_accumulated_time = Stat.compute_(cpu_accumulated_time_stat);

    // We will divide these times by data.iterations when reporting, but
    // data.iterations is not necessarily the scale of these measurements,
    // because in each repetition these timers are summed over all of its
    // iterations. If we want to say that the stats are over N repetitions
    // and not M iterations, we need to multiply them by (N/M).
    data.real_accumulated_time *= iteration_rescale_factor;
    data.cpu_accumulated_time *= iteration_rescale_factor;

    data.time_unit = reports[0].time_unit;

    // user counters
    for (auto const& kv : counter_stats) {
      // Do *NOT* rescale the custom counters. They are already properly
      // scaled.
      const auto uc_stat = Stat.compute_(kv.second.s);
      auto c = Counter(uc_stat, counter_stats[kv.first].c.flags,
                       counter_stats[kv.first].c.oneK);
      data.counters[kv.first] = c;
    }

    results.push_back(data);
  }

  return results;
}

}  // end namespace benchmark