vendor/criterion/src/routine.rs

   1 use crate::benchmark::BenchmarkConfig;
   2 use crate::connection::OutgoingMessage;
   3 use crate::measurement::Measurement;
   4 use crate::report::{BenchmarkId, Report, ReportContext};
   5 use crate::{black_box, ActualSamplingMode, Bencher, Criterion};
   6 use std::marker::PhantomData;
   7 use std::time::Duration;
   8
   9 /// PRIVATE
  10 pub(crate) trait Routine<M: Measurement, T: ?Sized> {
  11     /// PRIVATE
  12     fn bench(&mut self, m: &M, iters: &[u64], parameter: &T) -> Vec<f64>;
  13     /// PRIVATE
  14     fn warm_up(&mut self, m: &M, how_long: Duration, parameter: &T) -> (u64, u64);
  15
  16     /// PRIVATE
  17     fn test(&mut self, m: &M, parameter: &T) {
  18         self.bench(m, &[1u64], parameter);
  19     }
  20
  21     /// Iterates the benchmarked function for a fixed length of time, but takes no measurements.
  22     /// This keeps the overall benchmark suite runtime constant-ish even when running under a
  23     /// profiler with an unknown amount of overhead. Since no measurements are taken, it also
  24     /// reduces the amount of time the execution spends in Criterion.rs code, which should help
  25     /// show the performance of the benchmarked code more clearly as well.
  26     fn profile(
  27         &mut self,
  28         measurement: &M,
  29         id: &BenchmarkId,
  30         criterion: &Criterion<M>,
  31         report_context: &ReportContext,
  32         time: Duration,
  33         parameter: &T,
  34     ) {
  35         criterion
  36             .report
  37             .profile(id, report_context, time.as_nanos() as f64);
  38
  39         let mut profile_path = report_context.output_directory.clone();
  40         if (*crate::CARGO_CRITERION_CONNECTION).is_some() {
  41             // If connected to cargo-criterion, generate a cargo-criterion-style path.
  42             // This is kind of a hack.
  43             profile_path.push("profile");
  44             profile_path.push(id.as_directory_name());
  45         } else {
  46             profile_path.push(id.as_directory_name());
  47             profile_path.push("profile");
  48         }
  49         criterion
  50             .profiler
  51             .borrow_mut()
  52             .start_profiling(id.id(), &profile_path);
  53
  54         let time = time.as_nanos() as u64;
  55
  56         // TODO: Some profilers will show the two batches of iterations as
  57         // being different code-paths even though they aren't really.
  58
  59         // Get the warmup time for one second
  60         let (wu_elapsed, wu_iters) = self.warm_up(measurement, Duration::from_secs(1), parameter);
  61         if wu_elapsed < time {
  62             // Initial guess for the mean execution time
  63             let met = wu_elapsed as f64 / wu_iters as f64;
  64
  65             // Guess how many iterations will be required for the remaining time
  66             let remaining = (time - wu_elapsed) as f64;
  67
  68             let iters = remaining / met;
  69             let iters = iters as u64;
  70
  71             self.bench(measurement, &[iters], parameter);
  72         }
  73
  74         criterion
  75             .profiler
  76             .borrow_mut()
  77             .stop_profiling(id.id(), &profile_path);
  78
  79         criterion.report.terminated(id, report_context);
  80     }
  81
  82     fn sample(
  83         &mut self,
  84         measurement: &M,
  85         id: &BenchmarkId,
  86         config: &BenchmarkConfig,
  87         criterion: &Criterion<M>,
  88         report_context: &ReportContext,
  89         parameter: &T,
  90     ) -> (ActualSamplingMode, Box<[f64]>, Box<[f64]>) {
  91         if config.quick_mode {
  92             let minimum_bench_duration = Duration::from_millis(100);
  93             let maximum_bench_duration = config.measurement_time; // default: 5 seconds
  94             let target_rel_stdev = config.significance_level; // default: 5%, 0.05
  95
  96             use std::time::Instant;
  97             let time_start = Instant::now();
  98
  99             let sq = |val| val * val;
 100             let mut n = 1;
 101             let mut t_prev = *self.bench(measurement, &[n], parameter).first().unwrap();
 102
 103             // Early exit for extremely long running benchmarks:
 104             if time_start.elapsed() > maximum_bench_duration {
 105                 let iters = vec![n as f64, n as f64].into_boxed_slice();
 106                 // prevent gnuplot bug when all values are equal
 107                 let elapsed = vec![t_prev, t_prev + 0.000001].into_boxed_slice();
 108                 return (ActualSamplingMode::Flat, iters, elapsed);
 109             }
 110
 111             // Main data collection loop.
 112             loop {
 113                 let t_now = *self
 114                     .bench(measurement, &[n * 2], parameter)
 115                     .first()
 116                     .unwrap();
 117                 let t = (t_prev + 2. * t_now) / 5.;
 118                 let stdev = (sq(t_prev - t) + sq(t_now - 2. * t)).sqrt();
 119                 // println!("Sample: {} {:.2}", n, stdev / t);
 120                 let elapsed = time_start.elapsed();
 121                 if (stdev < target_rel_stdev * t && elapsed > minimum_bench_duration)
 122                     || elapsed > maximum_bench_duration
 123                 {
 124                     let iters = vec![n as f64, (n * 2) as f64].into_boxed_slice();
 125                     let elapsed = vec![t_prev, t_now].into_boxed_slice();
 126                     return (ActualSamplingMode::Linear, iters, elapsed);
 127                 }
 128                 n *= 2;
 129                 t_prev = t_now;
 130             }
 131         }
 132         let wu = config.warm_up_time;
 133         let m_ns = config.measurement_time.as_nanos();
 134
 135         criterion
 136             .report
 137             .warmup(id, report_context, wu.as_nanos() as f64);
 138
 139         if let Some(conn) = &criterion.connection {
 140             conn.send(&OutgoingMessage::Warmup {
 141                 id: id.into(),
 142                 nanos: wu.as_nanos() as f64,
 143             })
 144             .unwrap();
 145         }
 146
 147         let (wu_elapsed, wu_iters) = self.warm_up(measurement, wu, parameter);
 148         if crate::debug_enabled() {
 149             println!(
 150                 "\nCompleted {} iterations in {} nanoseconds, estimated execution time is {} ns",
 151                 wu_iters,
 152                 wu_elapsed,
 153                 wu_elapsed as f64 / wu_iters as f64
 154             );
 155         }
 156
 157         // Initial guess for the mean execution time
 158         let met = wu_elapsed as f64 / wu_iters as f64;
 159
 160         let n = config.sample_size as u64;
 161
 162         let actual_sampling_mode = config
 163             .sampling_mode
 164             .choose_sampling_mode(met, n, m_ns as f64);
 165
 166         let m_iters = actual_sampling_mode.iteration_counts(met, n, &config.measurement_time);
 167
 168         let expected_ns = m_iters
 169             .iter()
 170             .copied()
 171             .map(|count| count as f64 * met)
 172             .sum();
 173
 174         // Use saturating_add to handle overflow.
 175         let mut total_iters = 0u64;
 176         for count in m_iters.iter().copied() {
 177             total_iters = total_iters.saturating_add(count);
 178         }
 179
 180         criterion
 181             .report
 182             .measurement_start(id, report_context, n, expected_ns, total_iters);
 183
 184         if let Some(conn) = &criterion.connection {
 185             conn.send(&OutgoingMessage::MeasurementStart {
 186                 id: id.into(),
 187                 sample_count: n,
 188                 estimate_ns: expected_ns,
 189                 iter_count: total_iters,
 190             })
 191             .unwrap();
 192         }
 193
 194         let m_elapsed = self.bench(measurement, &m_iters, parameter);
 195
 196         let m_iters_f: Vec<f64> = m_iters.iter().map(|&x| x as f64).collect();
 197
 198         (
 199             actual_sampling_mode,
 200             m_iters_f.into_boxed_slice(),
 201             m_elapsed.into_boxed_slice(),
 202         )
 203     }
 204 }
 205
 206 pub struct Function<M: Measurement, F, T>
 207 where
 208     F: FnMut(&mut Bencher<'_, M>, &T),
 209     T: ?Sized,
 210 {
 211     f: F,
 212     // TODO: Is there some way to remove these?
 213     _phantom: PhantomData<T>,
 214     _phamtom2: PhantomData<M>,
 215 }
 216 impl<M: Measurement, F, T> Function<M, F, T>
 217 where
 218     F: FnMut(&mut Bencher<'_, M>, &T),
 219     T: ?Sized,
 220 {
 221     pub fn new(f: F) -> Function<M, F, T> {
 222         Function {
 223             f,
 224             _phantom: PhantomData,
 225             _phamtom2: PhantomData,
 226         }
 227     }
 228 }
 229
 230 impl<M: Measurement, F, T> Routine<M, T> for Function<M, F, T>
 231 where
 232     F: FnMut(&mut Bencher<'_, M>, &T),
 233     T: ?Sized,
 234 {
 235     fn bench(&mut self, m: &M, iters: &[u64], parameter: &T) -> Vec<f64> {
 236         let f = &mut self.f;
 237
 238         let mut b = Bencher {
 239             iterated: false,
 240             iters: 0,
 241             value: m.zero(),
 242             measurement: m,
 243             elapsed_time: Duration::from_millis(0),
 244         };
 245
 246         iters
 247             .iter()
 248             .map(|iters| {
 249                 b.iters = *iters;
 250                 (*f)(&mut b, black_box(parameter));
 251                 b.assert_iterated();
 252                 m.to_f64(&b.value)
 253             })
 254             .collect()
 255     }
 256
 257     fn warm_up(&mut self, m: &M, how_long: Duration, parameter: &T) -> (u64, u64) {
 258         let f = &mut self.f;
 259         let mut b = Bencher {
 260             iterated: false,
 261             iters: 1,
 262             value: m.zero(),
 263             measurement: m,
 264             elapsed_time: Duration::from_millis(0),
 265         };
 266
 267         let mut total_iters = 0;
 268         let mut elapsed_time = Duration::from_millis(0);
 269         loop {
 270             (*f)(&mut b, black_box(parameter));
 271
 272             b.assert_iterated();
 273
 274             total_iters += b.iters;
 275             elapsed_time += b.elapsed_time;
 276             if elapsed_time > how_long {
 277                 return (elapsed_time.as_nanos() as u64, total_iters);
 278             }
 279
 280             b.iters = b.iters.wrapping_mul(2);
 281         }
 282     }
 283 }