From 224d7e4a9b754dcd2ebf3df567d914ab4621e855 Mon Sep 17 00:00:00 2001 From: Andrew Brown Date: Mon, 24 Oct 2022 16:37:43 -0700 Subject: [PATCH] Display benchmark progress This change emits a string to `stderr` that indicates how far Sightglass has come in running its benchmarks: ``` Iterations completed: 42/100 ``` The idea is to provide more immediate and clear feedback than `RUST_LOG` that Sightglass is doing work and the user can wait for it to finish. This turns out to be rather tricky to do due to the single-process and multi-process paradigms for running benchmarks; the solution is to communicate here with an internal environment variable "protocol." The other tricky bit is the addition of ANSI terminal escape codes. This allows Sightglass to overwrite the same line and avoid filling up a screen with repeated `Iterations completed: ...` messages. This part of the PR could be safely removed without change to the counting functionality but I hope that the implementation is simple enough--and pessimistic enough--that it should not cause trouble down the road. I say "pessimistic" because the heuristic for determining if a terminal can support these "overwriting" terminal codes should just default to printing extra lines if anything looks amiss. This PR is related to #203 and may close that issue. --- Cargo.lock | 6 +- crates/cli/Cargo.toml | 2 + crates/cli/src/benchmark.rs | 40 +++++++++--- crates/cli/src/counter.rs | 122 ++++++++++++++++++++++++++++++++++++ crates/cli/src/main.rs | 1 + 5 files changed, 159 insertions(+), 12 deletions(-) create mode 100644 crates/cli/src/counter.rs diff --git a/Cargo.lock b/Cargo.lock index 2e9b6393..96154aea 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -1006,9 +1006,9 @@ dependencies = [ [[package]] name = "once_cell" -version = "1.13.1" +version = "1.15.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "074864da206b4973b84eb91683020dbefd6a8c3f0f38e054d93954e891935e4e" +checksum = "e82dad04139b71a90c080c8463fe0dc7902db5192d939bd0950f074d014339e1" [[package]] name = "openssl" @@ -1540,10 +1540,12 @@ version = "0.1.0" dependencies = [ "anyhow", "assert_cmd", + "atty", "csv", "env_logger 0.8.4", "libloading", "log", + "once_cell", "predicates 1.0.8", "pretty_env_logger", "rand", diff --git a/crates/cli/Cargo.toml b/crates/cli/Cargo.toml index 6de932e4..6736d8f1 100644 --- a/crates/cli/Cargo.toml +++ b/crates/cli/Cargo.toml @@ -6,8 +6,10 @@ edition = "2021" [dependencies] anyhow = "1.0" +atty = "0.2" libloading = "0.7" log = "0.4" +once_cell = "1.15" pretty_env_logger = "0.4" serde_json = "1.0.64" sightglass-analysis = { path = "../analysis" } diff --git a/crates/cli/src/benchmark.rs b/crates/cli/src/benchmark.rs index cce16476..ebaa7dfa 100644 --- a/crates/cli/src/benchmark.rs +++ b/crates/cli/src/benchmark.rs @@ -1,16 +1,17 @@ +use crate::counter; use crate::suite::BenchmarkOrSuite; use anyhow::{anyhow, Context, Result}; use rand::{rngs::SmallRng, Rng, SeedableRng}; use sightglass_data::{Format, Measurement, Phase}; -use sightglass_recorder::cpu_affinity::bind_to_single_core; -use sightglass_recorder::measure::Measurements; -use sightglass_recorder::{bench_api::BenchApi, benchmark::benchmark, measure::MeasureType}; +use sightglass_recorder::{ + bench_api::BenchApi, benchmark::benchmark, cpu_affinity::bind_to_single_core, + measure::MeasureType, measure::Measurements, +}; use std::{ - fs, + env, fs, io::{self, BufWriter, Write}, path::{Path, PathBuf}, - process::Command, - process::Stdio, + process::{Command, Stdio}, }; use structopt::StructOpt; @@ -161,6 +162,17 @@ impl BenchmarkCommand { .collect(); let mut all_measurements = vec![]; + // Track completion of each benchmark iteration for this process. This + // can get tricky because iterations can run across many processes. To + // communicate progress, the `SingleProcess` and `MultiProcess` counters + // communicate using environment variables (see `counter.rs`). + let mut counter = counter::SingleProcess::new( + self.iterations_per_process * wasm_files.len() * self.engines.len(), + )?; + if counter.is_empty() { + eprintln!("{}", counter.display_to_stderr()); + } + for engine in &self.engines { let engine_path = check_engine_path(engine)?; log::info!("Using benchmark engine: {}", engine_path.display()); @@ -212,6 +224,8 @@ impl BenchmarkCommand { self.check_output(Path::new(wasm_file), stdout, stderr)?; measurements.next_iteration(); + counter.increment(); + eprintln!("{}", counter.display_to_stderr()); } all_measurements.extend(measurements.finish()); @@ -300,14 +314,12 @@ impl BenchmarkCommand { Box::new(io::stdout()) }; - let this_exe = - std::env::current_exe().context("failed to get the current executable's path")?; + let this_exe = env::current_exe().context("failed to get the current executable's path")?; // Shuffle the order in which we spawn benchmark processes. This helps // us avoid some measurement bias from CPU state transitions that aren't // constrained within the duration of process execution, like dynamic // CPU throttling due to overheating. - let mut rng = SmallRng::seed_from_u64(0x1337_4242); // Worklist that we randomly sample from. @@ -324,6 +336,11 @@ impl BenchmarkCommand { } } + // Track completion of each iteration across all processes. + let mut counter = counter::MultiProcess::new( + self.processes * self.iterations_per_process * choices.len(), + ); + // Accumulated measurements from all of our subprocesses. let mut measurements = vec![]; @@ -336,6 +353,7 @@ impl BenchmarkCommand { .stdin(Stdio::null()) .stdout(Stdio::piped()) .stderr(Stdio::inherit()) + .envs(counter.to_environ_vars()) .arg("benchmark") .arg("--processes") .arg("1") @@ -385,6 +403,8 @@ impl BenchmarkCommand { .context("failed to read benchmark subprocess's results")?, ); + counter.increment_by(self.iterations_per_process); + *procs_left -= 1; if *procs_left == 0 { choices.swap_remove(index); @@ -420,7 +440,7 @@ impl BenchmarkCommand { } else if let Some(dir) = wasm_file.as_ref().parent() { dir.into() } else { - std::env::current_dir().context("failed to get the current working directory")? + env::current_dir().context("failed to get the current working directory")? }; Ok(working_dir) } diff --git a/crates/cli/src/counter.rs b/crates/cli/src/counter.rs new file mode 100644 index 00000000..f86b526e --- /dev/null +++ b/crates/cli/src/counter.rs @@ -0,0 +1,122 @@ +//! Track completion of benchmark iterations. +//! +//! In order to give users feedback about when Sightglass will finish running +//! benchmarks, we need to keep track of how many iterations will run. This is +//! complicated by the fact that benchmarks can be run both in a single process +//! (the current one) or across many processes. [`SingleProcess`] and +//! [`MultiProcess`] are completely separate implementations of counters in +//! order to account for this. +//! +//! Because a multi-process run delegates the running of benchmarks to a single +//! process, we need a way to communicate what iteration the single process +//! starts at. This is accomplished here by an internal environment variable +//! protocol: +//! - [`MultiProcess::to_environ_vars`] sets some environment variables with the +//! `completed` and `total` number of iterations +//! - [`SingleProcess::new`] reads the environment to retrieve `completed` and +//! `total`, which it uses when incrementing and printing its state to +//! `stderr`. + +use anyhow::Result; +use once_cell::sync::Lazy; +use std::env; +use std::ffi::OsString; + +const ENV_COMPLETED: &str = "SIGHTGLASS_COUNTER_COMPLETED_ITERATIONS"; +const ENV_TOTAL: &str = "SIGHTGLASS_COUNTER_TOTAL_ITERATIONS"; + +/// Calculate once whether the terminal has the ability to emit [escape +/// codes](https://en.wikipedia.org/wiki/ANSI_escape_code). If so, we can avoid +/// printing repeated `"Iterations completed: ..."` lines. This is loosely based +/// on this [StackOverflow +/// discussion](https://stackoverflow.com/questions/7445658). +static HAS_TERMINAL_ESCAPE_CODES: Lazy = Lazy::new(|| { + let is_atty = atty::is(atty::Stream::Stderr); + let is_supported_platform = if env::consts::OS == "windows" { + env::var_os("TERM") == Some(OsString::from("ANSI")) + } else { + true + }; + let is_rust_logging_enabled = env::var_os("RUST_LOG").is_some(); + + is_atty && is_supported_platform && !is_rust_logging_enabled +}); + +/// Track iterations completed in a single process. +pub struct SingleProcess { + completed: usize, + total: usize, +} + +impl SingleProcess { + /// Construct the initial state by either reading the start state from the + /// environment (i.e., part of a multi-process run) or using the known total iterations + /// (i.e., single-process run). + pub fn new(iterations_per_process: usize) -> Result { + let total = if let Ok(total) = env::var(ENV_TOTAL) { + total.parse()? + } else { + iterations_per_process + }; + let completed = if let Ok(completed) = env::var(ENV_COMPLETED) { + completed.parse()? + } else { + 0 + }; + Ok(Self { completed, total }) + } + pub fn is_empty(&self) -> bool { + self.completed == 0 + } + pub fn increment(&mut self) { + self.completed += 1; + } + /// Print the current number of iterations completed to `stderr`: e.g., + /// `"Iterations completed: 5/10"`. + /// + /// If the terminal supports ANSI terminal escape codes, this will attempt + /// to overwrite the current line, avoiding excessive output. See escape + /// sequences for "escape", "cursor up", "carriage return" + /// [here](https://en.wikipedia.org/wiki/ANSI_escape_code). + /// + /// __Important__: this function (due to `HAS_TERMINAL_ESCAPE_CODES`) has an + /// implicit assumption that it will be used with `eprintln!` (e.g.). + pub fn display_to_stderr(&self) -> String { + let reset_line = if self.completed > 0 && *HAS_TERMINAL_ESCAPE_CODES { + "\x1B[A\r" + } else { + "" + }; + format!( + "{}Iterations completed: {}/{}", + reset_line, self.completed, self.total + ) + } +} + +/// Track iterations completed over a multi-process run. +pub struct MultiProcess { + completed: usize, + total: usize, +} + +impl MultiProcess { + pub fn new(total: usize) -> Self { + Self { + completed: 0, + total, + } + } + /// Communicate the internal counter state to a single-process run; this + /// must match up with [`SingleProcess::new`]. + pub fn to_environ_vars(&self) -> impl IntoIterator { + vec![ + (ENV_COMPLETED, self.completed.to_string()), + (ENV_TOTAL, self.total.to_string()), + ] + } + pub fn increment_by(&mut self, iterations: usize) { + self.completed += iterations; + assert!(self.completed <= self.total) + } +} diff --git a/crates/cli/src/main.rs b/crates/cli/src/main.rs index 68b49828..07b38d6c 100644 --- a/crates/cli/src/main.rs +++ b/crates/cli/src/main.rs @@ -1,4 +1,5 @@ mod benchmark; +mod counter; mod effect_size; mod fingerprint; mod suite;