Skip to content

Commit

Permalink
Organize benchmarks into suites (#204)
Browse files Browse the repository at this point in the history
* Organize benchmarks into suites

This change closes #202 by adding a way to group benchmarks into
`*.suite` files. This incorporates @jameysharp's comments, e.g., to
calculate the benchmark path relative to the suite path and to detect
suite files based on their `.suite` extension.

Though more suites could be added in the future, the result of this is
that suite files can be built (see `benchmarks/shootout.suite`, e.g.)
and then run like:

```console
$ sightglass-cli benchmark benchmarks/shootout.suite -e ...
```

* review: avoid ignoring buffered read errors

* review: return `Vec<PathBuf>` from `BenchmarkOrSuite::paths`

* review: ensure `execute_in_multiple_processes` assigns a single benchmark to each subprocess

* review: document Windows canonicalization concerns

* review: suites are files
  • Loading branch information
abrown authored Oct 12, 2022
1 parent 18ec4c3 commit 1ab26cd
Show file tree
Hide file tree
Showing 5 changed files with 191 additions and 8 deletions.
8 changes: 8 additions & 0 deletions benchmarks/default.suite
Original file line number Diff line number Diff line change
@@ -0,0 +1,8 @@
# These benchmarks are the default Sightglass benchmarks to run when no others
# are specified. Other benchmarks in the repository are valuable, but running
# all benchmarks could take quite some time. This list is a compromise between
# picking representative real-world benchmarks and measurement time.

bz2/benchmark.wasm
pulldown-cmark/benchmark.wasm
spidermonkey/benchmark.wasm
25 changes: 25 additions & 0 deletions benchmarks/shootout.suite
Original file line number Diff line number Diff line change
@@ -0,0 +1,25 @@
# These benchmarks are adapted from the "The Computer Language Benchmarks Game"
# for use within Sightglass. Sightglass only includes a subset of those
# benchmarks which are typically smaller kernels (in some cases, true
# micro-benchmarks) extracted from larger programs. More information is
# available at https://benchmarksgame-team.pages.debian.net/benchmarksgame.

shootout-ackermann/benchmark.wasm
shootout-base64/benchmark.wasm
shootout-ctype/benchmark.wasm
shootout-ed25519/benchmark.wasm
shootout-fib2/benchmark.wasm
shootout-gimli/benchmark.wasm
shootout-heapsort/benchmark.wasm
shootout-keccak/benchmark.wasm
shootout-matrix/benchmark.wasm
shootout-memmove/benchmark.wasm
shootout-minicsv/benchmark.wasm
shootout-nestedloop/benchmark.wasm
shootout-random/benchmark.wasm
shootout-ratelimit/benchmark.wasm
shootout-seqhash/benchmark.wasm
shootout-sieve/benchmark.wasm
shootout-switch/benchmark.wasm
shootout-xblabla20/benchmark.wasm
shootout-xchacha20/benchmark.wasm
27 changes: 19 additions & 8 deletions crates/cli/src/benchmark.rs
Original file line number Diff line number Diff line change
@@ -1,3 +1,4 @@
use crate::suite::BenchmarkOrSuite;
use anyhow::{anyhow, Context, Result};
use rand::{rngs::SmallRng, Rng, SeedableRng};
use sightglass_data::{Format, Measurement, Phase};
Expand All @@ -19,14 +20,23 @@ use structopt::StructOpt;
/// NUMBER_OF_ITERATIONS_PER_PROCESS`.
#[derive(StructOpt, Debug)]
pub struct BenchmarkCommand {
/// The path to the Wasm file(s) to benchmark.
/// The path to the file(s) to benchmark. This accepts one or more:
///
/// - `*.wasm` files: individual benchmarks that meet the requirements
/// outlined in `benchmarks/README.md`
///
/// - `*.suite` files: a file containing a newline-delimited list of
/// benchmarks to execute. A `*.suite` file may contain `#`-prefixed line
/// comments. Relative paths are resolved against the parent directory of
/// the `*.suite` file.
///
/// By default, this will use `benchmarks/default.suite`.
#[structopt(
index = 1,
required = true,
value_name = "WASMFILE",
parse(from_os_str)
default_value = "benchmarks/default.suite",
value_name = "FILE"
)]
wasm_files: Vec<PathBuf>,
benchmarks: Vec<BenchmarkOrSuite>,

/// The benchmark engine(s) with which to run the benchmark.
///
Expand Down Expand Up @@ -144,9 +154,10 @@ impl BenchmarkCommand {
}

let wasm_files: Vec<_> = self
.wasm_files
.benchmarks
.iter()
.map(|f| f.display().to_string())
.flat_map(|f| f.paths())
.map(|p| p.display().to_string())
.collect();
let mut all_measurements = vec![];

Expand Down Expand Up @@ -308,7 +319,7 @@ impl BenchmarkCommand {
// and therefore potentially invalidating relative paths used here).
let engine = check_engine_path(engine)?;

for wasm in &self.wasm_files {
for wasm in self.benchmarks.iter().flat_map(|s| s.paths()) {
choices.push((engine.clone(), wasm, self.processes));
}
}
Expand Down
1 change: 1 addition & 0 deletions crates/cli/src/main.rs
Original file line number Diff line number Diff line change
@@ -1,6 +1,7 @@
mod benchmark;
mod effect_size;
mod fingerprint;
mod suite;
mod summarize;
mod upload;
mod validate;
Expand Down
138 changes: 138 additions & 0 deletions crates/cli/src/suite.rs
Original file line number Diff line number Diff line change
@@ -0,0 +1,138 @@
//! Group benchmarks into suites.
//!
//! [Suite]s are files that contain a newline-separated list of benchmark files
//! to run; see [Suite::parse] for more details on the syntax of these files. To
//! distinguish between a [Suite] file and a regular benchmark file, we use
//! [BenchmarkOrSuite].
use anyhow::Result;
use std::{
ffi::OsStr,
fs, io,
path::{Path, PathBuf},
str::FromStr,
};

/// Decide between a suite of benchmarks or an individual benchmark file.
#[derive(Debug)]
pub enum BenchmarkOrSuite {
Suite(Suite),
Benchmark(PathBuf),
}

impl BenchmarkOrSuite {
/// List all of paths to the benchmarks to run.
pub fn paths(&self) -> Vec<PathBuf> {
match self {
BenchmarkOrSuite::Suite(suite) => suite.benchmarks.clone(),
BenchmarkOrSuite::Benchmark(path) => vec![path.clone()],
}
}
}

/// It is helpful to reference the original path.
impl AsRef<OsStr> for BenchmarkOrSuite {
fn as_ref(&self) -> &OsStr {
match self {
BenchmarkOrSuite::Suite(suite) => suite.path.as_os_str(),
BenchmarkOrSuite::Benchmark(path) => path.as_os_str(),
}
}
}

/// Parse a [BenchmarkOrSuite] from a string path; files ending in `.suite` are
/// assumed to be suite files.
impl FromStr for BenchmarkOrSuite {
type Err = anyhow::Error;
fn from_str(path: &str) -> Result<Self, Self::Err> {
Ok(if Suite::has_extension(path) {
Self::Suite(Suite::parse(path)?)
} else {
Self::Benchmark(PathBuf::from(path))
})
}
}

#[derive(Debug)]
pub struct Suite {
path: PathBuf,
benchmarks: Vec<PathBuf>,
}

impl Suite {
/// Parse the contents of a suite file:
/// - empty lines are ignored
/// - `#`-prefixed lines are ignored
/// - relative paths are resolved using the parent directory of the
/// `suite_path`.
///
/// Note that paths are not canonicalized due to some [concerns on
/// Windows](https://github.com/bytecodealliance/sightglass/pull/204#discussion_r993434406).
/// This choice here should not affect how suites are used by sightglass.
pub fn parse<P: AsRef<Path>>(suite_path: P) -> Result<Self> {
debug_assert!(suite_path.as_ref().is_file());
Self::parse_contents(suite_path.as_ref(), &fs::read(suite_path.as_ref())?)
}

/// Utility function for easier testing.
fn parse_contents<P: AsRef<Path>>(suite_path: P, file_contents: &[u8]) -> Result<Self> {
use io::BufRead;
let suite_path = suite_path.as_ref().to_path_buf();
let parent_dir = suite_path
.parent()
.expect("the suite path must be a file and files must have a parent directory");
let mut benchmarks = vec![];
for line in io::BufReader::new(file_contents).lines() {
let line = line?;
let line = line.trim();
if !line.starts_with("#") && !line.is_empty() {
benchmarks.push(parent_dir.join(line))
}
}
Ok(Self {
path: suite_path,
benchmarks,
})
}

/// Check if a path has the `suite` extension.
fn has_extension<P: AsRef<Path>>(path: P) -> bool {
match path.as_ref().extension() {
Some(ext) => ext == "suite",
None => false,
}
}
}

#[cfg(test)]
mod tests {
use super::*;

const SUITE_PATH: &str = "/home/bench.suite";
const CONTENTS: &str = "
# These benchmarks are...
a.wasm
/b.wasm
../c.wasm
";

#[test]
fn parse() {
let suite = Suite::parse_contents(SUITE_PATH, CONTENTS.as_bytes()).unwrap();

// The suite path should be preserved.
assert_eq!(suite.path, PathBuf::from(SUITE_PATH));

assert_eq!(
suite.benchmarks,
vec![
// Relative paths are appended.
PathBuf::from("/home/a.wasm"),
// Absolute paths are preserved.
PathBuf::from("/b.wasm"),
// Canonicalization happens later.
PathBuf::from("/home/../c.wasm")
]
)
}
}

0 comments on commit 1ab26cd

Please sign in to comment.