Skip to content

Commit

Permalink
Merge pull request #119 from instaclustr/issue-118
Browse files Browse the repository at this point in the history
Issue-118, Auto compressor selection fix
  • Loading branch information
cjrolo authored Sep 18, 2024
2 parents 5ead490 + 02d2d85 commit 5f9e562
Show file tree
Hide file tree
Showing 2 changed files with 29 additions and 12 deletions.
39 changes: 28 additions & 11 deletions brro-compressor/src/frame/mod.rs
Original file line number Diff line number Diff line change
Expand Up @@ -60,11 +60,7 @@ impl CompressorFrame {
// We need enough samples to do decent compression, minimum is 128 (2^7)
let data_sample = COMPRESSION_SPEED[compression_speed] as usize;
// Eligible compressors for use
let compressor_list = [
Compressor::Constant,
Compressor::FFT,
Compressor::Polynomial,
];
let compressor_list = [Compressor::FFT, Compressor::Polynomial];
// Do a statistical analysis of the data, let's see if we can pick a compressor out of this.
let stats = DataStats::new(data);
// Check the statistical analysis and choose a compressor, if possible
Expand All @@ -90,6 +86,7 @@ impl CompressorFrame {
compressor,
)
})
.filter(|(result, _)| result.error <= max_error as f64)
.min_by_key(|x| x.0.compressed_data.len())
.unwrap();
self.compressor = *chosen_compressor;
Expand All @@ -100,19 +97,39 @@ impl CompressorFrame {
.compressed_data;
} else {
// Run all the eligible compressors and choose smallest
let (smallest_result, chosen_compressor) = compressor_list
let compressor_results: Vec<_> = compressor_list
.iter()
.map(|compressor| {
(
compressor.get_compress_bounded_results(data, max_error as f64),
compressor,
*compressor,
)
})
.min_by_key(|x| x.0.compressed_data.len())
.unwrap();
.collect();

self.data = smallest_result.compressed_data;
self.compressor = *chosen_compressor;
#[allow(
clippy::neg_cmp_op_on_partial_ord,
reason = "we need to exactly negate `result.error < max_error`, we can't apply de morgans to the expression due to NaN values"
)]
let best_compressor = if compressor_results
.iter()
.all(|(result, _)| !(result.error <= max_error as f64))
{
// To ensure we always have at least one result,
// if all results are above the max error just pick the smallest.
compressor_results
.into_iter()
.min_by_key(|x| x.0.compressed_data.len())
} else {
compressor_results
.into_iter()
.filter(|(result, _)| result.error <= max_error as f64)
.min_by_key(|x| x.0.compressed_data.len())
};

let (result, compressor) = best_compressor.unwrap();
self.data = result.compressed_data;
self.compressor = compressor;
}
debug!("Auto Compressor Selection: {:?}", self.compressor);
}
Expand Down
2 changes: 1 addition & 1 deletion rust-toolchain.toml
Original file line number Diff line number Diff line change
@@ -1,3 +1,3 @@
[toolchain]
channel = "1.80"
channel = "1.81"
components = [ "rustfmt", "clippy" ]

0 comments on commit 5f9e562

Please sign in to comment.