-
Notifications
You must be signed in to change notification settings - Fork 25
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
plannertest: criterion-rs based benchmark for both planning and exec…
…ution (#262) Part of #263. ## Problem There is a lack of performance evaluation in optd. Without proper benchmarking, we will not know if some changes cause significant regression in performance. We should keep track of the two aspects of optimizer performance: - plan generation time - actual execution time ## Summary of changes - Add a [Criterion-rs](https://bheisler.github.io/criterion.rs/book/) based benchmark to measure optd performance. - Use the `sqlplannertest` yaml-based setup, bench if there is a `bench` task. - Bump `sqlplannertest` to version 0.4. - better individual test matching added in risinglightdb/sqlplannertest-rs#9 Planning: - Input: SQL statement (aka `datafusion_sql::parser::Statement`). - Measures the time it takes to generate a datafusion physical plan. Execution: - Input: datafusion physical plan outputted from optd (aka `Arc<dyn ExecutionPlan>`). - Measures the time it takes to execute the entire query. ## Next Steps https://github.com/benchmark-action/github-action-benchmark can directly take `cargo bench` results as input. So it will be easy to set up CI. --------- Signed-off-by: Yuchen Liang <[email protected]>
- Loading branch information
Showing
30 changed files
with
1,269 additions
and
339 deletions.
There are no files selected for viewing
Large diffs are not rendered by default.
Oops, something went wrong.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,150 @@ | ||
use std::{ | ||
future::Future, | ||
path::{Path, PathBuf}, | ||
}; | ||
|
||
use anyhow::{bail, Context, Result}; | ||
use criterion::{black_box, criterion_group, criterion_main, BatchSize, Criterion}; | ||
use optd_sqlplannertest::bench_helper::{ | ||
bench_run, bench_setup, ExecutionBenchRunner, PlannerBenchRunner, PlanningBenchRunner, | ||
}; | ||
use sqlplannertest::{discover_tests_with_selections, parse_test_cases, TestCase}; | ||
use tokio::runtime::Runtime; | ||
|
||
fn criterion_benchmark(c: &mut Criterion) { | ||
let selection = "tpch"; | ||
let selections = vec![selection.to_string()]; | ||
|
||
let tests_dir = Path::new(env!("CARGO_MANIFEST_DIR")).join("tests"); | ||
planner_bench_runner( | ||
&tests_dir, | ||
|| async { PlanningBenchRunner::new().await }, | ||
&selections, | ||
c, | ||
) | ||
.unwrap(); | ||
|
||
let path = tests_dir.join(format!("{selection}/bench_populate.sql")); | ||
let populate_sql = std::fs::read_to_string(&path) | ||
.with_context(|| format!("failed to read {}", path.display())) | ||
.unwrap(); | ||
|
||
planner_bench_runner( | ||
&tests_dir, | ||
move || { | ||
let populate_sql = populate_sql.clone(); | ||
async { ExecutionBenchRunner::new(populate_sql).await } | ||
}, | ||
&selections, | ||
c, | ||
) | ||
.unwrap(); | ||
} | ||
|
||
/// Discovers and bench each test case. | ||
/// | ||
/// The user needs to provide a runner function that creates a runner that | ||
/// implements the [`PlannerBenchRunner`] trait. | ||
/// | ||
/// A test case will be selected if: | ||
/// | ||
/// 1. it's included in the `tests_dir` as part of `selections`. | ||
/// 2. has `bench` listed in the task list. | ||
/// | ||
/// ## Limitation | ||
/// | ||
/// Currently only accept sqlplannertest files with single test case. | ||
fn planner_bench_runner<F, Ft, R>( | ||
tests_dir: impl AsRef<Path>, | ||
runner_fn: F, | ||
selections: &[String], | ||
c: &mut Criterion, | ||
) -> Result<()> | ||
where | ||
F: Fn() -> Ft + Send + Sync + 'static + Clone, | ||
Ft: Future<Output = Result<R>> + Send, | ||
R: PlannerBenchRunner + 'static, | ||
{ | ||
let tests = discover_tests_with_selections(&tests_dir, selections)? | ||
.map(|path| { | ||
let path = path?; | ||
let relative_path = path | ||
.strip_prefix(&tests_dir) | ||
.context("unable to relative path")? | ||
.as_os_str(); | ||
let testname = relative_path | ||
.to_str() | ||
.context("unable to convert to string")? | ||
.to_string(); | ||
Ok::<_, anyhow::Error>((path, testname)) | ||
}) | ||
.collect::<Result<Vec<_>, _>>()?; | ||
|
||
for (path, testname) in tests { | ||
bench_runner(path, testname, runner_fn.clone(), c)?; | ||
} | ||
|
||
Ok(()) | ||
} | ||
|
||
/// Bench runner for a test case. | ||
fn bench_runner<F, Ft, R>( | ||
path: PathBuf, | ||
testname: String, | ||
runner_fn: F, | ||
c: &mut Criterion, | ||
) -> Result<()> | ||
where | ||
F: Fn() -> Ft + Send + Sync + 'static + Clone, | ||
Ft: Future<Output = Result<R>> + Send, | ||
R: PlannerBenchRunner, | ||
{ | ||
fn build_runtime() -> Runtime { | ||
tokio::runtime::Builder::new_current_thread() | ||
.enable_all() | ||
.build() | ||
.unwrap() | ||
} | ||
|
||
let testcases = std::fs::read(&path)?; | ||
let testcases: Vec<TestCase> = serde_yaml::from_slice(&testcases)?; | ||
|
||
let testcases = parse_test_cases( | ||
{ | ||
let mut path = path.clone(); | ||
path.pop(); | ||
path | ||
}, | ||
testcases, | ||
)?; | ||
|
||
if testcases.len() != 1 { | ||
bail!( | ||
"planner_bench can only handle sqlplannertest yml file with one test cases, {} has {}", | ||
path.display(), | ||
testcases.len() | ||
); | ||
} | ||
|
||
let testcase = &testcases[0]; | ||
|
||
let should_bench = testcase.tasks.iter().any(|x| x.starts_with("bench")); | ||
if should_bench { | ||
let mut group = c.benchmark_group(testname.strip_suffix(".yml").unwrap()); | ||
let runtime = build_runtime(); | ||
group.bench_function(R::BENCH_NAME, |b| { | ||
b.iter_batched( | ||
|| bench_setup(&runtime, runner_fn.clone(), testcase), | ||
|(runner, input, flags)| { | ||
bench_run(&runtime, runner, black_box(input), testcase, &flags) | ||
}, | ||
BatchSize::PerIteration, | ||
); | ||
}); | ||
group.finish(); | ||
} | ||
Ok(()) | ||
} | ||
|
||
criterion_group!(benches, criterion_benchmark); | ||
criterion_main!(benches); |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,64 @@ | ||
pub mod execution; | ||
pub mod planning; | ||
|
||
use std::future::Future; | ||
|
||
use crate::TestFlags; | ||
use anyhow::Result; | ||
use tokio::runtime::Runtime; | ||
|
||
pub use execution::ExecutionBenchRunner; | ||
pub use planning::PlanningBenchRunner; | ||
|
||
pub trait PlannerBenchRunner { | ||
/// Describes what the benchmark is evaluating. | ||
const BENCH_NAME: &str; | ||
/// Benchmark's input. | ||
type BenchInput; | ||
|
||
/// Setups the necessary environment for the benchmark based on the test case. | ||
/// Returns the input needed for the benchmark. | ||
fn setup( | ||
&mut self, | ||
test_case: &sqlplannertest::ParsedTestCase, | ||
) -> impl std::future::Future<Output = Result<(Self::BenchInput, TestFlags)>> + Send; | ||
|
||
/// Runs the actual benchmark based on the test case and input. | ||
fn bench( | ||
self, | ||
input: Self::BenchInput, | ||
test_case: &sqlplannertest::ParsedTestCase, | ||
flags: &TestFlags, | ||
) -> impl std::future::Future<Output = Result<()>> + Send; | ||
} | ||
|
||
/// Sync wrapper for [`PlannerBenchRunner::setup`] | ||
pub fn bench_setup<F, Ft, R>( | ||
runtime: &Runtime, | ||
runner_fn: F, | ||
testcase: &sqlplannertest::ParsedTestCase, | ||
) -> (R, R::BenchInput, TestFlags) | ||
where | ||
F: Fn() -> Ft + Send + Sync + 'static + Clone, | ||
Ft: Future<Output = Result<R>> + Send, | ||
R: PlannerBenchRunner, | ||
{ | ||
runtime.block_on(async { | ||
let mut runner = runner_fn().await.unwrap(); | ||
let (input, flags) = runner.setup(testcase).await.unwrap(); | ||
(runner, input, flags) | ||
}) | ||
} | ||
|
||
/// Sync wrapper for [`PlannerBenchRunner::bench`] | ||
pub fn bench_run<R>( | ||
runtime: &Runtime, | ||
runner: R, | ||
input: R::BenchInput, | ||
testcase: &sqlplannertest::ParsedTestCase, | ||
flags: &TestFlags, | ||
) where | ||
R: PlannerBenchRunner, | ||
{ | ||
runtime.block_on(async { runner.bench(input, testcase, flags).await.unwrap() }); | ||
} |
Oops, something went wrong.