From 9a9d9905023d29d17a71ed81b2e81331b771db8f Mon Sep 17 00:00:00 2001 From: Clement Rey Date: Sat, 2 Dec 2023 12:49:44 +0100 Subject: [PATCH] GC improvements 0: use-case driven benchmarks (#4394) MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Introduce 2 new benchmark suites that drive the development of this PR series: 1. Logging a tons of scalars, in order, across a bunch of series, themselves scattered across a bunch of plots. 2. Logging a tons of timeless data, across a bunch of entities. ### Benchmarks Hint: it's bad. ``` .../plotting_dashboard/drop_at_least=0.3/bucketsz=1024 1.00 1084.0±4.47ms 54.1 KElem/sec .../plotting_dashboard/drop_at_least=0.3/bucketsz=2048 1.00 2.1±0.02s 27.6 KElem/sec .../plotting_dashboard/drop_at_least=0.3/bucketsz=256 1.00 465.8±2.50ms 125.8 KElem/sec .../plotting_dashboard/drop_at_least=0.3/bucketsz=512 1.00 655.3±2.61ms 89.4 KElem/sec .../plotting_dashboard/drop_at_least=0.3/default 1.00 652.8±4.12ms 89.8 KElem/sec .../timeless_logs/drop_at_least=0.3/bucketsz=1024 1.00 2.4±0.05s 24.2 KElem/sec .../timeless_logs/drop_at_least=0.3/bucketsz=2048 1.00 2.4±0.03s 24.1 KElem/sec .../timeless_logs/drop_at_least=0.3/bucketsz=256 1.00 2.5±0.08s 23.5 KElem/sec .../timeless_logs/drop_at_least=0.3/bucketsz=512 1.00 2.4±0.02s 24.5 KElem/sec .../timeless_logs/drop_at_least=0.3/default 1.00 2.4±0.03s 24.4 KElem/sec ``` --- Part of the GC improvements series: - #4394 - #4395 - #4396 - #4397 - #4398 - #4399 - #4400 - #4401 --- crates/re_arrow_store/Cargo.toml | 15 +- crates/re_arrow_store/benches/gc.rs | 265 +++++++++++++++++++++ crates/re_sdk/Cargo.toml | 2 +- crates/re_types_core/src/loggable_batch.rs | 26 ++ 4 files changed, 299 insertions(+), 9 deletions(-) create mode 100644 crates/re_arrow_store/benches/gc.rs diff --git a/crates/re_arrow_store/Cargo.toml b/crates/re_arrow_store/Cargo.toml index b7b0b7da33cf..f21e6a78a1f6 100644 --- a/crates/re_arrow_store/Cargo.toml +++ b/crates/re_arrow_store/Cargo.toml @@ -19,9 +19,6 @@ all-features = true [features] default = [] -## Enables access to re_types' test components/datatypes. -testing = ["re_log_types/testing", "re_types/testing"] - ## Enables `parking_lot`'s deadlock detection background thread. deadlock_detection = ["parking_lot/deadlock_detection"] @@ -73,7 +70,7 @@ polars-ops = { workspace = true, optional = true, features = [ [dev-dependencies] re_log_types = { workspace = true, features = ["testing"] } -re_types = { workspace = true, features = ["datagen"] } +re_types = { workspace = true, features = ["datagen", "testing"] } anyhow.workspace = true criterion.workspace = true @@ -98,7 +95,7 @@ bench = false [[example]] name = "dump_dataframe" path = "examples/dump_dataframe.rs" -required-features = ["polars", "testing"] +required-features = ["polars"] [[example]] name = "latest_component" @@ -116,15 +113,17 @@ path = "examples/range_components.rs" required-features = ["polars"] +[[bench]] +name = "arrow2" +harness = false + [[bench]] name = "data_store" harness = false -required-features = ["testing"] [[bench]] -name = "arrow2" +name = "gc" harness = false -required-features = ["testing"] [[bench]] name = "vectors" diff --git a/crates/re_arrow_store/benches/gc.rs b/crates/re_arrow_store/benches/gc.rs new file mode 100644 index 000000000000..8504602aefb9 --- /dev/null +++ b/crates/re_arrow_store/benches/gc.rs @@ -0,0 +1,265 @@ +#[global_allocator] +static GLOBAL: mimalloc::MiMalloc = mimalloc::MiMalloc; + +use criterion::{criterion_group, criterion_main, BatchSize, Criterion}; + +use itertools::Itertools; +use re_arrow_store::{ + DataStore, DataStoreConfig, GarbageCollectionOptions, GarbageCollectionTarget, +}; +use re_log_types::{ + build_frame_nr, build_log_time, DataRow, DataTable, EntityPath, RowId, TableId, Time, TimePoint, +}; +use re_types::components::InstanceKey; +use re_types_core::{AsComponents, ComponentBatch, ComponentName, Loggable as _}; + +criterion_group!(benches, plotting_dashboard, timeless_logs); +criterion_main!(benches); + +// --- + +#[cfg(not(debug_assertions))] +mod constants { + pub const NUM_ENTITY_PATHS: usize = 20; + pub const NUM_ROWS_PER_ENTITY_PATH: usize = 10_000; +} + +// `cargo test` also runs the benchmark setup code, so make sure they run quickly: +#[cfg(debug_assertions)] +mod constants { + pub const NUM_ENTITY_PATHS: usize = 1; + pub const NUM_ROWS_PER_ENTITY_PATH: usize = 1; +} + +use constants::{NUM_ENTITY_PATHS, NUM_ROWS_PER_ENTITY_PATH}; + +fn num_rows_per_bucket() -> &'static [u64] { + #[cfg(feature = "core_benchmarks_only")] + { + &[] + } + #[cfg(not(feature = "core_benchmarks_only"))] + { + &[256, 512, 1024, 2048] + } +} + +// --- Benchmarks --- + +fn plotting_dashboard(c: &mut Criterion) { + const DROP_AT_LEAST: f64 = 0.3; + + let mut group = c.benchmark_group(format!( + "datastore/num_entities={NUM_ENTITY_PATHS}/num_rows_per_entity={NUM_ROWS_PER_ENTITY_PATH}/plotting_dashboard/drop_at_least={DROP_AT_LEAST}" + )); + group.throughput(criterion::Throughput::Elements( + ((NUM_ENTITY_PATHS * NUM_ROWS_PER_ENTITY_PATH) as f64 * DROP_AT_LEAST) as _, + )); + group.sample_size(10); + + let gc_settings = GarbageCollectionOptions { + target: GarbageCollectionTarget::DropAtLeastFraction(DROP_AT_LEAST), + gc_timeless: true, + protect_latest: 1, + purge_empty_tables: false, + dont_protect: Default::default(), + }; + + let mut timegen = |i| { + [ + build_log_time(Time::from_seconds_since_epoch(i as _)), + build_frame_nr((i as i64).into()), + ] + .into() + }; + + let mut datagen = |i| { + Box::new(re_types::archetypes::TimeSeriesScalar::new(i as f64)) as Box + }; + + // Default config + group.bench_function("default", |b| { + let store = build_store( + Default::default(), + InstanceKey::name(), + false, + &mut timegen, + &mut datagen, + ); + b.iter_batched( + || store.clone(), + |mut store| { + let (_, stats_diff) = store.gc(&gc_settings); + stats_diff + }, + BatchSize::LargeInput, + ); + }); + + // Emulate more or less bucket + for &num_rows_per_bucket in num_rows_per_bucket() { + group.bench_function(format!("bucketsz={num_rows_per_bucket}"), |b| { + let store = build_store( + DataStoreConfig { + indexed_bucket_num_rows: num_rows_per_bucket, + ..Default::default() + }, + InstanceKey::name(), + false, + &mut timegen, + &mut datagen, + ); + b.iter_batched( + || store.clone(), + |mut store| { + let (_, stats_diff) = store.gc(&gc_settings); + stats_diff + }, + BatchSize::LargeInput, + ); + }); + } +} + +fn timeless_logs(c: &mut Criterion) { + const DROP_AT_LEAST: f64 = 0.3; + + let mut group = c.benchmark_group(format!( + "datastore/num_entities={NUM_ENTITY_PATHS}/num_rows_per_entity={NUM_ROWS_PER_ENTITY_PATH}/timeless_logs/drop_at_least={DROP_AT_LEAST}" + )); + group.throughput(criterion::Throughput::Elements( + ((NUM_ENTITY_PATHS * NUM_ROWS_PER_ENTITY_PATH) as f64 * DROP_AT_LEAST) as _, + )); + group.sample_size(10); + + let gc_settings = GarbageCollectionOptions { + target: GarbageCollectionTarget::DropAtLeastFraction(DROP_AT_LEAST), + gc_timeless: true, + protect_latest: 1, + purge_empty_tables: false, + dont_protect: Default::default(), + }; + + let mut timegen = |_| TimePoint::timeless(); + + let mut datagen = |i: usize| { + Box::new(re_types::archetypes::TextLog::new(i.to_string())) as Box + }; + + // Default config + group.bench_function("default", |b| { + let store = build_store( + Default::default(), + InstanceKey::name(), + false, + &mut timegen, + &mut datagen, + ); + b.iter_batched( + || store.clone(), + |mut store| { + let (_, stats_diff) = store.gc(&gc_settings); + stats_diff + }, + BatchSize::LargeInput, + ); + }); + + // Emulate more or less bucket + for &num_rows_per_bucket in num_rows_per_bucket() { + group.bench_function(format!("bucketsz={num_rows_per_bucket}"), |b| { + let store = build_store( + DataStoreConfig { + indexed_bucket_num_rows: num_rows_per_bucket, + ..Default::default() + }, + InstanceKey::name(), + false, + &mut timegen, + &mut datagen, + ); + b.iter_batched( + || store.clone(), + |mut store| { + let (_, stats_diff) = store.gc(&gc_settings); + stats_diff + }, + BatchSize::LargeInput, + ); + }); + } +} + +// --- Helpers --- + +fn build_store( + config: DataStoreConfig, + cluster_key: ComponentName, + packed: bool, + timegen: &mut FT, + datagen: &mut FD, +) -> DataStore +where + FT: FnMut(usize) -> TimePoint, + FD: FnMut(usize) -> Box, +{ + let mut store = DataStore::new( + re_log_types::StoreId::random(re_log_types::StoreKind::Recording), + cluster_key, + config, + ); + + let tables = (0..NUM_ENTITY_PATHS) + .map(|i| build_table(format!("entity_path_{i}").into(), packed, timegen, datagen)) + .collect_vec(); + let mut rows_per_table = tables.iter().map(|table| table.to_rows()).collect_vec(); + + // NOTE: interleave insertions between entities to more closely match real world scenarios. + for _ in 0..NUM_ROWS_PER_ENTITY_PATH { + #[allow(clippy::needless_range_loop)] // readability + for i in 0..NUM_ENTITY_PATHS { + let row = rows_per_table[i].next().unwrap(); + store.insert_row(&row.unwrap()).unwrap(); + } + } + + store +} + +fn build_table( + entity_path: EntityPath, + packed: bool, + timegen: &mut FT, + datagen: &mut FD, +) -> DataTable +where + FT: FnMut(usize) -> TimePoint, + FD: FnMut(usize) -> Box, +{ + let mut table = DataTable::from_rows( + TableId::ZERO, + (0..NUM_ROWS_PER_ENTITY_PATH).map(move |i| { + DataRow::from_component_batches( + RowId::random(), + // NOTE: insert in multiple timelines to more closely match real world scenarios. + timegen(i), + entity_path.clone(), + datagen(i) + .as_component_batches() + .iter() + .map(|batch| batch as &dyn ComponentBatch), + ) + .unwrap() + }), + ); + + // Do a serialization roundtrip to pack everything in contiguous memory. + if packed { + let (schema, columns) = table.serialize().unwrap(); + table = DataTable::deserialize(TableId::ZERO, &schema, &columns).unwrap(); + } + + table.compute_all_size_bytes(); + + table +} diff --git a/crates/re_sdk/Cargo.toml b/crates/re_sdk/Cargo.toml index 5c0fa9a5578b..406f458689d6 100644 --- a/crates/re_sdk/Cargo.toml +++ b/crates/re_sdk/Cargo.toml @@ -68,7 +68,7 @@ webbrowser = { workspace = true, optional = true } [dev-dependencies] -re_arrow_store = { workspace = true, features = ["testing"] } +re_arrow_store.workspace = true itertools.workspace = true ndarray-rand.workspace = true diff --git a/crates/re_types_core/src/loggable_batch.rs b/crates/re_types_core/src/loggable_batch.rs index 9708e25e1f97..f1b260075cb5 100644 --- a/crates/re_types_core/src/loggable_batch.rs +++ b/crates/re_types_core/src/loggable_batch.rs @@ -89,6 +89,32 @@ impl<'a> std::ops::Deref for MaybeOwnedComponentBatch<'a> { } } +impl<'a> LoggableBatch for MaybeOwnedComponentBatch<'a> { + type Name = ComponentName; + + #[inline] + fn name(&self) -> Self::Name { + self.as_ref().name() + } + + #[inline] + fn num_instances(&self) -> usize { + self.as_ref().num_instances() + } + + #[inline] + fn arrow_field(&self) -> arrow2::datatypes::Field { + self.as_ref().arrow_field() + } + + #[inline] + fn to_arrow(&self) -> SerializationResult> { + self.as_ref().to_arrow() + } +} + +impl<'a> ComponentBatch for MaybeOwnedComponentBatch<'a> {} + // --- Unary --- impl LoggableBatch for L {