Skip to content

Commit 6761cba

Browse files
fix[bench]: correct s3 path to run benchmarks (#3837)
Signed-off-by: Joe Isaacs <[email protected]>
1 parent 07d69fc commit 6761cba

File tree

4 files changed: 21 additions and 16 deletions.

.github/workflows/nightly-bench.yml

Lines changed: 10 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -26,7 +26,16 @@ jobs:
2626
"subcommand": "tpch",
2727
"name": "TPC-H on NVME",
2828
"targets": "datafusion:parquet,datafusion:vortex,duckdb:parquet,duckdb:vortex",
29-
"scale_factor": "--scale-factor 10"
29+
"scale_factor": "--scale-factor 10.0"
30+
},
31+
{
32+
"id": "tpch-s3",
33+
"subcommand": "tpch",
34+
"name": "TPC-H on S3",
35+
"local_dir": "bench-vortex/data/tpch/10.0",
36+
"remote_storage": "s3://vortex-bench-dev-eu/${{github.ref_name}}/tpch/10.0/",
37+
"targets": "datafusion:parquet,datafusion:vortex,duckdb:parquet",
38+
"scale_factor": "--scale-factor 10.0"
3039
},
3140
{
3241
"id": "tpch-nvme",

.github/workflows/sql-benchmarks.yml

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -33,10 +33,10 @@ on:
3333
"id": "tpch-s3",
3434
"subcommand": "tpch",
3535
"name": "TPC-H on S3",
36-
"local_dir": "bench-vortex/data/tpch/1",
37-
"remote_storage": "s3://vortex-bench-dev-eu/${{github.ref_name}}/tpch/1/",
36+
"local_dir": "bench-vortex/data/tpch/1.0",
37+
"remote_storage": "s3://vortex-bench-dev-eu/${{github.ref_name}}/tpch/1.0/",
3838
"targets": "datafusion:parquet,datafusion:vortex,duckdb:parquet",
39-
"scale_factor": "--scale-factor 1"
39+
"scale_factor": "--scale-factor 1.0"
4040
}
4141
]
4242

bench-vortex/src/datasets/mod.rs

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -26,10 +26,10 @@ pub trait Dataset {
2626
async fn to_vortex_array(&self) -> ArrayRef;
2727
}
2828

29-
#[derive(Debug, Clone, PartialEq, Serialize)]
29+
#[derive(Debug, Clone, PartialEq, Eq, Serialize)]
3030
pub enum BenchmarkDataset {
3131
#[serde(rename = "tpch")]
32-
TpcH { scale_factor: f32 },
32+
TpcH { scale_factor: String },
3333
#[serde(rename = "tpcds")]
3434
TpcDS { scale_factor: u32 },
3535
#[serde(rename = "clickbench")]

bench-vortex/src/tpch_benchmark.rs

Lines changed: 6 additions & 10 deletions
Original file line number | Diff line number | Diff line change
@@ -128,11 +128,9 @@ impl Benchmark for TpcHBenchmark {
128128
}
129129

130130
fn dataset(&self) -> BenchmarkDataset {
131-
let scale_factor: f32 = self
132-
.scale_factor
133-
.parse()
134-
.expect("Scale factor should be valid float");
135-
BenchmarkDataset::TpcH { scale_factor }
131+
BenchmarkDataset::TpcH {
132+
scale_factor: self.scale_factor.clone(),
133+
}
136134
}
137135

138136
fn expected_row_counts(&self) -> Option<&[usize]> {
@@ -233,14 +231,12 @@ impl TpcHBenchmark {
233231
}
234232
fs::create_dir(&tmp_dir)?;
235233
let duckdb_ctx = DuckDBCtx::new_in_memory()?;
236-
let scale_factor: f32 = self
237-
.scale_factor
238-
.parse()
239-
.map_err(|_| anyhow!("Invalid scale factor: {}", self.scale_factor))?;
240234
duckdb_ctx.register_tables(
241235
self.data_url(),
242236
Format::OnDiskVortex,
243-
&BenchmarkDataset::TpcH { scale_factor },
237+
&BenchmarkDataset::TpcH {
238+
scale_factor: self.scale_factor.clone(),
239+
},
244240
)?;
245241

246242
let mut query_files = fs::read_dir(query_dir)?

0 commit comments

Comments
 (0)