fixup

joseph-isaacs · joseph-isaacs · commit 9671c53d285d · 2026-03-24T16:59:57.000Z
Signed-off-by: Joe Isaacs <joe.isaacs@live.co.uk>
diff --git a/Cargo.lock b/Cargo.lock
diff --git a/benchmarks/datafusion-bench/src/main.rs b/benchmarks/datafusion-bench/src/main.rs
@@ -8,7 +8,6 @@ use std::time::Instant;
 use clap::Parser;
 use clap::value_parser;
 use custom_labels::asynchronous::Label;
-use datafusion::arrow::array::Array;
 use datafusion::arrow::array::RecordBatch;
 use datafusion::arrow::util::display::ArrayFormatter;
 use datafusion::arrow::util::display::FormatOptions;
@@ -420,23 +419,19 @@ impl BenchmarkQueryResult for DataFusionQueryResult {
             .unwrap_or_else(|e| format!("<error: {e}>"))
     }
 
-    fn normalized_result(&self) -> (Vec<String>, Vec<Vec<String>>) {
-        normalize_record_batches(&self.0)
+    fn result_rows(&self) -> (Vec<String>, Vec<Vec<String>>) {
+        extract_record_batch_rows(&self.0)
     }
 }
 
-/// Convert Arrow `RecordBatch`es into normalized column names and row values.
+/// Extract raw string values from Arrow `RecordBatch`es.
 ///
-/// Uses [`vortex_bench::validation`] normalization for floats and strings to
-/// match the sqllogictest conventions used by DuckDB's result normalization.
-fn normalize_record_batches(batches: &[RecordBatch]) -> (Vec<String>, Vec<Vec<String>>) {
-    use datafusion::arrow::datatypes::DataType;
+/// Uses `ArrayFormatter` to produce `to_string()` values for every cell.
+/// NULL cells are represented as `"NULL"`. No type-specific normalization is
+/// applied — each engine's `.slt.no` reference files contain the
+/// exact expected output.
+fn extract_record_batch_rows(batches: &[RecordBatch]) -> (Vec<String>, Vec<Vec<String>>) {
     use vortex::error::VortexExpect;
-    use vortex_bench::validation::normalize_decimal;
-    use vortex_bench::validation::normalize_f32;
-    use vortex_bench::validation::normalize_f64;
-    use vortex_bench::validation::normalize_string;
-    use vortex_bench::validation::normalize_timestamp;
 
     let column_names = batches
         .first()
@@ -462,48 +457,8 @@ fn normalize_record_batches(batches: &[RecordBatch]) -> (Vec<String>, Vec<Vec<St
 
         for row_idx in 0..batch.num_rows() {
             let mut row = Vec::with_capacity(batch.num_columns());
-            for (col_idx, formatter) in formatters.iter().enumerate() {
-                let col = batch.column(col_idx);
-                if col.is_null(row_idx) {
-                    row.push("NULL".to_string());
-                } else {
-                    let dt = col.data_type();
-                    let cell = match dt {
-                        DataType::Float32 => {
-                            let arr = col
-                                .as_any()
-                                .downcast_ref::<datafusion::arrow::array::Float32Array>()
-                                .vortex_expect("Float32 downcast");
-                            normalize_f32(arr.value(row_idx))
-                        }
-                        DataType::Float64 => {
-                            let arr = col
-                                .as_any()
-                                .downcast_ref::<datafusion::arrow::array::Float64Array>()
-                                .vortex_expect("Float64 downcast");
-                            normalize_f64(arr.value(row_idx))
-                        }
-                        DataType::Decimal128(_, scale) => {
-                            let arr = col
-                                .as_any()
-                                .downcast_ref::<datafusion::arrow::array::Decimal128Array>()
-                                .vortex_expect("Decimal128 downcast");
-                            normalize_decimal(arr.value(row_idx), *scale)
-                        }
-                        DataType::Utf8
-                        | DataType::LargeUtf8
-                        | DataType::Utf8View
-                        | DataType::Dictionary(..) => {
-                            let s = formatter.value(row_idx).to_string();
-                            normalize_string(&s)
-                        }
-                        DataType::Timestamp(..) | DataType::Date32 | DataType::Date64 => {
-                            normalize_timestamp(&formatter.value(row_idx).to_string())
-                        }
-                        _ => formatter.value(row_idx).to_string(),
-                    };
-                    row.push(cell);
-                }
+            for formatter in &formatters {
+                row.push(formatter.value(row_idx).to_string());
             }
             rows.push(row);
         }
diff --git a/benchmarks/duckdb-bench/src/lib.rs b/benchmarks/duckdb-bench/src/lib.rs
@@ -16,13 +16,10 @@ use vortex_bench::Format;
 use vortex_bench::IdempotentPath;
 use vortex_bench::generate_duckdb_registration_sql;
 use vortex_bench::runner::BenchmarkQueryResult;
-use vortex_bench::validation;
 use vortex_duckdb::duckdb::Config;
 use vortex_duckdb::duckdb::Connection;
 use vortex_duckdb::duckdb::Database;
-use vortex_duckdb::duckdb::ExtractedValue;
 use vortex_duckdb::duckdb::QueryResult;
-use vortex_duckdb::duckdb::Value;
 
 /// DuckDB context for benchmarks.
 pub struct DuckClient {
@@ -209,7 +206,7 @@ impl DuckClient {
 /// Eagerly materialized wrapper around DuckDB query results.
 ///
 /// Materializes the result on construction so that both `row_count()`,
-/// `display()`, and `normalized_result()` can be called via shared reference.
+/// `display()`, and `result_rows()` can be called via shared reference.
 pub struct DuckQueryResult {
     row_count: usize,
     display_string: String,
@@ -246,7 +243,7 @@ impl DuckQueryResult {
                 for col_idx in 0..chunk.column_count() {
                     let vector = chunk.get_vector(col_idx);
                     let cell = match vector.get_value(row_idx, chunk.len()) {
-                        Some(value) => normalize_duckdb_value(&value),
+                        Some(value) => value.to_string(),
                         None => "NULL".to_string(),
                     };
                     row.push(cell);
@@ -273,43 +270,7 @@ impl BenchmarkQueryResult for DuckQueryResult {
         self.display_string
     }
 
-    fn normalized_result(&self) -> (Vec<String>, Vec<Vec<String>>) {
+    fn result_rows(&self) -> (Vec<String>, Vec<Vec<String>>) {
         (self.column_names.clone(), self.normalized_rows.clone())
     }
 }
-
-/// Normalize a DuckDB value to a canonical string representation.
-///
-/// Uses the same normalization as `vortex-sqllogictest`'s `ValueDisplayAdapter`
-/// and the shared [`vortex_bench::validation`] helpers so that results are
-/// comparable with DataFusion output.
-fn normalize_duckdb_value(value: &Value) -> String {
-    match value.extract() {
-        ExtractedValue::Null => "NULL".to_string(),
-        ExtractedValue::TinyInt(v) => v.to_string(),
-        ExtractedValue::SmallInt(v) => v.to_string(),
-        ExtractedValue::Integer(v) => v.to_string(),
-        ExtractedValue::BigInt(v) => v.to_string(),
-        ExtractedValue::HugeInt(v) => v.to_string(),
-        ExtractedValue::UTinyInt(v) => v.to_string(),
-        ExtractedValue::USmallInt(v) => v.to_string(),
-        ExtractedValue::UInteger(v) => v.to_string(),
-        ExtractedValue::UBigInt(v) => v.to_string(),
-        ExtractedValue::UHugeInt(v) => v.to_string(),
-        ExtractedValue::Float(v) => validation::normalize_f32(v),
-        ExtractedValue::Double(v) => validation::normalize_f64(v),
-        ExtractedValue::Boolean(v) => v.to_string(),
-        ExtractedValue::Varchar(s) => validation::normalize_string(s.as_str()),
-        ExtractedValue::Decimal(_, scale, v) => validation::normalize_decimal(v, scale),
-        // Normalize timestamps to a canonical format for cross-engine comparison.
-        ExtractedValue::Date(_)
-        | ExtractedValue::TimestampNs(_)
-        | ExtractedValue::Timestamp(_)
-        | ExtractedValue::TimestampMs(_)
-        | ExtractedValue::TimestampS(_) => validation::normalize_timestamp(&value.to_string()),
-        // Delegate to DuckDB's native string representation for other types.
-        ExtractedValue::Blob(_) | ExtractedValue::Time(_) | ExtractedValue::List(_) => {
-            value.to_string()
-        }
-    }
-}
diff --git a/benchmarks/lance-bench/src/main.rs b/benchmarks/lance-bench/src/main.rs
@@ -168,7 +168,7 @@ impl BenchmarkQueryResult for LanceQueryResult {
             .unwrap_or_else(|e| format!("<error: {e}>"))
     }
 
-    fn normalized_result(&self) -> (Vec<String>, Vec<Vec<String>>) {
+    fn result_rows(&self) -> (Vec<String>, Vec<Vec<String>>) {
         unimplemented!("Lance benchmarks do not support result validation")
     }
 }
diff --git a/vortex-bench/Cargo.toml b/vortex-bench/Cargo.toml
@@ -22,7 +22,6 @@ arrow-array = { workspace = true }
 arrow-schema = { workspace = true }
 arrow-select = { workspace = true }
 async-trait = { workspace = true }
-bigdecimal = { workspace = true }
 bytes = { workspace = true }
 bzip2 = { workspace = true }
 clap = { workspace = true, features = ["derive"] }
diff --git a/vortex-bench/src/benchmark.rs b/vortex-bench/src/benchmark.rs
@@ -3,6 +3,7 @@
 
 //! Core benchmark trait and types.
 
+use std::path::Path;
 use std::path::PathBuf;
 
 use arrow_schema::Schema;
@@ -81,7 +82,15 @@ pub trait Benchmark: Send + Sync {
     /// Reference files are stored in engine-specific subdirectories as
     /// `{dir}/{engine}/q{idx:02}.slt.no` in sqllogictest format (e.g. `results/duckdb/q01.slt.no`).
     /// Use `--validate` to check results against them.
+    ///
+    /// The default implementation uses `dataset_name()` to locate the files at
+    /// `{CARGO_MANIFEST_DIR}/{dataset_name}/slt/results/`.
     fn expected_results_dir(&self) -> Option<PathBuf> {
-        None
+        Some(
+            Path::new(env!("CARGO_MANIFEST_DIR"))
+                .join(self.dataset_name())
+                .join("slt")
+                .join("results"),
+        )
     }
 }
diff --git a/vortex-bench/src/clickbench/benchmark.rs b/vortex-bench/src/clickbench/benchmark.rs
@@ -4,8 +4,6 @@
 use std::env;
 use std::fs;
 use std::path::Path;
-use std::path::PathBuf;
-
 use anyhow::Result;
 use reqwest::Client;
 use url::Url;
@@ -124,14 +122,6 @@ impl Benchmark for ClickBenchBenchmark {
         vec![TableSpec::new("hits", Some(HITS_SCHEMA.clone()))]
     }
 
-    fn expected_results_dir(&self) -> Option<PathBuf> {
-        Some(
-            Path::new(env!("CARGO_MANIFEST_DIR"))
-                .join("clickbench")
-                .join("slt")
-                .join("results"),
-        )
-    }
 }
 
 fn clickbench_flavor(flavor: Flavor) -> String {
diff --git a/vortex-bench/src/runner.rs b/vortex-bench/src/runner.rs
@@ -43,13 +43,11 @@ pub trait BenchmarkQueryResult {
     fn row_count(&self) -> usize;
     /// Human-readable representation of the result (used by Explain mode).
     fn display(self) -> String;
-    /// Normalized result for cross-engine validation.
+    /// Raw result rows for validation.
     ///
-    /// Returns column names and rows of normalized string values suitable for
-    /// comparison across different query engines. Values are normalized using
-    /// sqllogictest conventions (floats rounded to 12 decimal places, etc.)
-    /// via [`crate::validation`].
-    fn normalized_result(&self) -> (Vec<String>, Vec<Vec<String>>);
+    /// Returns column names and rows of string values extracted from the
+    /// query result. No cross-engine normalization is applied.
+    fn result_rows(&self) -> (Vec<String>, Vec<Vec<String>>);
 }
 use crate::display::DisplayFormat;
 use crate::display::print_measurements_json;
@@ -362,7 +360,7 @@ impl SqlBenchmarkRunner {
 
                         // Validate the last iteration's result against the reference file.
                         if validate && self.expected_results_dir.is_some() {
-                            let (_cols, mut rows) = result.normalized_result();
+                            let (_cols, mut rows) = result.result_rows();
                             if !self.validate_query_result(query_idx, &mut rows) {
                                 validation_failures.push((query_idx, format));
                             }
@@ -481,7 +479,7 @@ impl SqlBenchmarkRunner {
 
                         // Validate the last iteration's result against the reference file.
                         if validate && self.expected_results_dir.is_some() {
-                            let (_cols, mut rows) = result.normalized_result();
+                            let (_cols, mut rows) = result.result_rows();
                             if !self.validate_query_result(query_idx, &mut rows) {
                                 validation_failures.push((query_idx, format));
                             }
diff --git a/vortex-bench/src/tpch/benchmark.rs b/vortex-bench/src/tpch/benchmark.rs
@@ -3,10 +3,6 @@
 
 //! TPCH benchmark implementation
 
-use std::env;
-use std::path::Path;
-use std::path::PathBuf;
-
 use glob::Pattern;
 use tracing::info;
 use tracing::warn;
@@ -143,15 +139,6 @@ impl Benchmark for TpcHBenchmark {
         ]
     }
 
-    fn expected_results_dir(&self) -> Option<PathBuf> {
-        Some(
-            Path::new(env!("CARGO_MANIFEST_DIR"))
-                .join("tpch")
-                .join("slt")
-                .join("results"),
-        )
-    }
-
     #[expect(clippy::expect_used, clippy::unwrap_in_result)]
     fn pattern(&self, table_name: &str, format: Format) -> Option<Pattern> {
         Some(
diff --git a/vortex-bench/src/validation.rs b/vortex-bench/src/validation.rs

Original file line number	Diff line number	Diff line change
`@@ -168,7 +168,7 @@ impl BenchmarkQueryResult for LanceQueryResult {`
`168`	`168`	`.unwrap_or_else(\|e\| format!("<error: {e}>"))`
`169`	`169`	`}`
`170`	`170`
`171`		`- fn normalized_result(&self) -> (Vec<String>, Vec<Vec<String>>) {`
	`171`	`+ fn result_rows(&self) -> (Vec<String>, Vec<Vec<String>>) {`
`172`	`172`	`unimplemented!("Lance benchmarks do not support result validation")`
`173`	`173`	`}`
`174`	`174`	`}`