Skip to content

Commit 23264e7

Browse files
authored
Merge pull request #139 from Tmonster/result_oct_12_2025
More results
2 parents ab6d73b + 358a51d commit 23264e7

File tree

17 files changed

+5331
-58
lines changed

17 files changed

+5331
-58
lines changed

_benchplot/benchplot-dict.R

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -220,7 +220,7 @@ groupby.syntax.dict = {list(
220220
"sum v1:v3 by id6" = "SELECT id6, sum(v1) AS v1, sum(v2) AS v2, sum(v3) AS v3 FROM tbl GROUP BY id6",
221221
"median v3 sd v3 by id4 id5" = "SELECT id4, id5, quantile_cont(v3, 0.5) AS median_v3, stddev(v3) AS sd_v3 FROM tbl GROUP BY id4, id5",
222222
"max v1 - min v2 by id3" = "SELECT id3, max(v1)-min(v2) AS range_v1_v2 FROM tbl GROUP BY id3",
223-
"largest two v3 by id6" = "SELECT id6, v3 AS largest2_v3 FROM (SELECT id6, v3, row_number() OVER (PARTITION BY id6 ORDER BY v3 DESC) AS order_v3 FROM x WHERE v3 IS NOT NULL) sub_query WHERE order_v3 <= 2",
223+
"largest two v3 by id6" = "SELECT id6, unnest(max(v3, 2)) largest2_v3 FROM x WHERE v3 IS NOT NULL GROUP BY id6",
224224
"regression v1 v2 by id2 id4" = "SELECT id2, id4, pow(corr(v1, v2), 2) AS r2 FROM tbl GROUP BY id2, id4",
225225
"sum v3 count by id1:id6" = "SELECT id1, id2, id3, id4, id5, id6, sum(v3) AS v3, count(*) AS count FROM tbl GROUP BY id1, id2, id3, id4, id5, id6"
226226
)},
@@ -232,7 +232,7 @@ groupby.syntax.dict = {list(
232232
"sum v1:v3 by id6" = "SELECT id6, sum(v1) AS v1, sum(v2) AS v2, sum(v3) AS v3 FROM tbl GROUP BY id6",
233233
"median v3 sd v3 by id4 id5" = "SELECT id4, id5, quantile_cont(v3, 0.5) AS median_v3, stddev(v3) AS sd_v3 FROM tbl GROUP BY id4, id5",
234234
"max v1 - min v2 by id3" = "SELECT id3, max(v1)-min(v2) AS range_v1_v2 FROM tbl GROUP BY id3",
235-
"largest two v3 by id6" = "SELECT id6, v3 AS largest2_v3 FROM (SELECT id6, v3, row_number() OVER (PARTITION BY id6 ORDER BY v3 DESC) AS order_v3 FROM x WHERE v3 IS NOT NULL) sub_query WHERE order_v3 <= 2",
235+
"largest two v3 by id6" = "SELECT id6, unnest(max(v3, 2)) largest2_v3 FROM x WHERE v3 IS NOT NULL GROUP BY id6",
236236
"regression v1 v2 by id2 id4" = "SELECT id2, id4, pow(corr(v1, v2), 2) AS r2 FROM tbl GROUP BY id2, id4",
237237
"sum v3 count by id1:id6" = "SELECT id1, id2, id3, id4, id5, id6, sum(v3) AS v3, count(*) AS count FROM tbl GROUP BY id1, id2, id3, id4, id5, id6"
238238
)},

_control/skipped_benchmarks.csv

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -57,5 +57,4 @@ pandas,join,J1_1e9_NA_0_0,c6id.4xlarge
5757
polars,join,J1_1e9_NA_0_0,c6id.4xlarge
5858
pydatatable,join,J1_1e9_NA_0_0,c6id.4xlarge
5959
spark,join,J1_1e9_NA_0_0,c6id.4xlarge
60-
clickhouse,join,J1_1e9_NA_0_0,c6id.4xlarge
6160

_run/run_large.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -30,7 +30,7 @@ echo "Running all solutions on large (50GB) datasets"
3030
./run.sh
3131

3232

33-
###
33+
##
3434
echo "done..."
3535
echo "removing data files"
3636
rm data/*.csv

clickhouse/VERSION

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1 +1 @@
1-
25.1.3.23
1+
25.9.3.48

clickhouse/setup-clickhouse.sh

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,8 @@ sudo service clickhouse-server start ||:
1515

1616
# modify clickhouse settings so data is stored on the mount.
1717
sudo mkdir -p /var/lib/mount/clickhouse-nvme-mount/
18-
sudo chown clickhouse:clickhouse /var/lib/mount/clickhouse-nvme-mount
18+
sudo chown -R clickhouse:clickhouse /var/lib/mount/clickhouse-nvme-mount
19+
sudo chown -R clickhouse:clickhouse /var/lib/mount/clickhouse-nvme-mount/store
1920

2021
# set up clickhouse tmp space
2122
sudo mkdir -p /var/lib/mount/clickhouse-tmp/

clickhouse/ver-clickhouse.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -8,4 +8,4 @@ ch_installed && clickhouse-client --version-clean > clickhouse/VERSION && echo "
88
if [[ $TEST_RUN != "true" ]]; then
99
sudo chown ubuntu:ubuntu clickhouse/VERSION
1010
sudo chown ubuntu:ubuntu clickhouse/REVISION
11-
fi
11+
fi

collapse/setup-collapse.sh

Lines changed: 4 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -3,6 +3,8 @@ set -e
33

44
# install stable collapse
55
mkdir -p ./collapse/r-collapse
6-
Rscript -e 'install.packages(c("Rcpp", "collapse"), lib="./collapse/r-collapse", repos = "http://cloud.r-project.org")'
6+
ncores=`python3 -c 'import multiprocessing as mp; print(mp.cpu_count())'`
7+
MAKEFLAGS="-j$ncores" Rscript -e 'install.packages(c("Rcpp", "collapse"), lib="./collapse/r-collapse", repos = "http://cloud.r-project.org")'
8+
9+
./collapse/ver-collapse.sh
710

8-
./collapse/ver-collapse.sh

datafusion/VERSION

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1 +1 @@
1-
50.0.0
1+
50.1.0

datatable/VERSION

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1 +1 @@
1-
1.16.99
1+
1.17.99

duckdb/VERSION

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1 +1 @@
1-
1.4.0
1+
1.4.1

0 commit comments

Comments
 (0)