Skip to content

Commit 6ff8c97

Browse files
authored
chore(spark): update images for 25.11.0 (#1280)
* spark: remove 3.5.5
* spark: add 3.5.7
* spark-connect-client: add 3.5.7 and remove unused example
* update changelog
* update changelog
1 parent 850ece9 commit 6ff8c97

File tree

9 files changed: 26 additions and 42 deletions.

CHANGELOG.md

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -17,6 +17,8 @@ All notable changes to this project will be documented in this file.
1717
- kafka: Add version `4.1.0` ([#1277]).
1818
- druid: Add `34.0.0` ([#1263]).
1919
- opa: Add `1.8.0` ([#1279]).
20+
- spark: Add `3.5.7` ([#1280]).
21+
- spark-connect-client: Add `3.5.7` ([#1280]).
2022

2123
### Changed
2224

@@ -36,6 +38,8 @@ All notable changes to this project will be documented in this file.
3638
- kafka: Remove version `4.0.0` ([#1277]).
3739
- druid: Remove `31.0.1` ([#1263]).
3840
- opa: Remove `1.0.1` ([#1279]).
41+
- spark: Remove `3.5.5` ([#1280]).
42+
- spark-connect-client: Remove unused example script from the image ([#1280]).
3943

4044
[#1207]: https://github.com/stackabletech/docker-images/pull/1207
4145
[#1215]: https://github.com/stackabletech/docker-images/pull/1215

spark-connect-client/Dockerfile

Lines changed: 3 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -8,18 +8,17 @@ ARG PYTHON_VERSION
88
ARG RELEASE_VERSION
99
ARG STACKABLE_USER_UID
1010

11-
LABEL name="Stackable Spark Connect Examples" \
11+
LABEL name="Stackable Spark Connect Client" \
1212
maintainer="[email protected]" \
1313
vendor="Stackable GmbH" \
1414
version="${PRODUCT_VERSION}" \
1515
release="${RELEASE_VERSION}" \
1616
summary="Spark Connect Examples" \
17-
description="Spark Connect client libraries for Python and the JVM, including some examples."
17+
description="Spark Connect client libraries for Python and the JVM."
1818

1919
# Need root to install setuptools
2020
USER root
2121

22-
COPY --chown=${STACKABLE_USER_UID}:0 spark-connect-client/stackable/spark-connect-examples /stackable/spark-connect-examples
2322
COPY --chown=${STACKABLE_USER_UID}:0 spark-connect-client/stackable/.jupyter /stackable/.jupyter
2423

2524
RUN <<EOF
@@ -48,4 +47,4 @@ RUN pip install --no-cache-dir --user \
4847
"scikit-learn==1.3.1" \
4948
"matplotlib==3.10.1"
5049

51-
WORKDIR /stackable/spark-connect-examples/python
50+
WORKDIR /stackable

spark-connect-client/boil-config.toml

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -5,6 +5,13 @@ java-base = "17"
55
[versions."3.5.6".build-arguments]
66
python-version = "3.11"
77

8+
[versions."3.5.7".local-images]
9+
spark-k8s = "3.5.7"
10+
java-base = "17"
11+
12+
[versions."3.5.7".build-arguments]
13+
python-version = "3.11"
14+
815
[versions."4.0.0".local-images]
916
spark-k8s = "4.0.0"
1017
java-base = "17"

spark-connect-client/stackable/spark-connect-examples/python/simple-connect-app.py

Lines changed: 0 additions & 24 deletions
This file was deleted.

spark-k8s/Dockerfile

Lines changed: 1 addition & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -197,10 +197,8 @@ RUN <<EOF
197197
sed -i "s/${NEW_VERSION}/${ORIGINAL_VERSION}/g" assembly/target/bom.json
198198
EOF
199199

200-
201-
# As of version 3.5.5, spark-connect jars are not included in the dist folder.
202200
# To avoid classpath conflicts with existing spark applications,
203-
# we create a new dist/connect folder, and copy them here.
201+
# we create a new dist/connect folder, and copy spark connect jars here.
204202
RUN <<EOF
205203

206204
SCALA_BINARY_VERSION=$(grep "scala.binary.version" pom.xml | head -n1 | awk -F '[<>]' '{print $3}')

spark-k8s/boil-config.toml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1,11 +1,11 @@
1-
[versions."3.5.5".local-images]
1+
[versions."3.5.6".local-images]
22
"hadoop/hadoop" = "3.4.1" # Current Stackable LTS version. Source of the AWS and Azure artifacts to Spark's classpath.
33
java-base = "17"
44
java-devel = "17"
55
hbase = "2.6.2" # Current Stackable LTS version. Used to build the HBase connector.
66
vector = "0.49.0"
77

8-
[versions."3.5.5".build-arguments]
8+
[versions."3.5.6".build-arguments]
99
python-version = "3.11"
1010
aws-java-sdk-bundle-version = "2.24.6" # https://mvnrepository.com/artifact/org.apache.hadoop/hadoop-aws/3.4.1
1111
azure-storage-version = "7.0.1" # https://mvnrepository.com/artifact/org.apache.hadoop/hadoop-azure/3.4.1
@@ -17,14 +17,14 @@ jmx-exporter-version = "1.3.0"
1717
tini-version = "0.19.0"
1818
hbase-connector-version = "1.0.1"
1919

20-
[versions."3.5.6".local-images]
20+
[versions."3.5.7".local-images]
2121
"hadoop/hadoop" = "3.4.1" # Current Stackable LTS version. Source of the AWS and Azure artifacts to Spark's classpath.
2222
java-base = "17"
2323
java-devel = "17"
2424
hbase = "2.6.2" # Current Stackable LTS version. Used to build the HBase connector.
2525
vector = "0.49.0"
2626

27-
[versions."3.5.6".build-arguments]
27+
[versions."3.5.7".build-arguments]
2828
python-version = "3.11"
2929
aws-java-sdk-bundle-version = "2.24.6" # https://mvnrepository.com/artifact/org.apache.hadoop/hadoop-aws/3.4.1
3030
azure-storage-version = "7.0.1" # https://mvnrepository.com/artifact/org.apache.hadoop/hadoop-azure/3.4.1

spark-k8s/stackable/patches/3.5.5/0001-Update-CycloneDX-plugin.patch renamed to spark-k8s/stackable/patches/3.5.7/0001-Update-CycloneDX-plugin.patch

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
From 37ad7dcbb2a77267bbddafc4f3b3d99fddda0b28 Mon Sep 17 00:00:00 2001
1+
From 5e3c5568d4bf0fdd4feb19e559d606a55a0d2569 Mon Sep 17 00:00:00 2001
22
From: Razvan-Daniel Mihai <[email protected]>
33
Date: Tue, 11 Mar 2025 17:29:39 +0200
44
Subject: Update CycloneDX plugin
@@ -21,7 +21,7 @@ index ef7c010e93..0f4c1c74e4 100755
2121

2222
# Actually build the jar
2323
diff --git a/pom.xml b/pom.xml
24-
index 9b009c3a42..483dceb8ea 100644
24+
index a0e25ce4d8..b3755a04e7 100644
2525
--- a/pom.xml
2626
+++ b/pom.xml
2727
@@ -3534,7 +3534,12 @@
Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
1-
From c4a23f0060f34a2e1c3b826b9698ad56a5ce7176 Mon Sep 17 00:00:00 2001
1+
From 0cfb1d6b733579ea91df842e685df9db5512ece8 Mon Sep 17 00:00:00 2001
22
From: Razvan-Daniel Mihai <[email protected]>
3-
Date: Tue, 22 Jul 2025 18:51:28 +0200
3+
Date: Tue, 22 Jul 2025 17:34:03 +0200
44
Subject: Backport [SPARK-51311][BUILD] Promote bcprov-jdk18on to compile scope
55

66
---
@@ -24,7 +24,7 @@ index 05645977a0..9834cf333f 100644
2424
org.slf4j:jul-to-slf4j
2525
org.slf4j:slf4j-api
2626
diff --git a/assembly/pom.xml b/assembly/pom.xml
27-
index 2066bbeb7e..05edd80958 100644
27+
index ffa6a0e2b0..19032d6054 100644
2828
--- a/assembly/pom.xml
2929
+++ b/assembly/pom.xml
3030
@@ -85,8 +85,22 @@
@@ -51,7 +51,7 @@ index 2066bbeb7e..05edd80958 100644
5151
<plugins>
5252
<plugin>
5353
diff --git a/dev/deps/spark-deps-hadoop-3-hive-2.3 b/dev/deps/spark-deps-hadoop-3-hive-2.3
54-
index 4feea62dfe..df85dcb6f5 100644
54+
index f110a1988f..88324d3e27 100644
5555
--- a/dev/deps/spark-deps-hadoop-3-hive-2.3
5656
+++ b/dev/deps/spark-deps-hadoop-3-hive-2.3
5757
@@ -28,6 +28,7 @@ aws-java-sdk-bundle/1.12.262//aws-java-sdk-bundle-1.12.262.jar
Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,2 +1,2 @@
1-
base = "7c29c664cdc9321205a98a14858aaf8daaa19db2"
1+
base = "ed00d046951a7ecda6429accd3b9c5b2dc792b65"
22
mirror = "https://github.com/stackabletech/spark.git"

0 commit comments

Comments
 (0)