File tree Expand file tree Collapse file tree 4 files changed +8
-7
lines changed Expand file tree Collapse file tree 4 files changed +8
-7
lines changed Original file line number Diff line number Diff line change 1- FROM jupyter/pyspark-notebook:latest
1+ FROM docker.io/jupyter/pyspark-notebook:latest
22
33USER root
44
@@ -11,14 +11,13 @@ RUN wget https://repo1.maven.org/maven2/org/apache/iceberg/iceberg-spark-runtime
1111 wget https://repo1.maven.org/maven2/org/projectnessie/nessie-integrations/nessie-spark-extensions-3.5_2.12/0.102.5/nessie-spark-extensions-3.5_2.12-0.102.5.jar -P /usr/local/spark/jars/
1212
1313# Install Python packages (update pyiceberg to match JAR version)
14- RUN pip install pyiceberg==0.9.0 pynessie==0.67.0
14+ RUN pip install pyiceberg==0.9.0 pynessie==0.67.0 findspark
1515
1616# Create a directory for init scripts
1717RUN mkdir -p /usr/local/bin/start-notebook.d
1818
1919# Create init script to configure Spark environment
20- RUN echo '#!/bin/bash\n export PYSPARK_DRIVER_PYTHON=jupyter\n export PYSPARK_DRIVER_PYTHON_OPTS="lab --NotebookApp.token=\'\' --NotebookApp.password=\'\' "' > /usr/local/bin/start-notebook.d/spark-config.sh && \
21- chmod +x /usr/local/bin/start-notebook.d/spark-config.sh
20+ COPY spark-config.sh /usr/local/bin/start-notebook.d/spark-config.sh
2221
2322USER $NB_UID
2423
Original file line number Diff line number Diff line change @@ -120,11 +120,10 @@ services:
120120 --hiveconf hive.server2.thrift.port=10000 \
121121 --hiveconf hive.server2.thrift.bind.host=0.0.0.0 \
122122 --conf spark.sql.extensions=org.apache.iceberg.spark.extensions.IcebergSparkSessionExtensions \
123- --conf spark.sql.catalog.iceberg=org.apache.iceberg.spark.SparkCatalog \
124- --conf spark.sql.catalog.iceberg.type=nessie \
123+ --conf spark.sql.catalog.iceberg=org.apache.iceberg.spark.SparkSessionCatalog \
124+ --conf spark.sql.catalog.iceberg.type=NessieCatalog \
125125 --conf spark.sql.catalog.iceberg.uri=http://nessie:19120/api/v1 \
126126 --conf spark.sql.catalog.iceberg.ref=main \
127- --conf spark.sql.catalog.iceberg.catalog-impl=org.apache.iceberg.aws.s3.S3FileIO \
128127 --conf spark.sql.catalog.iceberg.s3.endpoint=http://minio:9000 \
129128 --conf spark.sql.catalog.iceberg.s3.path-style-access=true \
130129 --conf spark.sql.catalog.iceberg.warehouse=s3a://nessie \
Original file line number Diff line number Diff line change 1+ #! /bin/bash
2+ export PYSPARK_DRIVER_PYTHON=jupyter
3+ export PYSPARK_DRIVER_PYTHON_OPTS=" lab --NotebookApp.token='' --NotebookApp.password=''"
You can’t perform that action at this time.
0 commit comments