Skip to content

fix: use dataset file format version to write data files #619

fix: use dataset file format version to write data files

fix: use dataset file format version to write data files #619

Workflow file for this run

# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
name: Spark

# Triggers:
#   * pushes to `main`
#   * pull requests when opened, updated (synchronize), marked ready for
#     review, or reopened
# Changes that only touch docs/ or README.md do not start a run.
on:
  push:
    branches:
      - main
    paths-ignore:
      - 'docs/**'
      - 'README.md'
  pull_request:
    types:
      - opened
      - synchronize
      - ready_for_review
      - reopened
    paths-ignore:
      - 'docs/**'
      - 'README.md'
# One concurrency group per workflow and git ref. An in-progress run in the
# same group is cancelled by a newer one only when the event is a pull
# request; for other events (e.g. pushes to main) it is not cancelled.
concurrency:
  group: ${{ github.workflow }}-${{ github.ref }}
  cancel-in-progress: ${{ github.event_name == 'pull_request' }}
# Workflow-wide environment for Rust/Cargo builds started by the make targets.
env:
  # This env var is used by Swatinem/rust-cache@v2 for the cache
  # key, so we set it to make sure it is always consistent.
  # NOTE(review): no rust-cache step is visible in this workflow — confirm
  # whether this rationale still applies here.
  CARGO_TERM_COLOR: always
  # Disable full debug symbol generation to speed up CI build and keep memory
  # down. "1" selects limited debug info (no type or variable-level
  # information), which still gives useful locations in panic backtraces.
  RUSTFLAGS: "-C debuginfo=1"
  # Print a backtrace when Rust code panics.
  RUST_BACKTRACE: "1"
  # according to: https://matklad.github.io/2021/09/04/fast-rust-builds.html
  # CI builds are faster with incremental disabled.
  CARGO_INCREMENTAL: "0"
  # Restrict Cargo to a single parallel build job.
  # NOTE(review): presumably to limit runner memory use — confirm.
  CARGO_BUILD_JOBS: "1"
jobs:
  # Code-style check: runs `make lint` on Temurin JDK 17.
  lint:
    name: Lint
    runs-on: ubuntu-24.04
    timeout-minutes: 10
    steps:
      - uses: actions/checkout@v4
      - name: Set up Java
        uses: actions/setup-java@v4
        with:
          distribution: temurin
          # Quoted so the version is always passed as a string.
          java-version: "17"
          # Cache Maven dependencies between runs.
          cache: "maven"
      - name: Check code style
        run: make lint

  # Installs every module via `make install-all`.
  install:
    name: Install
    runs-on: ubuntu-24.04
    timeout-minutes: 30
    steps:
      - uses: actions/checkout@v4
      - name: Set up Java
        uses: actions/setup-java@v4
        with:
          distribution: temurin
          java-version: "17"
          cache: "maven"
      - name: Install all modules
        run: make install-all

  # Runs `make test` once per Spark/Scala combination listed in the matrix.
  test:
    name: Test Spark ${{ matrix.spark-version }} / Scala ${{ matrix.scala-version }}
    runs-on: ubuntu-24.04
    timeout-minutes: 30
    strategy:
      # Let the remaining combinations finish when one of them fails.
      fail-fast: false
      matrix:
        # Explicit pairs rather than a cross product: Spark 4.0 is only
        # combined with Scala 2.13.
        include:
          - spark-version: "3.4"
            scala-version: "2.12"
          - spark-version: "3.4"
            scala-version: "2.13"
          - spark-version: "3.5"
            scala-version: "2.12"
          - spark-version: "3.5"
            scala-version: "2.13"
          - spark-version: "4.0"
            scala-version: "2.13"
    steps:
      - uses: actions/checkout@v4
      - name: Set up Java
        uses: actions/setup-java@v4
        with:
          distribution: temurin
          java-version: "17"
          cache: "maven"
      - name: Run tests
        run: make test SPARK_VERSION=${{ matrix.spark-version }} SCALA_VERSION=${{ matrix.scala-version }}

  # Builds the bundle and a Docker test image, then runs the Docker-based
  # integration tests, once per Spark/Scala combination listed in the matrix.
  integration-test:
    name: Integration Test Spark ${{ matrix.spark-version }} / Scala ${{ matrix.scala-version }}
    runs-on: ubuntu-24.04
    timeout-minutes: 45
    strategy:
      # Let the remaining combinations finish when one of them fails.
      fail-fast: false
      matrix:
        # Same explicit Spark/Scala pairs as the `test` job.
        include:
          - spark-version: "3.4"
            scala-version: "2.12"
          - spark-version: "3.4"
            scala-version: "2.13"
          - spark-version: "3.5"
            scala-version: "2.12"
          - spark-version: "3.5"
            scala-version: "2.13"
          - spark-version: "4.0"
            scala-version: "2.13"
    steps:
      - uses: actions/checkout@v4
      - name: Set up Java
        uses: actions/setup-java@v4
        with:
          distribution: temurin
          java-version: "17"
          cache: "maven"
      - name: Set up Docker Buildx
        uses: docker/setup-buildx-action@v3
      - name: Build bundle
        run: make bundle SPARK_VERSION=${{ matrix.spark-version }} SCALA_VERSION=${{ matrix.scala-version }}
      - name: Build Docker image
        # Folded scalar: the lines below are joined with single spaces into
        # one command line. DOCKER_CACHE_FROM/DOCKER_CACHE_TO are handed to
        # make; presumably forwarded to buildx as cache options — verify in
        # the Makefile.
        run: >-
          make docker-build-test-full
          SPARK_VERSION=${{ matrix.spark-version }}
          SCALA_VERSION=${{ matrix.scala-version }}
          DOCKER_CACHE_FROM="type=gha"
          DOCKER_CACHE_TO="type=gha,mode=max"
      - name: Run Docker integration tests
        run: make docker-test SPARK_VERSION=${{ matrix.spark-version }} SCALA_VERSION=${{ matrix.scala-version }}