feat(profiling): Add custom SQLAlchemy-based profiler to eventually remove Great Expectations profiler #18203
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| name: Airflow Plugin | |
| on: | |
| push: | |
| branches: | |
| - master | |
| - releases/** | |
| paths: | |
| - ".github/workflows/airflow-plugin.yml" | |
| - "metadata-ingestion-modules/airflow-plugin/**" | |
| - "metadata-ingestion/**" | |
| - "metadata-models/**" | |
| pull_request: | |
| branches: | |
| - "**" | |
| paths: | |
| - ".github/workflows/airflow-plugin.yml" | |
| - "metadata-ingestion-modules/airflow-plugin/**" | |
| - "metadata-ingestion/**" | |
| - "metadata-models/**" | |
| release: | |
| types: [published] | |
| workflow_dispatch: | |
| concurrency: | |
| group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }} | |
| cancel-in-progress: true | |
| env: | |
| DEPOT_PROJECT_ID: "${{ vars.DEPOT_PROJECT_ID }}" | |
| jobs: | |
| airflow-plugin: | |
| runs-on: ${{ vars.DEPOT_PROJECT_ID != '' && 'depot-ubuntu-latest' || 'ubuntu-latest' }} | |
| timeout-minutes: 30 | |
| env: | |
| DATAHUB_TELEMETRY_ENABLED: false | |
| strategy: | |
| matrix: | |
| include: | |
| # Note: this should be kept in sync with tox.ini. | |
| # Airflow 2.x versions use standalone openlineage-airflow package (airflow2) | |
| # Airflow 3.x versions use native OpenLineage provider (airflow3) | |
| # | |
| # Known limitation: Airflow constraints pin jaraco.context to older versions | |
| # (e.g., 5.3.0 in 2.9.x) which conflicts with acryl-datahub's requirement of | |
| # jaraco.context>=6.1.0 (security fix for GHSA-58pv-8j8x-9vj2). This is acceptable | |
| # for CI testing; the security constraint is enforced in Docker image builds via | |
| # docker/snippets/ingestion/constraints.txt. | |
| - python-version: "3.10" | |
| extra_pip_requirements: "apache-airflow~=2.7.3" | |
| extra_pip_constraints: "-c https://raw.githubusercontent.com/apache/airflow/constraints-2.7.3/constraints-3.10.txt" | |
| extra_pip_extras: "airflow2" | |
| - python-version: "3.10" | |
| extra_pip_requirements: "apache-airflow~=2.8.1" | |
| extra_pip_constraints: "-c https://raw.githubusercontent.com/apache/airflow/constraints-2.8.1/constraints-3.10.txt" | |
| extra_pip_extras: "airflow2" | |
| - python-version: "3.11" | |
| extra_pip_requirements: "apache-airflow~=2.9.3" | |
| extra_pip_constraints: "-c https://raw.githubusercontent.com/apache/airflow/constraints-2.9.3/constraints-3.11.txt" | |
| extra_pip_extras: "airflow2" | |
| - python-version: "3.11" | |
| extra_pip_requirements: "apache-airflow~=2.10.3" | |
| extra_pip_constraints: "-c https://raw.githubusercontent.com/apache/airflow/constraints-2.10.3/constraints-3.11.txt" | |
| extra_pip_extras: "airflow2" | |
| # Test Airflow 2.10 with apache-airflow-providers-openlineage instead of openlineage-airflow | |
| - python-version: "3.11" | |
| extra_pip_requirements: "apache-airflow~=2.10.3 apache-airflow-providers-openlineage>=1.0.0" | |
| extra_pip_constraints: "-c https://raw.githubusercontent.com/apache/airflow/constraints-2.10.3/constraints-3.11.txt" | |
| extra_pip_extras: "" | |
| - python-version: "3.11" | |
| extra_pip_requirements: "apache-airflow~=3.1.0 apache-airflow-providers-openlineage>=2.8.0" | |
| extra_pip_constraints: "-c https://raw.githubusercontent.com/apache/airflow/constraints-3.1.0/constraints-3.11.txt" | |
| extra_pip_extras: "airflow3" | |
| fail-fast: false | |
| steps: | |
| - name: Set up JDK 17 | |
| uses: actions/setup-java@v5 | |
| with: | |
| distribution: "zulu" | |
| java-version: 17 | |
| - uses: gradle/actions/setup-gradle@v4 | |
| - uses: acryldata/sane-checkout-action@v4 | |
| - uses: actions/setup-python@v6 | |
| with: | |
| python-version: ${{ matrix.python-version }} | |
| - name: Install dependencies | |
| run: ./metadata-ingestion/scripts/install_deps.sh | |
| - name: Install airflow package and test (extras ${{ matrix.extra_pip_requirements }}) | |
| run: ./gradlew -Pextra_pip_requirements='${{ matrix.extra_pip_requirements }}' -Pextra_pip_constraints='${{ matrix.extra_pip_constraints }}' -Pextra_pip_extras='${{ matrix.extra_pip_extras }}' :metadata-ingestion-modules:airflow-plugin:build | |
| - name: pip freeze show list installed | |
| if: always() | |
| run: source metadata-ingestion-modules/airflow-plugin/venv/bin/activate && uv pip freeze | |
| - uses: actions/upload-artifact@v4 | |
| if: ${{ always() && matrix.python-version == '3.10' && matrix.extra_pip_requirements == 'apache-airflow~=2.7.3' }} | |
| with: | |
| name: Test Results (Airflow Plugin ${{ matrix.python-version}}) | |
| path: | | |
| **/build/reports/tests/test/** | |
| **/build/test-results/test/** | |
| **/junit.*.xml | |
| !**/binary/** | |
| - name: Upload coverage to Codecov with ingestion flag | |
| if: always() | |
| uses: codecov/codecov-action@v5 | |
| with: | |
| token: ${{ secrets.CODECOV_TOKEN }} | |
| directory: ./build/coverage-reports/metadata-ingestion-modules/airflow-plugin/ | |
| fail_ci_if_error: false | |
| flags: ingestion-airflow | |
| name: pytest-airflow-${{ matrix.python-version }}-${{ matrix.extra_pip_requirements }} | |
| verbose: true | |
| override_branch: ${{ github.head_ref || github.ref_name }} | |
| - name: Upload test results to Codecov | |
| if: ${{ !cancelled() }} | |
| uses: codecov/test-results-action@v1 | |
| with: | |
| token: ${{ secrets.CODECOV_TOKEN }} | |
| override_branch: ${{ github.head_ref || github.ref_name }} | |
| event-file: | |
| runs-on: ubuntu-latest | |
| steps: | |
| - name: Upload | |
| uses: actions/upload-artifact@v4 | |
| with: | |
| name: Event File | |
| path: ${{ github.event_path }} |