Skip to content

Commit a665eaf

Browse files
committed
debug
1 parent e4b82d4 commit a665eaf

File tree

1 file changed

+5
-37
lines changed

1 file changed

+5
-37
lines changed

.github/workflows/trunk.yml

Lines changed: 5 additions & 37 deletions
Original file line numberDiff line numberDiff line change
@@ -787,7 +787,6 @@ jobs:
787787
# done
788788

789789
test-huggingface-transformers-xnnpack:
790-
# NB: Don't run this on fork PRs because they won't have access to the secret and would fail anyway
791790
if: ${{ !github.event.pull_request.head.repo.fork }}
792791
name: test-huggingface-transformers-xnnpack
793792
uses: pytorch/test-infra/.github/workflows/linux_job_v2.yml@main
@@ -796,33 +795,17 @@ jobs:
796795
contents: read
797796
secrets: inherit
798797
strategy:
799-
matrix:
800-
config: [
801-
# XNNPack.
802-
llama3.2-1b|xnnpack|--quantize,
803-
qwen3-0.6b|xnnpack|--quantize,
804-
qwen3-1.7b|xnnpack|--quantize,
805-
gemma3-1b|xnnpack|--quantize,
806-
phi4-mini|xnnpack|--quantize,
807-
smollm2-135m|xnnpack|--quantize,
808-
smollm3-3b|xnnpack|--quantize
809-
]
810798
fail-fast: false
799+
matrix:
800+
model: ["gemma3-4b"]  # llava segfaults, so it is not covered here.
811801
with:
812802
secrets-env: EXECUTORCH_HF_TOKEN
813-
runner: linux.2xlarge.memory
803+
runner: linux.24xlarge
814804
docker-image: ci-image:executorch-ubuntu-22.04-clang12
815805
submodules: 'recursive'
816806
ref: ${{ github.event_name == 'pull_request' && github.event.pull_request.head.sha || github.sha }}
817807
timeout: 90
818-
upload-artifact: profiling-artifacts-${{ strategy.job-index }}
819808
script: |
820-
set -eux
821-
IFS='|' read -r MODEL RECIPE QUANTIZE <<< "${{ matrix.config }}"
822-
echo "Model: $MODEL"
823-
echo "Recipe: $RECIPE"
824-
echo "Quantize: $QUANTIZE"
825-
826809
# The generic Linux job uses the base env by default, not the one set up by the image
827810
CONDA_ENV=$(conda env list --json | jq -r ".envs | .[-1]")
828811
conda activate "${CONDA_ENV}"
@@ -838,23 +821,8 @@ jobs:
838821
pip install git+https://github.com/huggingface/optimum-executorch.git@${OPTIMUM_ET_VERSION}
839822
echo "::endgroup::"
840823
841-
python -c "import torch, torchvision; print(torch.__version__, torchvision.__version__)"
842-
843-
echo "::group::Run tests"
844-
export OUTPUT_DIR="$(pwd)/${MODEL}_${RECIPE}_${QUANTIZE}"
845-
python .ci/scripts/test_huggingface_optimum_model.py --model ${MODEL} --recipe ${RECIPE} ${QUANTIZE} --model_dir ${OUTPUT_DIR}
846-
echo "::endgroup::"
847-
848-
echo "::group::Generate artifacts for performance profiling"
849-
./cmake-out/executor_runner \
850-
--model_path ${OUTPUT_DIR}/model.pte \
851-
--etdump_path ${OUTPUT_DIR}/etdump.etdp
852-
853-
export TSV_PATH=artifacts-to-be-uploaded/${MODEL}_op_prof.tsv
854-
mkdir -p $(dirname "$TSV_PATH")
855-
python3 -m devtools.inspector.inspector_cli \
856-
--etdump_path ${OUTPUT_DIR}/etdump.etdp \
857-
--tsv_path ${TSV_PATH}
824+
echo "::group::Test ${{ matrix.model }}"
825+
python .ci/scripts/test_huggingface_optimum_model.py --model ${{ matrix.model }} --quantize --recipe xnnpack
858826
echo "::endgroup::"
859827
860828
# test-huggingface-transformers-macos:

0 commit comments

Comments
 (0)