@@ -787,7 +787,6 @@ jobs:
787787 # done
788788
789789 test-huggingface-transformers-xnnpack :
790- # NB: Don't run this on fork PRs because they won't have access to the secret and would fail anyway
791790 if : ${{ !github.event.pull_request.head.repo.fork }}
792791 name : test-huggingface-transformers-xnnpack
793792 uses : pytorch/test-infra/.github/workflows/linux_job_v2.yml@main
@@ -796,33 +795,17 @@ jobs:
796795 contents : read
797796 secrets : inherit
798797 strategy :
799- matrix :
800- config : [
801- # XNNPack.
802- llama3.2-1b|xnnpack|--quantize,
803- qwen3-0.6b|xnnpack|--quantize,
804- qwen3-1.7b|xnnpack|--quantize,
805- gemma3-1b|xnnpack|--quantize,
806- phi4-mini|xnnpack|--quantize,
807- smollm2-135m|xnnpack|--quantize,
808- smollm3-3b|xnnpack|--quantize
809- ]
810798 fail-fast : false
799+ matrix :
800+ model : ["gemma3-4b"] # llava is not covered because it segfaults.
811801 with :
812802 secrets-env : EXECUTORCH_HF_TOKEN
813- runner : linux.2xlarge.memory
803+ runner : linux.24xlarge
814804 docker-image : ci-image:executorch-ubuntu-22.04-clang12
815805 submodules : 'recursive'
816806 ref : ${{ github.event_name == 'pull_request' && github.event.pull_request.head.sha || github.sha }}
817807 timeout : 90
818- upload-artifact : profiling-artifacts-${{ strategy.job-index }}
819808 script : |
820- set -eux
821- IFS='|' read -r MODEL RECIPE QUANTIZE <<< "${{ matrix.config }}"
822- echo "Model: $MODEL"
823- echo "Recipe: $RECIPE"
824- echo "Quantize: $QUANTIZE"
825-
826809 # The generic Linux job chooses to use base env, not the one setup by the image
827810 CONDA_ENV=$(conda env list --json | jq -r ".envs | .[-1]")
828811 conda activate "${CONDA_ENV}"
@@ -838,23 +821,8 @@ jobs:
838821 pip install git+https://github.com/huggingface/optimum-executorch.git@${OPTIMUM_ET_VERSION}
839822 echo "::endgroup::"
840823
841- python -c "import torch, torchvision; print(torch.__version__, torchvision.__version__)"
842-
843- echo "::group::Run tests"
844- export OUTPUT_DIR="$(pwd)/${MODEL}_${RECIPE}_${QUANTIZE}"
845- python .ci/scripts/test_huggingface_optimum_model.py --model ${MODEL} --recipe ${RECIPE} ${QUANTIZE} --model_dir ${OUTPUT_DIR}
846- echo "::endgroup::"
847-
848- echo "::group::Generate artifacts for performance profiling"
849- ./cmake-out/executor_runner \
850- --model_path ${OUTPUT_DIR}/model.pte \
851- --etdump_path ${OUTPUT_DIR}/etdump.etdp
852-
853- export TSV_PATH=artifacts-to-be-uploaded/${MODEL}_op_prof.tsv
854- mkdir -p $(dirname "$TSV_PATH")
855- python3 -m devtools.inspector.inspector_cli \
856- --etdump_path ${OUTPUT_DIR}/etdump.etdp \
857- --tsv_path ${TSV_PATH}
824+ echo "::group::Test ${{ matrix.model }}"
825+ python .ci/scripts/test_huggingface_optimum_model.py --model ${{ matrix.model }} --quantize --recipe xnnpack
858826 echo "::endgroup::"
859827
860828 # test-huggingface-transformers-macos:
0 commit comments