Skip to content

Commit f673dc5

Browse files
committed
threshold with script
1 parent 7f0c68f commit f673dc5

File tree

2 files changed

+27
-2
lines changed

2 files changed

+27
-2
lines changed

.ci/scripts/test_qnn_static_llama_eval.sh

Lines changed: 24 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -27,6 +27,29 @@ fi
2727

2828
which "${PYTHON_EXECUTABLE}"
2929

30+
# -------------------------------
# Parse args
# -------------------------------
# Consumes the script's positional parameters. Recognized options, each of
# which takes exactly one value:
#   --flags <string>      stored verbatim in EXTRA_FLAGS (default: empty)
#   --threshold <value>   stored in THRESHOLD (default: 62.0)
# Any other argument prints "Unknown option: <arg>" and exits with status 1.
# An option given without its value prints an error to stderr and exits 1.
#
# NOTE(review): the surrounding diff context shows a later `EXTRA_FLAGS="$@"`
# assignment. Once this loop has shifted away every argument, "$@" is empty,
# so that assignment would discard the value parsed here -- confirm and
# remove it if it is still present.
EXTRA_FLAGS=""
THRESHOLD=62.0 # default fallback

while [[ $# -gt 0 ]]; do
  case "$1" in
    --flags | --threshold)
      # With only the option name left, `shift 2` fails and shifts nothing,
      # so without errexit this loop would never terminate. Reject it here.
      if [[ $# -lt 2 ]]; then
        echo "Missing value for option: $1" >&2
        exit 1
      fi
      if [[ "$1" == "--flags" ]]; then
        EXTRA_FLAGS="$2"
      else
        THRESHOLD="$2"
      fi
      shift 2
      ;;
    *)
      echo "Unknown option: $1"
      exit 1
      ;;
  esac
done
52+
3053
# Config
3154
PYTHON_EXECUTABLE="${PYTHON_EXECUTABLE:-python3}"
3255
MODEL="qwen2_5-0_5b"
@@ -39,7 +62,7 @@ EXTRA_FLAGS="$@"
3962
# Run command and capture *both stdout and stderr*
4063
LOG_FILE="eval_${MODEL}_$(date +%Y%m%d_%H%M%S).log"
4164

42-
echo ">>> Running evaluation..."
65+
echo ">>> Running evaluation with flags: $EXTRA_FLAGS | threshold: $THRESHOLD"
4366
$PYTHON_EXECUTABLE -m executorch.examples.qualcomm.oss_scripts.llama.eval_llama_qnn \
4467
--decoder_model "$MODEL" \
4568
--quant_linear_only \

.github/workflows/pull.yml

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -639,7 +639,9 @@ jobs:
639639
640640
# Test static llama weight sharing and accuracy
641641
echo ">>> Running config: ${{ matrix.config.name }}"
642-
PYTHON_EXECUTABLE=python bash .ci/scripts/test_qnn_static_llama_eval.sh ${{ matrix.config.flags }}
642+
PYTHON_EXECUTABLE=python bash .ci/scripts/test_qnn_static_llama_eval.sh \
643+
${{ matrix.config.flags }} \
644+
--threshold ${{ matrix.config.threshold }}
643645
644646
645647
# test-qnn-models-linux:

0 commit comments

Comments
 (0)