Skip to content

Commit 6ebda96

Browse files
Benjamin Cheung
authored and committed
fix: remove the extra configs
1 parent 9e34f00 commit 6ebda96

File tree

1 file changed

+15
-11
lines changed

1 file changed

+15
-11
lines changed

.ci/scripts/test_llama.sh

Lines changed: 15 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -145,31 +145,35 @@ elif [[ "$(uname -m)" == "aarch64" ]] || [[ "$(uname -m)" == "arm64" ]]; then
145145
PLATFORM="arm64"
146146
fi
147147

148+
# Headroom, in seconds, added on top of the recorded export time to form the
# maximum allowed export time for every configuration.
BUFFER_TIME=50
149+
148150
# Lookup threshold based on platform:dtype:mode
149151
case "${PLATFORM}:${DTYPE}:${MODE}" in
152+
150153
# Linux x86 configurations
151-
"x86:fp32:portable") MAX_EXPORT_TIME=100 ;; # actual: 72s
152-
"x86:fp32:xnnpack+custom") MAX_EXPORT_TIME=360 ;; # actual: 276s
153-
"x86:bf16:portable") MAX_EXPORT_TIME=100 ;; # actual: 75s
154+
"x86:fp32:portable") ACT_EXPORT_TIME=72 ;;
155+
"x86:fp32:xnnpack+custom") ACT_EXPORT_TIME=276 ;;
156+
"x86:bf16:portable") ACT_EXPORT_TIME=75 ;;
154157

155158
# Linux ARM64 configurations
156-
"arm64:fp32:portable") MAX_EXPORT_TIME=162 ;; # actual: 124s
157-
"arm64:fp32:xnnpack+custom") MAX_EXPORT_TIME=630 ;; # actual: 483s
158-
"arm64:bf16:portable") MAX_EXPORT_TIME=162 ;; # actual: 118s
159-
"arm64:bf16:custom") MAX_EXPORT_TIME=133 ;; # actual: 102s
159+
"arm64:fp32:portable") ACT_EXPORT_TIME=124 ;;
160+
"arm64:fp32:xnnpack+custom") ACT_EXPORT_TIME=483 ;;
161+
"arm64:bf16:portable") ACT_EXPORT_TIME=118 ;;
162+
"arm64:bf16:custom") ACT_EXPORT_TIME=102 ;;
160163

161164
# macOS configurations
162-
"macos:fp32:mps") MAX_EXPORT_TIME=60 ;; # actual: 30s
163-
"macos:fp32:coreml") MAX_EXPORT_TIME=80 ;; # actual: 61s
164-
"macos:fp32:xnnpack+custom+quantize_kv") MAX_EXPORT_TIME=170 ;; # actual: 133s
165+
"macos:fp32:mps") ACT_EXPORT_TIME=30 ;;
166+
"macos:fp32:coreml") ACT_EXPORT_TIME=61 ;;
167+
"macos:fp32:xnnpack+custom+quantize_kv") ACT_EXPORT_TIME=133 ;;
165168

166169
# Default fallback for unknown configurations
167170
*)
168-
MAX_EXPORT_TIME=500
171+
ACT_EXPORT_TIME=450
169172
# MAX_EXPORT_TIME is only assigned after the case statement, so derive the
# effective default threshold here instead of printing an unset/stale value.
echo "Warning: No threshold defined for ${PLATFORM}:${DTYPE}:${MODE}, using default: $((ACT_EXPORT_TIME + BUFFER_TIME))s"
170173
;;
171174
esac
172175

176+
# Threshold = export time selected by the lookup above plus the fixed buffer.
MAX_EXPORT_TIME=$((ACT_EXPORT_TIME + BUFFER_TIME))
173177

174178
echo "QNN option ${QNN}"
175179
echo "QNN_SDK_ROOT: ${QNN_SDK_ROOT}"

0 commit comments

Comments
 (0)