Skip to content

Commit 199ff95

Browse files
committed
Update
[ghstack-poisoned]
1 parent 8f9faa2 commit 199ff95

File tree

2 files changed

+8
-8
lines changed

2 files changed

+8
-8
lines changed

.github/workflows/android-perf.yml

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -228,7 +228,7 @@ jobs:
228228
export.output_name="${OUT_ET_MODEL_NAME}.pte" \
229229
model.use_kv_cache=true \
230230
model.dtype_override=fp32 \
231-
base.preq_embedding_quantize='8,0' \
231+
base.preq_embedding_quantize=\'8,0\' \
232232
quantization.use_spin_quant=native \
233233
base.metadata='{"get_bos_id":128000,"get_eos_ids":[128009,128001]}'
234234
ls -lh "${OUT_ET_MODEL_NAME}.pte"
@@ -249,7 +249,7 @@ jobs:
249249
base.use_lora=16 \
250250
base.preq_mode="8da4w_output_8da8w" \
251251
base.preq_group_size=32 \
252-
base.preq_embedding_quantize='8,0' \
252+
base.preq_embedding_quantize=\'8,0\' \
253253
model.use_sdpa_with_kv_cache=true \
254254
model.use_kv_cache=true \
255255
backend.xnnpack.enabled=true \
@@ -287,7 +287,7 @@ jobs:
287287
backend.xnnpack.extended_ops=true \
288288
quantization.qmode=8da4w \
289289
quantization.group_size=32 \
290-
quantization.embedding_quantize='8,0' \
290+
quantization.embedding_quantize=\'8,0\' \
291291
base.metadata='{"get_bos_id":128000,"get_eos_ids":[128009,128001]}' \
292292
export.output_name="${OUT_ET_MODEL_NAME}.pte"
293293
ls -lh "${OUT_ET_MODEL_NAME}.pte"
@@ -325,7 +325,7 @@ jobs:
325325
backend.xnnpack.extended_ops=true \
326326
quantization.qmode=8da4w \
327327
quantization.group_size=32 \
328-
quantization.embedding_quantize='8,0' \
328+
quantization.embedding_quantize=\'8,0\' \
329329
base.metadata='{"get_bos_id":151644,"get_eos_ids":[151645]}' \
330330
export.output_name="${OUT_ET_MODEL_NAME}.pte"
331331
ls -lh "${OUT_ET_MODEL_NAME}.pte"

.github/workflows/apple-perf.yml

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -237,7 +237,7 @@ jobs:
237237
export.output_name="${OUT_ET_MODEL_NAME}.pte" \
238238
model.use_kv_cache=true \
239239
model.dtype_override=fp32 \
240-
base.preq_embedding_quantize='8,0' \
240+
base.preq_embedding_quantize=\'8,0\' \
241241
quantization.use_spin_quant=native \
242242
base.metadata='{"get_bos_id":128000,"get_eos_ids":[128009,128001]}'
243243
ls -lh "${OUT_ET_MODEL_NAME}.pte"
@@ -258,7 +258,7 @@ jobs:
258258
base.use_lora=16 \
259259
base.preq_mode="8da4w_output_8da8w" \
260260
base.preq_group_size=32 \
261-
base.preq_embedding_quantize='8,0' \
261+
base.preq_embedding_quantize=\'8,0\' \
262262
model.use_sdpa_with_kv_cache=true \
263263
model.use_kv_cache=true \
264264
backend.xnnpack.enabled=true \
@@ -296,7 +296,7 @@ jobs:
296296
backend.xnnpack.extended_ops=true \
297297
quantization.qmode=8da4w \
298298
quantization.group_size=32 \
299-
quantization.embedding_quantize='8,0' \
299+
quantization.embedding_quantize=\'8,0\' \
300300
base.metadata='{"get_bos_id":128000,"get_eos_ids":[128009,128001]}' \
301301
export.output_name="${OUT_ET_MODEL_NAME}.pte"
302302
ls -lh "${OUT_ET_MODEL_NAME}.pte"
@@ -330,7 +330,7 @@ jobs:
330330
backend.xnnpack.extended_ops=true \
331331
quantization.qmode=8da4w \
332332
quantization.group_size=32 \
333-
quantization.embedding_quantize='8,0' \
333+
quantization.embedding_quantize=\'8,0\' \
334334
base.metadata='{"get_bos_id":151644,"get_eos_ids":[151645]}' \
335335
export.output_name="${OUT_ET_MODEL_NAME}.pte"
336336
ls -lh "${OUT_ET_MODEL_NAME}.pte"

0 commit comments

Comments
 (0)