@@ -237,9 +237,9 @@ jobs:
237237 export.output_name="${OUT_ET_MODEL_NAME}.pte" \
238238 model.use_kv_cache=true \
239239 model.dtype_override=fp32 \
240- base.preq_embedding_quantize=" 8,0" \
240+ base.preq_embedding_quantize=' 8,0' \
241241 quantization.use_spin_quant=native \
242- base.metadata="\{\ "get_bos_id\ ":128000,\ "get_eos_ids\ ":[128009,128001]\}"
242+ base.metadata='{ "get_bos_id":128000,"get_eos_ids":[128009,128001]}'
243243 ls -lh "${OUT_ET_MODEL_NAME}.pte"
244244 elif [[ ${{ matrix.config }} == "llama3_qlora" ]]; then
245245 # QAT + LoRA
@@ -258,7 +258,7 @@ jobs:
258258 base.use_lora=16 \
259259 base.preq_mode="8da4w_output_8da8w" \
260260 base.preq_group_size=32 \
261- base.preq_embedding_quantize=" 8,0" \
261+ base.preq_embedding_quantize=' 8,0' \
262262 model.use_sdpa_with_kv_cache=true \
263263 model.use_kv_cache=true \
264264 backend.xnnpack.enabled=true \
@@ -267,7 +267,7 @@ jobs:
267267 export.max_seq_length=2048 \
268268 export.max_context_length=2048 \
269269 export.output_name="${OUT_ET_MODEL_NAME}.pte" \
270- base.metadata="\{\ "get_bos_id\ ":128000,\ "get_eos_ids\ ":[128009,128001]\}"
270+ base.metadata='{ "get_bos_id":128000,"get_eos_ids":[128009,128001]}'
271271 ls -lh "${OUT_ET_MODEL_NAME}.pte"
272272 elif [[ ${{ matrix.config }} == "llama3_fb16" ]]; then
273273 # Original BF16 version, without any quantization
@@ -280,7 +280,7 @@ jobs:
280280 model.use_sdpa_with_kv_cache=true \
281281 backend.xnnpack.enabled=true \
282282 model.dtype_override=bf16 \
283- base.metadata="\{\ "get_bos_id\ ":128000,\ "get_eos_ids\ ":[128009,128001]\}" \
283+ base.metadata='{ "get_bos_id":128000,"get_eos_ids":[128009,128001]}' \
284284 export.output_name="${OUT_ET_MODEL_NAME}.pte"
285285 ls -lh "${OUT_ET_MODEL_NAME}.pte"
286286 elif [[ ${{ matrix.config }} == "et_xnnpack_custom_spda_kv_cache_8da4w" ]]; then
@@ -296,8 +296,8 @@ jobs:
296296 backend.xnnpack.extended_ops=true \
297297 quantization.qmode=8da4w \
298298 quantization.group_size=32 \
299- quantization.embedding_quantize=" 8,0" \
300- base.metadata="\{\ "get_bos_id\ ":128000,\ "get_eos_ids\ ":[128009,128001]\}" \
299+ quantization.embedding_quantize=' 8,0' \
300+ base.metadata='{ "get_bos_id":128000,"get_eos_ids":[128009,128001]}' \
301301 export.output_name="${OUT_ET_MODEL_NAME}.pte"
302302 ls -lh "${OUT_ET_MODEL_NAME}.pte"
303303 elif [[ ${{ matrix.config }} == "llama3_coreml_ane" ]]; then
@@ -330,8 +330,8 @@ jobs:
330330 backend.xnnpack.extended_ops=true \
331331 quantization.qmode=8da4w \
332332 quantization.group_size=32 \
333- quantization.embedding_quantize=" 8,0" \
334- base.metadata="\{\ "get_bos_id\ ":151644,\ "get_eos_ids\ ":[151645]\}" \
333+ quantization.embedding_quantize=' 8,0' \
334+ base.metadata='{ "get_bos_id":151644,"get_eos_ids":[151645]}' \
335335 export.output_name="${OUT_ET_MODEL_NAME}.pte"
336336 ls -lh "${OUT_ET_MODEL_NAME}.pte"
337337 fi
0 commit comments