@@ -292,7 +292,7 @@ jobs:
292292        echo "::endgroup::" 
293293
294294        echo "::group::Run inference with quantize file" 
295-         for DEVICE in cpu; do # cuda   
295+         for DEVICE in cpu; do # cuda 
296296          # cuda - fails because `AttributeError: 'Linear' object has no attribute '_linear_extra_repr'` 
297297          # follow up with torchao as a separate PR 
298298          echo "saving snapshot for device ${DEVICE} and dtype bfloat16, and reloading as snapshot" 
@@ -349,7 +349,7 @@ jobs:
349349        # python3 torchchat.py export --output-snap model.tc --dtype float32 --quantize torchchat/quant_config/cuda-32.json --checkpoint "./checkpoints/${REPO_NAME}/model.pth" 
350350        # python3 torchchat.py generate --snap model.tc --dtype float32 --checkpoint "./checkpoints/${REPO_NAME}/model.pth" 
351351        # echo "::endgroup::" 
352-          
352+ 
353353test-gpu-aoti-float16 :
354354    permissions :
355355      id-token : write 
@@ -1198,6 +1198,11 @@ jobs:
11981198            sysctl machdep.cpu.brand_string 
11991199            sysctl machdep.cpu.core_count 
12001200          fi 
1201+ name : Install ET 
1202+         run : | 
1203+           echo "Installing ExecuTorch" 
1204+           export TORCHCHAT_ROOT=${PWD} 
1205+           bash torchchat/utils/scripts/install_et.sh 
12011206name : Install torchchat 
12021207        run : | 
12031208          echo "Intalling pip3 packages" 
@@ -1208,11 +1213,6 @@ jobs:
12081213        id : install-torchao-ops 
12091214        run : | 
12101215          bash torchchat/utils/scripts/build_torchao_ops.sh 
1211- name : Install ET 
1212-         run : | 
1213-           echo "Installing ExecuTorch" 
1214-           export TORCHCHAT_ROOT=${PWD} 
1215-           bash torchchat/utils/scripts/install_et.sh 
12161216name : Install runner 
12171217        run : | 
12181218          echo "Installing runner" 
0 commit comments