File tree
3 files changed
+40
-17
lines changed- examples/models/llama
- source_transformation
- third-party
3 files changed
+40
-17
lines changed| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
1238 | 1238 | | |
1239 | 1239 | | |
1240 | 1240 | | |
1241 | | - | |
1242 | | - | |
1243 | | - | |
1244 | | - | |
1245 | | - | |
1246 | | - | |
| 1241 | + | |
| 1242 | + | |
| 1243 | + | |
| 1244 | + | |
| 1245 | + | |
| 1246 | + | |
| 1247 | + | |
| 1248 | + | |
| 1249 | + | |
1247 | 1250 | | |
1248 | 1251 | | |
1249 | 1252 | | |
| |||
1322 | 1325 | | |
1323 | 1326 | | |
1324 | 1327 | | |
| 1328 | + | |
1325 | 1329 | | |
1326 | 1330 | | |
1327 | 1331 | | |
| |||
1391 | 1395 | | |
1392 | 1396 | | |
1393 | 1397 | | |
1394 | | - | |
| 1398 | + | |
| 1399 | + | |
| 1400 | + | |
| 1401 | + | |
1395 | 1402 | | |
1396 | 1403 | | |
1397 | 1404 | | |
| |||
1422 | 1429 | | |
1423 | 1430 | | |
1424 | 1431 | | |
| 1432 | + | |
1425 | 1433 | | |
1426 | 1434 | | |
1427 | 1435 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
49 | 49 | | |
50 | 50 | | |
51 | 51 | | |
| 52 | + | |
52 | 53 | | |
53 | 54 | | |
54 | 55 | | |
| |||
119 | 120 | | |
120 | 121 | | |
121 | 122 | | |
122 | | - | |
123 | 123 | | |
124 | 124 | | |
125 | 125 | | |
| |||
134 | 134 | | |
135 | 135 | | |
136 | 136 | | |
137 | | - | |
138 | 137 | | |
139 | 138 | | |
| 139 | + | |
| 140 | + | |
| 141 | + | |
| 142 | + | |
140 | 143 | | |
141 | 144 | | |
142 | 145 | | |
| |||
170 | 173 | | |
171 | 174 | | |
172 | 175 | | |
| 176 | + | |
| 177 | + | |
| 178 | + | |
| 179 | + | |
173 | 180 | | |
174 | 181 | | |
175 | 182 | | |
| |||
191 | 198 | | |
192 | 199 | | |
193 | 200 | | |
| 201 | + | |
| 202 | + | |
| 203 | + | |
| 204 | + | |
194 | 205 | | |
195 | 206 | | |
196 | 207 | | |
| |||
580 | 591 | | |
581 | 592 | | |
582 | 593 | | |
| 594 | + | |
583 | 595 | | |
584 | 596 | | |
585 | 597 | | |
| |||
592 | 604 | | |
593 | 605 | | |
594 | 606 | | |
| 607 | + | |
595 | 608 | | |
596 | 609 | | |
597 | 610 | | |
598 | 611 | | |
599 | | - | |
600 | | - | |
601 | | - | |
602 | | - | |
603 | | - | |
| 612 | + | |
604 | 613 | | |
605 | 614 | | |
606 | 615 | | |
| |||
627 | 636 | | |
628 | 637 | | |
629 | 638 | | |
630 | | - | |
| 639 | + | |
| 640 | + | |
| 641 | + | |
| 642 | + | |
631 | 643 | | |
632 | 644 | | |
633 | 645 | | |
| |||
765 | 777 | | |
766 | 778 | | |
767 | 779 | | |
| 780 | + | |
768 | 781 | | |
769 | 782 | | |
770 | 783 | | |
| |||
825 | 838 | | |
826 | 839 | | |
827 | 840 | | |
| 841 | + | |
828 | 842 | | |
829 | 843 | | |
830 | 844 | | |
| |||
838 | 852 | | |
839 | 853 | | |
840 | 854 | | |
| 855 | + | |
841 | 856 | | |
842 | 857 | | |
843 | 858 | | |
| |||
850 | 865 | | |
851 | 866 | | |
852 | 867 | | |
| 868 | + | |
853 | 869 | | |
854 | 870 | | |
855 | 871 | | |
| |||
877 | 893 | | |
878 | 894 | | |
879 | 895 | | |
880 | | - | |
881 | 896 | | |
882 | 897 | | |
883 | 898 | | |
| |||
- .github/scripts/torchao_model_releases/README.md+9-2
- .github/scripts/torchao_model_releases/eval.sh+11-2
- .github/scripts/torchao_model_releases/eval_quality.sh+15-7
- benchmarks/benchmark_e2e_fp8_sparse_linear.py+15
- benchmarks/float8/training/parse_torchtitan_logs.py+1-1
- benchmarks/prototype/moe_training/mxfp8/bench_all_to_all_v.py+291
- benchmarks/utils.py+24
- test/prototype/moe_training/mxfp8/__init__.py
- test/prototype/moe_training/mxfp8/test_mxfp8_a2a.py+270
- test/prototype/moe_training/testing_utils.py+31
- test/prototype/mx_formats/test_inference_workflow.py+61-11
- test/prototype/mx_formats/test_mx_tensor.py+35-394
- test/prototype/mx_formats/test_nvfp4_tensor.py+65-23
- test/prototype/safetensors/test_safetensors_support.py+29-8
- test/prototype/test_awq.py+138-138
- test/prototype/test_parq.py+3-3
- test/prototype/test_smoothquant.py+40-34
- test/prototype/test_tensor_conversion.py+2-2
- test/quantization/pt2e/test_quantize_pt2e.py+103
- test/quantization/quantize_/workflows/float8/test_float8_tensor.py+21-3
- test/quantization/quantize_/workflows/int4/test_int4_preshuffled_tensor.py+2-2
- test/quantization/quantize_/workflows/int4/test_int4_tensor.py+2-2
- test/quantization/quantize_/workflows/int4/test_int4_tile_packed_to_4d_tensor.py+24-2
- test/quantization/quantize_/workflows/intx/test_intx_unpacked_to_int8_tensor.py+32
- test/quantization/test_qat.py+17-11
- test/test_ops.py+11-15
- test/test_utils.py+4
- torchao/_models/_eval.py+8-3
- torchao/csrc/cpu/aten_kernels/scaled_embedding_bag.cpp+79-30
- torchao/csrc/cuda/rowwise_scaled_linear_sparse_cutlass/rowwise_scaled_linear_sparse_cutlass_f8f8.cu+8
- torchao/dtypes/floatx/cutlass_semi_sparse_layout.py+44-3
- torchao/prototype/awq/core.py+3-1
- torchao/prototype/inductor/codegen/cpp_int8_sdpa_template.py+9-17
- torchao/prototype/moe_training/kernels/mxfp8/__init__.py+11
- torchao/prototype/moe_training/kernels/mxfp8/comms.py+569
- torchao/prototype/moe_training/kernels/mxfp8/quant.py
- torchao/prototype/moe_training/kernels/triton_utils.py+211
- torchao/prototype/mx_formats/inference_workflow.py+22-8
- torchao/prototype/mx_formats/mx_ops.py-354
- torchao/prototype/mx_formats/mx_tensor.py+287-18
- torchao/prototype/mx_formats/nvfp4_tensor.py+81-50
- torchao/prototype/mx_formats/utils.py+22-1
- torchao/prototype/qat/__init__.py+2-2
- torchao/prototype/qat/nvfp4.py+152-34
- torchao/prototype/safetensors/safetensors_support.py+13-7
- torchao/prototype/safetensors/safetensors_utils.py+26-7
- torchao/prototype/tensor_conversion/api.py+2-2
- torchao/quantization/__init__.py+4
- torchao/quantization/granularity.py+15
- torchao/quantization/observer.py+1-21
- torchao/quantization/pt2e/__init__.py+10-8
- torchao/quantization/pt2e/_affine_quantization.py+2-2
- torchao/quantization/pt2e/observer.py+10-134
- torchao/quantization/pt2e/prepare.py+24-9
- torchao/quantization/qat/api.py+29-1
- torchao/quantization/qat/fake_quantize_config.py+10-7
- torchao/quantization/qat/fake_quantizer.py+1-9
- torchao/quantization/quant_api.py+23-2
- torchao/quantization/quant_primitives.py+94
- torchao/quantization/quantize_/workflows/__init__.py+2
- torchao/quantization/quantize_/workflows/float8/float8_tensor.py+29-7
- torchao/quantization/quantize_/workflows/int4/int4_tile_packed_to_4d_tensor.py+23-5
- torchao/quantization/quantize_/workflows/intx/intx_choose_qparams_algorithm.py+23
- torchao/quantization/quantize_/workflows/intx/intx_unpacked_to_int8_tensor.py+47-13
- torchao/quantization/utils.py+45-1
- torchao/testing/utils.py+19-1
- torchao/utils.py+2-4
0 commit comments