File tree Expand file tree Collapse file tree 4 files changed +4
-2
lines changed
Expand file tree Collapse file tree 4 files changed +4
-2
lines changed File renamed without changes.
File renamed without changes.
@@ -4,10 +4,11 @@ scheme: NVFP4
 dataset_id: HuggingFaceH4/ultrachat_200k
 dataset_split: train_sft
 num_calibration_samples: 20
-recipe: tests/e2e/vLLM/recipes/actorder/recipe_awq_nvfp4.yaml
+recipe: tests/e2e/vLLM/recipes/NVFP4/recipe_awq_nvfp4.yaml
 lmeval:
   # NVFP4 (4-bit weights + 4-bit activations) has lower recovery than FP8/INT8
   # Observed: strict-match ~92.81%, flexible-extract ~89.59%
+  # TODO: check if recovery is consistent - 0.65 is too low for 0.94 recovery
   recovery_threshold:
     exact_match,strict-match: 0.92
     exact_match,flexible-extract: 0.88
@@ -4,10 +4,11 @@ scheme: NVFP4
 dataset_id: HuggingFaceH4/ultrachat_200k
 dataset_split: train_sft
 num_calibration_samples: 20
-recipe: tests/e2e/vLLM/recipes/actorder/recipe_awq_nvfp4a16.yaml
+recipe: tests/e2e/vLLM/recipes/NVFP4/recipe_awq_nvfp4a16.yaml
 lmeval:
   # NVFP4 (4-bit weights + 4-bit activations) has lower recovery than FP8/INT8
   # Observed: strict-match ~92.81%, flexible-extract ~89.59%
+  # TODO: check if recovery is consistent - 0.65 is too low for 0.94 recovery
   recovery_threshold:
     exact_match,strict-match: 0.95
     exact_match,flexible-extract: 0.94
You can’t perform that action at this time.
0 commit comments