We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 2d42fc6, commit 6f04692 (Copy full SHA for 6f04692)
paddlenlp/transformers/fp8_utils.py
@@ -89,7 +89,7 @@ def padding_and_quant_input(tensor):
89
return tensor_fp8, tensor_scale, tensor_t_fp8, tensor_t_scale
90
91
@staticmethod
92
- def kitchen_fp8_gemm(
+ def kitchen_gemm(
93
x_fp8, x_scale, w_fp8, w_scale, is_a_1d_scaled, is_b_1d_scaled, out=None, rtn_dtype=paddle.bfloat16
94
):
95
if USE_DS_GEMM:
0 commit comments