Skip to content

Commit 1ea3769

Browse files
committed
fix hip build
ggml-ci
1 parent a3b291e commit 1ea3769

File tree

1 file changed: 2 additions and 2 deletions.

ggml/src/ggml-cuda/mmq.cuh

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -754,9 +754,9 @@ template <int mmq_y, bool need_check> static __device__ __forceinline__ void loa
754 754
const block_mxfp4 * bxi = (const block_mxfp4 *) x + kbx0 + i*stride + kbxd;
755 755

756 756
#if defined(AMD_MFMA_AVAILABLE) || defined(NEW_MMA_AVAILABLE)
757-
x_df[i*MMQ_MMA_TILE_X_K_Q8_1 + kbxd] = __bfloat162float(ggml_cuda_e8m0_to_fp32(bxi->e))*0.5f;
757+
x_df[i*MMQ_MMA_TILE_X_K_Q8_1 + kbxd] = ggml_cuda_e8m0_to_fp32(bxi->e)*0.5f;
758 758
#else
759-
x_df[i*(MMQ_TILE_NE_K/QI_MXFP4) + i/QI_MXFP4 + kbxd] = __bfloat162float(ggml_cuda_e8m0_to_fp32(bxi->e))*0.5f;
759+
x_df[i*(MMQ_TILE_NE_K/QI_MXFP4) + i/QI_MXFP4 + kbxd] = ggml_cuda_e8m0_to_fp32(bxi->e)*0.5f;
760 760
#endif // defined(AMD_MFMA_AVAILABLE) || defined(NEW_MMA_AVAILABLE)
761 761
}
762 762
}

0 commit comments

Comments
 (0)