File tree Expand file tree Collapse file tree 1 file changed +2
-2
lines changed Expand file tree Collapse file tree 1 file changed +2
-2
lines changed Original file line number Diff line number Diff line change @@ -754,9 +754,9 @@ template <int mmq_y, bool need_check> static __device__ __forceinline__ void loa
754754 const block_mxfp4 * bxi = (const block_mxfp4 *) x + kbx0 + i*stride + kbxd;
755755
756756#if defined(AMD_MFMA_AVAILABLE) || defined(NEW_MMA_AVAILABLE)
757- x_df[i*MMQ_MMA_TILE_X_K_Q8_1 + kbxd] = __bfloat162float ( ggml_cuda_e8m0_to_fp32 (bxi->e ) )*0 .5f ;
757+ x_df[i*MMQ_MMA_TILE_X_K_Q8_1 + kbxd] = ggml_cuda_e8m0_to_fp32 (bxi->e )*0 .5f ;
758758#else
759- x_df[i*(MMQ_TILE_NE_K/QI_MXFP4) + i/QI_MXFP4 + kbxd] = __bfloat162float ( ggml_cuda_e8m0_to_fp32 (bxi->e ) )*0 .5f ;
759+ x_df[i*(MMQ_TILE_NE_K/QI_MXFP4) + i/QI_MXFP4 + kbxd] = ggml_cuda_e8m0_to_fp32 (bxi->e )*0 .5f ;
760760#endif // defined(AMD_MFMA_AVAILABLE) || defined(NEW_MMA_AVAILABLE)
761761 }
762762}
You can’t perform that action at this time.
0 commit comments