@@ -37,8 +37,8 @@ cvtScalePkUpcastFromFp8(Location loc, ConversionPatternRewriter &rewriter,
3737
3838 auto resType = i32_ty;
3939 auto dstType = f32_ty;
40- if constexpr (std::is_same_v<convertOp, ROCDL::CvtScale32PkF32Fp8 > ||
41- std::is_same_v<convertOp, ROCDL::CvtScale32PkF32Bf8 >) {
40+ if constexpr (std::is_same_v<convertOp, ROCDL::CvtScaleF32PkF32Fp8Op > ||
41+ std::is_same_v<convertOp, ROCDL::CvtScaleF32PkF32Bf8Op >) {
4242 resType = i64_ty;
4343 dstType = f32_ty;
4444 } else {
@@ -70,8 +70,8 @@ cvtScalePkDowncastToFp8(Location loc, ConversionPatternRewriter &rewriter,
7070 Value select = b.false_val ();
7171
7272 Value result;
73- if constexpr (std::is_same_v<convertOp, ROCDL::CvtScaleF32PkFp8F32 > ||
74- std::is_same_v<convertOp, ROCDL::CvtScaleF32PkBf8F32 >) {
73+ if constexpr (std::is_same_v<convertOp, ROCDL::CvtScaleF32PkFp8F32Op > ||
74+ std::is_same_v<convertOp, ROCDL::CvtScaleF32PkBf8F32Op >) {
7575 result = rewriter.create <convertOp>(loc, v2I16Ty, v2I16Vec, v0, v1, scale,
7676 select);
7777 } else {
@@ -134,8 +134,8 @@ static SmallVector<Value>
134134Fp16_to_Fp8E5M2_RTNE_HW (Location loc, ConversionPatternRewriter &rewriter,
135135 const SmallVector<Value> &v) {
136136 assert (v.size () == 2 );
137- return cvtScalePkDowncastToFp8<ROCDL::CvtScaleF32PkBf8F16 >(loc, rewriter,
138- v[0 ], v[1 ]);
137+ return cvtScalePkDowncastToFp8<ROCDL::CvtScaleF32PkBf8F16Op >(loc, rewriter,
138+ v[0 ], v[1 ]);
139139}
140140
141141ConverterT Fp16_to_Fp8E5M2_RTNE (AMD::ISAFamily isaFamily) {
@@ -270,8 +270,8 @@ static SmallVector<Value>
270270Fp16_to_Fp8E4M3FN_RTNE_HW (Location loc, ConversionPatternRewriter &rewriter,
271271 const SmallVector<Value> &v) {
272272 assert (v.size () == 2 );
273- return cvtScalePkDowncastToFp8<ROCDL::CvtScaleF32PkFp8F16 >(loc, rewriter,
274- v[0 ], v[1 ]);
273+ return cvtScalePkDowncastToFp8<ROCDL::CvtScaleF32PkFp8F16Op >(loc, rewriter,
274+ v[0 ], v[1 ]);
275275}
276276
277277ConverterT Fp16_to_Fp8E4M3FN_RTNE (AMD::ISAFamily isaFamily) {
@@ -378,35 +378,35 @@ static SmallVector<Value> Fp8E4M3FN_to_Fp32(Location loc,
378378 ConversionPatternRewriter &rewriter,
379379 const SmallVector<Value> &v) {
380380 assert (v.size () == 2 );
381- return cvtScalePkUpcastFromFp8<ROCDL::CvtScale32PkF32Fp8 >(loc, rewriter, v[ 0 ] ,
382- v[1 ]);
381+ return cvtScalePkUpcastFromFp8<ROCDL::CvtScaleF32PkF32Fp8Op >(loc, rewriter,
382+ v[ 0 ], v[1 ]);
383383}
384384
385385// Convert OCP Bf8 to Fp32 on CDNA4
// NOTE: this span is a rendered diff; the leading numbers and the `-`/`+`
// markers are part of the captured text, not of the C++ source.
// The function asserts that `v` holds exactly two values and returns the
// result of cvtScalePkUpcastFromFp8 called with loc, rewriter, v[0] and v[1].
// The `-`/`+` pair below changes only the template argument
// (ROCDL::CvtScale32PkF32Bf8 -> ROCDL::CvtScaleF32PkF32Bf8Op) and re-wraps
// the argument list; the arguments themselves are unchanged.
386386static SmallVector<Value> Fp8E5M2_to_Fp32 (Location loc,
387387 ConversionPatternRewriter &rewriter,
388388 const SmallVector<Value> &v) {
389389 assert (v.size () == 2 );
390- return cvtScalePkUpcastFromFp8<ROCDL::CvtScale32PkF32Bf8 >(loc, rewriter, v[ 0 ] ,
391- v[1 ]);
390+ return cvtScalePkUpcastFromFp8<ROCDL::CvtScaleF32PkF32Bf8Op >(loc, rewriter,
391+ v[ 0 ], v[1 ]);
392392}
393393
394394// Convert Fp32 to OCP Fp8 on CDNA4
// NOTE: this span is a rendered diff; the leading numbers and the `-`/`+`
// markers are part of the captured text, not of the C++ source.
// The function asserts that `v` holds exactly two values and returns the
// result of cvtScalePkDowncastToFp8 called with loc, rewriter, v[0] and v[1].
// The `-`/`+` pair below changes only the template argument
// (ROCDL::CvtScaleF32PkFp8F32 -> ROCDL::CvtScaleF32PkFp8F32Op); the call
// arguments are unchanged.
395395static SmallVector<Value> Fp32_to_Fp8E4M3FN (Location loc,
396396 ConversionPatternRewriter &rewriter,
397397 const SmallVector<Value> &v) {
398398 assert (v.size () == 2 );
399- return cvtScalePkDowncastToFp8<ROCDL::CvtScaleF32PkFp8F32 >(loc, rewriter,
400- v[0 ], v[1 ]);
399+ return cvtScalePkDowncastToFp8<ROCDL::CvtScaleF32PkFp8F32Op >(loc, rewriter,
400+ v[0 ], v[1 ]);
401401}
402402
403403// Convert Fp32 to OCP Bf8 on CDNA4
// NOTE: this span is a rendered diff; the leading numbers and the `-`/`+`
// markers are part of the captured text, not of the C++ source.
// The function asserts that `v` holds exactly two values and returns the
// result of cvtScalePkDowncastToFp8 called with loc, rewriter, v[0] and v[1].
// The `-`/`+` pair below changes only the template argument
// (ROCDL::CvtScaleF32PkBf8F32 -> ROCDL::CvtScaleF32PkBf8F32Op); the call
// arguments are unchanged.
404404static SmallVector<Value> Fp32_to_Fp8E5M2 (Location loc,
405405 ConversionPatternRewriter &rewriter,
406406 const SmallVector<Value> &v) {
407407 assert (v.size () == 2 );
408- return cvtScalePkDowncastToFp8<ROCDL::CvtScaleF32PkBf8F32 >(loc, rewriter,
409- v[0 ], v[1 ]);
408+ return cvtScalePkDowncastToFp8<ROCDL::CvtScaleF32PkBf8F32Op >(loc, rewriter,
409+ v[0 ], v[1 ]);
410410}
411411
412412// Fp32 -> Nanoo Bf8 on CDNA3
@@ -549,8 +549,8 @@ static SmallVector<Value>
549549Fp8E4M3FN_to_Fp16_HW (Location loc, ConversionPatternRewriter &rewriter,
550550 const SmallVector<Value> &v) {
551551 assert (v.size () == 2 );
552- return cvtScalePkUpcastFromFp8<ROCDL::CvtScaleF32PkF16Fp8 >(loc, rewriter,
553- v[0 ], v[1 ]);
552+ return cvtScalePkUpcastFromFp8<ROCDL::CvtScaleF32PkF16Fp8Op >(loc, rewriter,
553+ v[0 ], v[1 ]);
554554}
555555
556556ConverterT Fp8E4M3FN_to_Fp16 (AMD::ISAFamily isaFamily) {
@@ -591,8 +591,8 @@ static SmallVector<Value>
591591Fp8E5M2_to_Fp16_HW (Location loc, ConversionPatternRewriter &rewriter,
592592 const SmallVector<Value> &v) {
593593 assert (v.size () == 2 );
594- return cvtScalePkUpcastFromFp8<ROCDL::CvtScaleF32PkF16Bf8 >(loc, rewriter,
595- v[0 ], v[1 ]);
594+ return cvtScalePkUpcastFromFp8<ROCDL::CvtScaleF32PkF16Bf8Op >(loc, rewriter,
595+ v[0 ], v[1 ]);
596596}
597597
598598ConverterT Fp8E5M2_to_Fp16 (AMD::ISAFamily isaFamily) {
@@ -851,8 +851,8 @@ static SmallVector<Value>
851851Bf16_to_Fp8E5M2_HW (Location loc, ConversionPatternRewriter &rewriter,
852852 const SmallVector<Value> &v) {
853853 assert (v.size () == 2 );
854- return cvtScalePkDowncastToFp8<ROCDL::CvtScaleF32PkBf8Bf16 >(loc, rewriter,
855- v[0 ], v[1 ]);
854+ return cvtScalePkDowncastToFp8<ROCDL::CvtScaleF32PkBf8Bf16Op >(loc, rewriter,
855+ v[0 ], v[1 ]);
856856}
857857
858858static ConverterT Bf16_to_Fp8E5M2 (AMD::ISAFamily isaFamily) {
@@ -864,8 +864,8 @@ static SmallVector<Value> Bf16_to_Fp8E4M3FN(Location loc,
864864 ConversionPatternRewriter &rewriter,
865865 const SmallVector<Value> &v) {
866866 assert (v.size () == 2 );
867- return cvtScalePkDowncastToFp8<ROCDL::CvtScaleF32PkFp8Bf16 >(loc, rewriter,
868- v[0 ], v[1 ]);
867+ return cvtScalePkDowncastToFp8<ROCDL::CvtScaleF32PkFp8Bf16Op >(loc, rewriter,
868+ v[0 ], v[1 ]);
869869}
870870
871871// fp8e4m3fn to bf16
0 commit comments