@@ -221,58 +221,58 @@ func.func @scaled_ext_scalar_f4e2m1_bf16(%v: vector<2xf4E2M1FN>, %scale: f32) ->
221221 func.return %ret : vector <2 xbf16 >
222222}
223223
224- // CHECK-LABEL: func.func @scaled_ext_packed8_fp4
224+ // CHECK-LABEL: func.func @scaled_ext_packed8_fp4
225225func.func @scaled_ext_packed8_fp4 (%v: vector <8 xf4 E2 M1 FN>, %scale: f32 ) -> (vector <8 xf16 >, vector <8 xbf16 >, vector <8 xf32 >) {
226- // CHECK: amdgpu.scaled_ext_packed8
227- %ret0 = amdgpu.scaled_ext_packed8 %v , %scale [0 ] : vector <8 xf4 E2 M1 FN> to vector <8 xf16 >
228- // CHECK: amdgpu.scaled_ext_packed8
229- %ret1 = amdgpu.scaled_ext_packed8 %v , %scale [0 ] : vector <8 xf4 E2 M1 FN> to vector <8 xbf16 >
230- // CHECK: amdgpu.scaled_ext_packed8
231- %ret2 = amdgpu.scaled_ext_packed8 %v , %scale [0 ] : vector <8 xf4 E2 M1 FN> to vector <8 xf32 >
226+ // CHECK: amdgpu.scaled_ext_packed
227+ %ret0 = amdgpu.scaled_ext_packed %v , %scale [0 ] : vector <8 xf4 E2 M1 FN> to vector <8 xf16 >
228+ // CHECK: amdgpu.scaled_ext_packed
229+ %ret1 = amdgpu.scaled_ext_packed %v , %scale [0 ] : vector <8 xf4 E2 M1 FN> to vector <8 xbf16 >
230+ // CHECK: amdgpu.scaled_ext_packed
231+ %ret2 = amdgpu.scaled_ext_packed %v , %scale [0 ] : vector <8 xf4 E2 M1 FN> to vector <8 xf32 >
232232 func.return %ret0 , %ret1 , %ret2 : vector <8 xf16 >, vector <8 xbf16 >, vector <8 xf32 >
233233}
234234
235- // CHECK-LABEL: func.func @scaled_ext_packed8_fp8
235+ // CHECK-LABEL: func.func @scaled_ext_packed8_fp8
236236func.func @scaled_ext_packed8_fp8 (%v: vector <8 xf8 E4 M3 FN>, %scale: f32 ) -> (vector <8 xf16 >, vector <8 xbf16 >, vector <8 xf32 >) {
237- // CHECK: amdgpu.scaled_ext_packed8
238- %ret0 = amdgpu.scaled_ext_packed8 %v , %scale [0 ] : vector <8 xf8 E4 M3 FN> to vector <8 xf16 >
239- // CHECK: amdgpu.scaled_ext_packed8
240- %ret1 = amdgpu.scaled_ext_packed8 %v , %scale [0 ] : vector <8 xf8 E4 M3 FN> to vector <8 xbf16 >
241- // CHECK: amdgpu.scaled_ext_packed8
242- %ret2 = amdgpu.scaled_ext_packed8 %v , %scale [0 ] : vector <8 xf8 E4 M3 FN> to vector <8 xf32 >
237+ // CHECK: amdgpu.scaled_ext_packed
238+ %ret0 = amdgpu.scaled_ext_packed %v , %scale [0 ] : vector <8 xf8 E4 M3 FN> to vector <8 xf16 >
239+ // CHECK: amdgpu.scaled_ext_packed
240+ %ret1 = amdgpu.scaled_ext_packed %v , %scale [0 ] : vector <8 xf8 E4 M3 FN> to vector <8 xbf16 >
241+ // CHECK: amdgpu.scaled_ext_packed
242+ %ret2 = amdgpu.scaled_ext_packed %v , %scale [0 ] : vector <8 xf8 E4 M3 FN> to vector <8 xf32 >
243243 func.return %ret0 , %ret1 , %ret2 : vector <8 xf16 >, vector <8 xbf16 >, vector <8 xf32 >
244244}
245245
246- // CHECK-LABEL: func.func @scaled_ext_packed8_bf8
246+ // CHECK-LABEL: func.func @scaled_ext_packed8_bf8
247247func.func @scaled_ext_packed8_bf8 (%v: vector <8 xf8 E5 M2 >, %scale: f32 ) -> (vector <8 xf16 >, vector <8 xbf16 >, vector <8 xf32 >) {
248- // CHECK: amdgpu.scaled_ext_packed8
249- %ret0 = amdgpu.scaled_ext_packed8 %v , %scale [0 ] : vector <8 xf8 E5 M2 > to vector <8 xf16 >
250- // CHECK: amdgpu.scaled_ext_packed8
251- %ret1 = amdgpu.scaled_ext_packed8 %v , %scale [0 ] : vector <8 xf8 E5 M2 > to vector <8 xbf16 >
252- // CHECK: amdgpu.scaled_ext_packed8
253- %ret2 = amdgpu.scaled_ext_packed8 %v , %scale [0 ] : vector <8 xf8 E5 M2 > to vector <8 xf32 >
248+ // CHECK: amdgpu.scaled_ext_packed
249+ %ret0 = amdgpu.scaled_ext_packed %v , %scale [0 ] : vector <8 xf8 E5 M2 > to vector <8 xf16 >
250+ // CHECK: amdgpu.scaled_ext_packed
251+ %ret1 = amdgpu.scaled_ext_packed %v , %scale [0 ] : vector <8 xf8 E5 M2 > to vector <8 xbf16 >
252+ // CHECK: amdgpu.scaled_ext_packed
253+ %ret2 = amdgpu.scaled_ext_packed %v , %scale [0 ] : vector <8 xf8 E5 M2 > to vector <8 xf32 >
254254 func.return %ret0 , %ret1 , %ret2 : vector <8 xf16 >, vector <8 xbf16 >, vector <8 xf32 >
255255}
256256
257257// CHECK-LABEL: func.func @scaled_ext_packed16_fp6
258258func.func @scaled_ext_packed16_fp6 (%v: vector <16 xf6 E2 M3 FN>, %scale: f32 ) -> (vector <16 xf16 >, vector <16 xbf16 >, vector <16 xf32 >) {
259- // CHECK: amdgpu.scaled_ext_packed16
260- %ret0 = amdgpu.scaled_ext_packed16 %v , %scale [0 ] : vector <16 xf6 E2 M3 FN> to vector <16 xf16 >
261- // CHECK: amdgpu.scaled_ext_packed16
262- %ret1 = amdgpu.scaled_ext_packed16 %v , %scale [0 ] : vector <16 xf6 E2 M3 FN> to vector <16 xbf16 >
263- // CHECK: amdgpu.scaled_ext_packed16
264- %ret2 = amdgpu.scaled_ext_packed16 %v , %scale [0 ] : vector <16 xf6 E2 M3 FN> to vector <16 xf32 >
259+ // CHECK: amdgpu.scaled_ext_packed
260+ %ret0 = amdgpu.scaled_ext_packed %v , %scale [0 ] : vector <16 xf6 E2 M3 FN> to vector <16 xf16 >
261+ // CHECK: amdgpu.scaled_ext_packed
262+ %ret1 = amdgpu.scaled_ext_packed %v , %scale [0 ] : vector <16 xf6 E2 M3 FN> to vector <16 xbf16 >
263+ // CHECK: amdgpu.scaled_ext_packed
264+ %ret2 = amdgpu.scaled_ext_packed %v , %scale [0 ] : vector <16 xf6 E2 M3 FN> to vector <16 xf32 >
265265 func.return %ret0 , %ret1 , %ret2 : vector <16 xf16 >, vector <16 xbf16 >, vector <16 xf32 >
266266}
267267
268268// CHECK-LABEL: func.func @scaled_ext_packed16_bf16
269269func.func @scaled_ext_packed16_bf16 (%v: vector <16 xf6 E3 M2 FN>, %scale: f32 ) -> (vector <16 xf16 >, vector <16 xbf16 >, vector <16 xf32 >) {
270- // CHECK: amdgpu.scaled_ext_packed16
271- %ret0 = amdgpu.scaled_ext_packed16 %v , %scale [0 ] : vector <16 xf6 E3 M2 FN> to vector <16 xf16 >
272- // CHECK: amdgpu.scaled_ext_packed16
273- %ret1 = amdgpu.scaled_ext_packed16 %v , %scale [0 ] : vector <16 xf6 E3 M2 FN> to vector <16 xbf16 >
274- // CHECK: amdgpu.scaled_ext_packed16
275- %ret2 = amdgpu.scaled_ext_packed16 %v , %scale [0 ] : vector <16 xf6 E3 M2 FN> to vector <16 xf32 >
270+ // CHECK: amdgpu.scaled_ext_packed
271+ %ret0 = amdgpu.scaled_ext_packed %v , %scale [0 ] : vector <16 xf6 E3 M2 FN> to vector <16 xf16 >
272+ // CHECK: amdgpu.scaled_ext_packed
273+ %ret1 = amdgpu.scaled_ext_packed %v , %scale [0 ] : vector <16 xf6 E3 M2 FN> to vector <16 xbf16 >
274+ // CHECK: amdgpu.scaled_ext_packed
275+ %ret2 = amdgpu.scaled_ext_packed %v , %scale [0 ] : vector <16 xf6 E3 M2 FN> to vector <16 xf32 >
276276 func.return %ret0 , %ret1 , %ret2 : vector <16 xf16 >, vector <16 xbf16 >, vector <16 xf32 >
277277}
278278
0 commit comments