@@ -1239,37 +1239,37 @@ v_cvt_pk_bf8_f32_e64_dpp v1.l, -v2, |v3| quad_perm:[3,2,1,0] row_mask:0xe bank_m
1239
1239
// GFX12: v_cvt_pk_bf8_f32_e64_dpp v1.l, -v2, |v3| quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xe bank_mask:0xd fi:1 ; encoding: [0x01,0x02,0x6a,0xd7,0xfa,0x06,0x02,0x20,0x02,0x1b,0x04,0xed]
1240
1240
1241
1241
v_cvt_pk_fp8_f32_e64_dpp v1.l, -v2, |v3| quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xe bank_mask:0xd
1242
- // GFX1200 : v_cvt_pk_fp8_f32_e64_dpp v1.l, -v2, |v3| quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xe bank_mask:0xd ; encoding: [0x01,0x02,0x69,0xd7,0xfa,0x06,0x02,0x20,0x02,0x1b,0x00,0xed]
1242
+ // GFX12 : v_cvt_pk_fp8_f32_e64_dpp v1.l, -v2, |v3| quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xe bank_mask:0xd ; encoding: [0x01,0x02,0x69,0xd7,0xfa,0x06,0x02,0x20,0x02,0x1b,0x00,0xed]
1243
1243
1244
1244
v_cvt_pk_fp8_f32_e64_dpp v255.h, -v2, |v3| quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xe bank_mask:0xd
1245
- // GFX1200 : v_cvt_pk_fp8_f32_e64_dpp v255.h, -v2, |v3| op_sel:[0 ,0 ,1 ] quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xe bank_mask:0xd ; encoding: [0xff,0x42,0x69,0xd7,0xfa,0x06,0x02,0x20,0x02,0x1b,0x00,0xed]
1245
+ // GFX12 : v_cvt_pk_fp8_f32_e64_dpp v255.h, -v2, |v3| op_sel:[0 ,0 ,1 ] quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xe bank_mask:0xd ; encoding: [0xff,0x42,0x69,0xd7,0xfa,0x06,0x02,0x20,0x02,0x1b,0x00,0xed]
1246
1246
1247
1247
v_cvt_pk_fp8_f32_e64_dpp v1.l, -v2, |v3| quad_perm:[0 ,1 ,2 ,3 ]
1248
- // GFX1200 : v_cvt_pk_fp8_f32_e64_dpp v1.l, -v2, |v3| quad_perm:[0 ,1 ,2 ,3 ] row_mask:0xf bank_mask:0xf ; encoding: [0x01,0x02,0x69,0xd7,0xfa,0x06,0x02,0x20,0x02,0xe4,0x00,0xff]
1248
+ // GFX12 : v_cvt_pk_fp8_f32_e64_dpp v1.l, -v2, |v3| quad_perm:[0 ,1 ,2 ,3 ] row_mask:0xf bank_mask:0xf ; encoding: [0x01,0x02,0x69,0xd7,0xfa,0x06,0x02,0x20,0x02,0xe4,0x00,0xff]
1249
1249
1250
1250
v_cvt_pk_fp8_f32_e64_dpp v6.l, -v2, |v3| quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xe bank_mask:0xd
1251
- // GFX1200 : v_cvt_pk_fp8_f32_e64_dpp v6.l, -v2, |v3| quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xe bank_mask:0xd ; encoding: [0x06,0x02,0x69,0xd7,0xfa,0x06,0x02,0x20,0x02,0x1b,0x00,0xed]
1251
+ // GFX12 : v_cvt_pk_fp8_f32_e64_dpp v6.l, -v2, |v3| quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xe bank_mask:0xd ; encoding: [0x06,0x02,0x69,0xd7,0xfa,0x06,0x02,0x20,0x02,0x1b,0x00,0xed]
1252
1252
1253
1253
v_cvt_pk_fp8_f32_e64_dpp v1.l, -v6, |v3| quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xe bank_mask:0xd
1254
- // GFX1200 : v_cvt_pk_fp8_f32_e64_dpp v1.l, -v6, |v3| quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xe bank_mask:0xd ; encoding: [0x01,0x02,0x69,0xd7,0xfa,0x06,0x02,0x20,0x06,0x1b,0x00,0xed]
1254
+ // GFX12 : v_cvt_pk_fp8_f32_e64_dpp v1.l, -v6, |v3| quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xe bank_mask:0xd ; encoding: [0x01,0x02,0x69,0xd7,0xfa,0x06,0x02,0x20,0x06,0x1b,0x00,0xed]
1255
1255
1256
1256
v_cvt_pk_fp8_f32_e64_dpp v1.l, -v2, |v255| quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xe bank_mask:0xd
1257
- // GFX1200 : v_cvt_pk_fp8_f32_e64_dpp v1.l, -v2, |v255| quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xe bank_mask:0xd ; encoding: [0x01,0x02,0x69,0xd7,0xfa,0xfe,0x03,0x20,0x02,0x1b,0x00,0xed]
1257
+ // GFX12 : v_cvt_pk_fp8_f32_e64_dpp v1.l, -v2, |v255| quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xe bank_mask:0xd ; encoding: [0x01,0x02,0x69,0xd7,0xfa,0xfe,0x03,0x20,0x02,0x1b,0x00,0xed]
1258
1258
1259
1259
v_cvt_pk_fp8_f32_e64_dpp v1.l, -v2, |v3| quad_perm:[0 ,2 ,1 ,3 ] row_mask:0xe bank_mask:0xd
1260
- // GFX1200 : v_cvt_pk_fp8_f32_e64_dpp v1.l, -v2, |v3| quad_perm:[0 ,2 ,1 ,3 ] row_mask:0xe bank_mask:0xd ; encoding: [0x01,0x02,0x69,0xd7,0xfa,0x06,0x02,0x20,0x02,0xd8,0x00,0xed]
1260
+ // GFX12 : v_cvt_pk_fp8_f32_e64_dpp v1.l, -v2, |v3| quad_perm:[0 ,2 ,1 ,3 ] row_mask:0xe bank_mask:0xd ; encoding: [0x01,0x02,0x69,0xd7,0xfa,0x06,0x02,0x20,0x02,0xd8,0x00,0xed]
1261
1261
1262
1262
v_cvt_pk_fp8_f32_e64_dpp v1.l, -v2, |v3| quad_perm:[3 ,2 ,1 ,0 ] row_mask:0x2 bank_mask:0xd
1263
- // GFX1200 : v_cvt_pk_fp8_f32_e64_dpp v1.l, -v2, |v3| quad_perm:[3 ,2 ,1 ,0 ] row_mask:0x2 bank_mask:0xd ; encoding: [0x01,0x02,0x69,0xd7,0xfa,0x06,0x02,0x20,0x02,0x1b,0x00,0x2d]
1263
+ // GFX12 : v_cvt_pk_fp8_f32_e64_dpp v1.l, -v2, |v3| quad_perm:[3 ,2 ,1 ,0 ] row_mask:0x2 bank_mask:0xd ; encoding: [0x01,0x02,0x69,0xd7,0xfa,0x06,0x02,0x20,0x02,0x1b,0x00,0x2d]
1264
1264
1265
1265
v_cvt_pk_fp8_f32_e64_dpp v1.l, -v2, |v3| quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xe bank_mask:0x5
1266
- // GFX1200 : v_cvt_pk_fp8_f32_e64_dpp v1.l, -v2, |v3| quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xe bank_mask:0x5 ; encoding: [0x01,0x02,0x69,0xd7,0xfa,0x06,0x02,0x20,0x02,0x1b,0x00,0xe5]
1266
+ // GFX12 : v_cvt_pk_fp8_f32_e64_dpp v1.l, -v2, |v3| quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xe bank_mask:0x5 ; encoding: [0x01,0x02,0x69,0xd7,0xfa,0x06,0x02,0x20,0x02,0x1b,0x00,0xe5]
1267
1267
1268
1268
v_cvt_pk_fp8_f32_e64_dpp v1.l, -v2, |v3| quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xe bank_mask:0xd fi:1
1269
- // GFX1200 : v_cvt_pk_fp8_f32_e64_dpp v1.l, -v2, |v3| quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xe bank_mask:0xd fi:1 ; encoding: [0x01,0x02,0x69,0xd7,0xfa,0x06,0x02,0x20,0x02,0x1b,0x04,0xed]
1269
+ // GFX12 : v_cvt_pk_fp8_f32_e64_dpp v1.l, -v2, |v3| quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xe bank_mask:0xd fi:1 ; encoding: [0x01,0x02,0x69,0xd7,0xfa,0x06,0x02,0x20,0x02,0x1b,0x04,0xed]
1270
1270
1271
1271
v_cvt_pk_fp8_f32_e64_dpp v255.h, -v2, |v3| quad_perm:[0 ,1 ,2 ,3 ]
1272
- // GFX1200 : v_cvt_pk_fp8_f32_e64_dpp v255.h, -v2, |v3| op_sel:[0 ,0 ,1 ] quad_perm:[0 ,1 ,2 ,3 ] row_mask:0xf bank_mask:0xf ; encoding: [0xff,0x42,0x69,0xd7,0xfa,0x06,0x02,0x20,0x02,0xe4,0x00,0xff]
1272
+ // GFX12 : v_cvt_pk_fp8_f32_e64_dpp v255.h, -v2, |v3| op_sel:[0 ,0 ,1 ] quad_perm:[0 ,1 ,2 ,3 ] row_mask:0xf bank_mask:0xf ; encoding: [0xff,0x42,0x69,0xd7,0xfa,0x06,0x02,0x20,0x02,0xe4,0x00,0xff]
1273
1273
1274
1274
v_cvt_sr_bf8_f32_e64_dpp v1, -v2, v3 quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xe bank_mask:0xd
1275
1275
// GFX12: v_cvt_sr_bf8_f32_e64_dpp v1, -v2, v3 quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xe bank_mask:0xd ; encoding: [0x01,0x00,0x6c,0xd7,0xfa,0x06,0x02,0x20,0x02,0x1b,0x00,0xed]
0 commit comments