@@ -1245,47 +1245,56 @@ v_mul_dx9_zero_f32 v5, v1, v2 row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:
12451245v_mul_dx9_zero_f32 v255, -|v255|, -|v255| row_xmask:15 row_mask:0x3 bank_mask:0x0 bound_ctrl:0 fi:1
12461246// GFX11: v_mul_dx9_zero_f32_dpp v255, -|v255|, -|v255| row_xmask:15 row_mask:0x3 bank_mask:0x0 fi:1 ; encoding: [0xfa,0xfe,0xff,0x0f,0xff,0x6f,0xf5,0x30]
12471247
1248- v_mul_f16 v5, v1, v2 quad_perm:[3 ,2 ,1 ,0 ]
1249- // GFX11: v_mul_f16_dpp v5, v1, v2 quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0x1b,0x00,0xff]
1248+ v_mul_f16 v5.l , v1.l , v2.l quad_perm:[3 ,2 ,1 ,0 ]
1249+ // GFX11: v_mul_f16_dpp v5.l , v1.l , v2.l quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0x1b,0x00,0xff]
12501250
1251- v_mul_f16 v5, v1, v2 quad_perm:[0 ,1 ,2 ,3 ]
1252- // GFX11: v_mul_f16_dpp v5, v1, v2 quad_perm:[0 ,1 ,2 ,3 ] row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0xe4,0x00,0xff]
1251+ v_mul_f16 v5.l , v1.l , v2.l quad_perm:[0 ,1 ,2 ,3 ]
1252+ // GFX11: v_mul_f16_dpp v5.l , v1.l , v2.l quad_perm:[0 ,1 ,2 ,3 ] row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0xe4,0x00,0xff]
12531253
1254- v_mul_f16 v5, v1, v2 row_mirror
1255- // GFX11: v_mul_f16_dpp v5, v1, v2 row_mirror row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0x40,0x01,0xff]
1254+ v_mul_f16 v5.l , v1.l , v2.l row_mirror
1255+ // GFX11: v_mul_f16_dpp v5.l , v1.l , v2.l row_mirror row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0x40,0x01,0xff]
12561256
1257- v_mul_f16 v5, v1, v2 row_half_mirror
1258- // GFX11: v_mul_f16_dpp v5, v1, v2 row_half_mirror row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0x41,0x01,0xff]
1257+ v_mul_f16 v5.l , v1.l , v2.l row_half_mirror
1258+ // GFX11: v_mul_f16_dpp v5.l , v1.l , v2.l row_half_mirror row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0x41,0x01,0xff]
12591259
1260- v_mul_f16 v5, v1, v2 row_shl:1
1261- // GFX11: v_mul_f16_dpp v5, v1, v2 row_shl:1 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0x01,0x01,0xff]
1260+ v_mul_f16 v5.l , v1.l , v2.l row_shl:1
1261+ // GFX11: v_mul_f16_dpp v5.l , v1.l , v2.l row_shl:1 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0x01,0x01,0xff]
12621262
1263- v_mul_f16 v5, v1, v2 row_shl:15
1264- // GFX11: v_mul_f16_dpp v5, v1, v2 row_shl:15 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0x0f,0x01,0xff]
1263+ v_mul_f16 v5.l , v1.l , v2.l row_shl:15
1264+ // GFX11: v_mul_f16_dpp v5.l , v1.l , v2.l row_shl:15 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0x0f,0x01,0xff]
12651265
1266- v_mul_f16 v5, v1, v2 row_shr:1
1267- // GFX11: v_mul_f16_dpp v5, v1, v2 row_shr:1 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0x11,0x01,0xff]
1266+ v_mul_f16 v5.l , v1.l , v2.l row_shr:1
1267+ // GFX11: v_mul_f16_dpp v5.l , v1.l , v2.l row_shr:1 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0x11,0x01,0xff]
12681268
1269- v_mul_f16 v5, v1, v2 row_shr:15
1270- // GFX11: v_mul_f16_dpp v5, v1, v2 row_shr:15 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0x1f,0x01,0xff]
1269+ v_mul_f16 v5.l , v1.l , v2.l row_shr:15
1270+ // GFX11: v_mul_f16_dpp v5.l , v1.l , v2.l row_shr:15 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0x1f,0x01,0xff]
12711271
1272- v_mul_f16 v5, v1, v2 row_ror:1
1273- // GFX11: v_mul_f16_dpp v5, v1, v2 row_ror:1 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0x21,0x01,0xff]
1272+ v_mul_f16 v5.l , v1.l , v2.l row_ror:1
1273+ // GFX11: v_mul_f16_dpp v5.l , v1.l , v2.l row_ror:1 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0x21,0x01,0xff]
12741274
1275- v_mul_f16 v5, v1, v2 row_ror:15
1276- // GFX11: v_mul_f16_dpp v5, v1, v2 row_ror:15 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0x2f,0x01,0xff]
1275+ v_mul_f16 v5.l , v1.l , v2.l row_ror:15
1276+ // GFX11: v_mul_f16_dpp v5.l , v1.l , v2.l row_ror:15 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0x2f,0x01,0xff]
12771277
1278- v_mul_f16 v5, v1, v2 row_share:0 row_mask:0xf bank_mask:0xf
1279- // GFX11: v_mul_f16_dpp v5, v1, v2 row_share:0 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0x50,0x01,0xff]
1278+ v_mul_f16 v5.l , v1.l , v2.l row_share:0 row_mask:0xf bank_mask:0xf
1279+ // GFX11: v_mul_f16_dpp v5.l , v1.l , v2.l row_share:0 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0x50,0x01,0xff]
12801280
1281- v_mul_f16 v5, v1, v2 row_share:15 row_mask:0x0 bank_mask:0x1
1282- // GFX11: v_mul_f16_dpp v5, v1, v2 row_share:15 row_mask:0x0 bank_mask:0x1 ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0x5f,0x01,0x01]
1281+ v_mul_f16 v5.l , v1.l , v2.l row_share:15 row_mask:0x0 bank_mask:0x1
1282+ // GFX11: v_mul_f16_dpp v5.l , v1.l , v2.l row_share:15 row_mask:0x0 bank_mask:0x1 ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0x5f,0x01,0x01]
12831283
1284- v_mul_f16 v5, v1, v2 row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 fi: 0
1285- // GFX11: v_mul_f16_dpp v5, v1, v2 row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0x60,0x09,0x13]
1284+ v_mul_f16 v5.l , v1.l , v2.l row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1
1285+ // GFX11: v_mul_f16_dpp v5.l , v1.l , v2.l row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 ; encoding: [0xfa,0x04,0x0a,0x6a,0x01,0x60,0x09,0x13]
12861286
1287- v_mul_f16 v127, -|v127|, -|v127| row_xmask:15 row_mask:0x3 bank_mask:0x0 bound_ctrl:0 fi:1
1288- // GFX11: v_mul_f16_dpp v127, -|v127|, -|v127| row_xmask:15 row_mask:0x3 bank_mask:0x0 fi:1 ; encoding: [0xfa,0xfe,0xfe,0x6a,0x7f,0x6f,0xf5,0x30]
1287+ v_mul_f16 v127.l, -|v127.l|, -|v127.l| row_xmask:15 row_mask:0x3 bank_mask:0x0 fi:1
1288+ // GFX11: v_mul_f16_dpp v127.l, -|v127.l|, -|v127.l| row_xmask:15 row_mask:0x3 bank_mask:0x0 fi:1 ; encoding: [0xfa,0xfe,0xfe,0x6a,0x7f,0x6f,0xf5,0x30]
1289+
1290+ v_mul_f16 v127.l, v127.l, v127.l row_share:15 row_mask:0x0 bank_mask:0x1
1291+ // GFX11: v_mul_f16_dpp v127.l, v127.l, v127.l row_share:15 row_mask:0x0 bank_mask:0x1 ; encoding: [0xfa,0xfe,0xfe,0x6a,0x7f,0x5f,0x01,0x01]
1292+
1293+ v_mul_f16 v5.h, v1.h, v2.h row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 fi:0
1294+ // GFX11: v_mul_f16_dpp v5.h, v1.h, v2.h row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 ; encoding: [0xfa,0x04,0x0b,0x6b,0x81,0x60,0x09,0x13]
1295+
1296+ v_mul_f16 v127.h, -|v127.h|, -|v127.h| row_xmask:15 row_mask:0x3 bank_mask:0x0 bound_ctrl:0 fi:1
1297+ // GFX11: v_mul_f16_dpp v127.h, -|v127.h|, -|v127.h| row_xmask:15 row_mask:0x3 bank_mask:0x0 fi:1 ; encoding: [0xfa,0xfe,0xff,0x6b,0xff,0x6f,0xf5,0x30]
12891298
12901299v_mul_f32 v5, v1, v2 quad_perm:[3 ,2 ,1 ,0 ]
12911300// GFX11: v_mul_f32_dpp v5, v1, v2 quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0x04,0x0a,0x10,0x01,0x1b,0x00,0xff]
0 commit comments