@@ -212,47 +212,56 @@ v_clz_i32_u32 v5, v1 row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 fi:0
212212v_clz_i32_u32 v255, v255 row_xmask:15 row_mask:0x3 bank_mask:0x0 bound_ctrl:0 fi:1
213213// GFX11: v_clz_i32_u32_dpp v255, v255 row_xmask:15 row_mask:0x3 bank_mask:0x0 fi:1 ; encoding: [0xfa,0x72,0xfe,0x7f,0xff,0x6f,0x05,0x30]
214214
// v_cos_f16 DPP16 cases. Each case is a pair: an input instruction line
// followed by a "GFX11:" check line giving the expected printed form
// (v_cos_f16_dpp ...) and the expected 8-byte encoding.
// In this hunk the '-' pairs use plain v5/v1/v127 operands and the '+' pairs
// use the same registers with a .l suffix; the expected encoding bytes are
// identical between each '-' pair and its '+' replacement.
// NOTE(review): .l/.h presumably select the low/high 16-bit half of the
// VGPR -- confirm against the AMDGPU assembler documentation.
215- v_cos_f16 v5, v1 quad_perm:[3 ,2 ,1 ,0 ]
216- // GFX11: v_cos_f16_dpp v5, v1 quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x1b,0x00,0xff]
215+ v_cos_f16 v5.l , v1.l quad_perm:[3 ,2 ,1 ,0 ]
216+ // GFX11: v_cos_f16_dpp v5.l , v1.l quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x1b,0x00,0xff]
217217
218- v_cos_f16 v5, v1 quad_perm:[0 ,1 ,2 ,3 ]
219- // GFX11: v_cos_f16_dpp v5, v1 quad_perm:[0 ,1 ,2 ,3 ] row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0xe4,0x00,0xff]
218+ v_cos_f16 v5.l , v1.l quad_perm:[0 ,1 ,2 ,3 ]
219+ // GFX11: v_cos_f16_dpp v5.l , v1.l quad_perm:[0 ,1 ,2 ,3 ] row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0xe4,0x00,0xff]
220220
221- v_cos_f16 v5, v1 row_mirror
222- // GFX11: v_cos_f16_dpp v5, v1 row_mirror row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x40,0x01,0xff]
221+ v_cos_f16 v5.l , v1.l row_mirror
222+ // GFX11: v_cos_f16_dpp v5.l , v1.l row_mirror row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x40,0x01,0xff]
223223
224- v_cos_f16 v5, v1 row_half_mirror
225- // GFX11: v_cos_f16_dpp v5, v1 row_half_mirror row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x41,0x01,0xff]
224+ v_cos_f16 v5.l , v1.l row_half_mirror
225+ // GFX11: v_cos_f16_dpp v5.l , v1.l row_half_mirror row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x41,0x01,0xff]
226226
227- v_cos_f16 v5, v1 row_shl:1
228- // GFX11: v_cos_f16_dpp v5, v1 row_shl:1 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x01,0x01,0xff]
227+ v_cos_f16 v5.l , v1.l row_shl:1
228+ // GFX11: v_cos_f16_dpp v5.l , v1.l row_shl:1 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x01,0x01,0xff]
229229
230- v_cos_f16 v5, v1 row_shl:15
231- // GFX11: v_cos_f16_dpp v5, v1 row_shl:15 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x0f,0x01,0xff]
230+ v_cos_f16 v5.l , v1.l row_shl:15
231+ // GFX11: v_cos_f16_dpp v5.l , v1.l row_shl:15 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x0f,0x01,0xff]
232232
233- v_cos_f16 v5, v1 row_shr:1
234- // GFX11: v_cos_f16_dpp v5, v1 row_shr:1 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x11,0x01,0xff]
233+ v_cos_f16 v5.l , v1.l row_shr:1
234+ // GFX11: v_cos_f16_dpp v5.l , v1.l row_shr:1 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x11,0x01,0xff]
235235
236- v_cos_f16 v5, v1 row_shr:15
237- // GFX11: v_cos_f16_dpp v5, v1 row_shr:15 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x1f,0x01,0xff]
236+ v_cos_f16 v5.l , v1.l row_shr:15
237+ // GFX11: v_cos_f16_dpp v5.l , v1.l row_shr:15 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x1f,0x01,0xff]
238238
239- v_cos_f16 v5, v1 row_ror:1
240- // GFX11: v_cos_f16_dpp v5, v1 row_ror:1 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x21,0x01,0xff]
239+ v_cos_f16 v5.l , v1.l row_ror:1
240+ // GFX11: v_cos_f16_dpp v5.l , v1.l row_ror:1 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x21,0x01,0xff]
241241
242- v_cos_f16 v5, v1 row_ror:15
243- // GFX11: v_cos_f16_dpp v5, v1 row_ror:15 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x2f,0x01,0xff]
242+ v_cos_f16 v5.l , v1.l row_ror:15
243+ // GFX11: v_cos_f16_dpp v5.l , v1.l row_ror:15 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x2f,0x01,0xff]
244244
245- v_cos_f16 v5, v1 row_share:0 row_mask:0xf bank_mask:0xf
246- // GFX11: v_cos_f16_dpp v5, v1 row_share:0 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x50,0x01,0xff]
245+ v_cos_f16 v5.l , v1.l row_share:0 row_mask:0xf bank_mask:0xf
246+ // GFX11: v_cos_f16_dpp v5.l , v1.l row_share:0 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x50,0x01,0xff]
247247
248- v_cos_f16 v5, v1 row_share:15 row_mask:0x0 bank_mask:0x1
249- // GFX11: v_cos_f16_dpp v5, v1 row_share:15 row_mask:0x0 bank_mask:0x1 ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x5f,0x01,0x01]
248+ v_cos_f16 v5.l , v1.l row_share:15 row_mask:0x0 bank_mask:0x1
249+ // GFX11: v_cos_f16_dpp v5.l , v1.l row_share:15 row_mask:0x0 bank_mask:0x1 ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x5f,0x01,0x01]
250250
251- v_cos_f16 v5, v1 row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 fi: 0
252- // GFX11: v_cos_f16_dpp v5, v1 row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x60,0x09,0x13]
251+ v_cos_f16 v5.l , v1.l row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1
252+ // GFX11: v_cos_f16_dpp v5.l , v1.l row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x60,0x09,0x13]
253253
254- v_cos_f16 v127, -|v127| row_xmask:15 row_mask:0x3 bank_mask:0x0 bound_ctrl:0 fi:1
255- // GFX11: v_cos_f16_dpp v127, -|v127| row_xmask:15 row_mask:0x3 bank_mask:0x0 fi:1 ; encoding: [0xfa,0xc2,0xfe,0x7e,0x7f,0x6f,0x35,0x30]
254+ v_cos_f16 v127.l, -|v127.l| row_xmask:15 row_mask:0x3 bank_mask:0x0 fi:1
255+ // GFX11: v_cos_f16_dpp v127.l, -|v127.l| row_xmask:15 row_mask:0x3 bank_mask:0x0 fi:1 ; encoding: [0xfa,0xc2,0xfe,0x7e,0x7f,0x6f,0x35,0x30]
256+
// Cases added by this hunk (no '-' counterpart): one more .l case on v127
// without source modifiers, then two cases using .h-suffixed operands.
// Compared with the matching .l check lines above, the .h check lines expect
// 0x7f instead of 0x7e in the fourth encoding byte, and 0x81 / 0xff instead
// of 0x01 / 0x7f in the fifth. The check lines also do not print fi:0 or
// bound_ctrl:0 even where the input line spells them out.
257+ v_cos_f16 v127.l, v127.l row_share:15 row_mask:0x0 bank_mask:0x1
258+ // GFX11: v_cos_f16_dpp v127.l, v127.l row_share:15 row_mask:0x0 bank_mask:0x1 ; encoding: [0xfa,0xc2,0xfe,0x7e,0x7f,0x5f,0x01,0x01]
259+
260+ v_cos_f16 v5.h, v1.h row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 fi:0
261+ // GFX11: v_cos_f16_dpp v5.h, v1.h row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 ; encoding: [0xfa,0xc2,0x0a,0x7f,0x81,0x60,0x09,0x13]
262+
263+ v_cos_f16 v127.h, -|v127.h| row_xmask:15 row_mask:0x3 bank_mask:0x0 bound_ctrl:0 fi:1
264+ // GFX11: v_cos_f16_dpp v127.h, -|v127.h| row_xmask:15 row_mask:0x3 bank_mask:0x0 fi:1 ; encoding: [0xfa,0xc2,0xfe,0x7f,0xff,0x6f,0x35,0x30]
256265
257266v_cos_f32 v5, v1 quad_perm:[3 ,2 ,1 ,0 ]
258267// GFX11: v_cos_f32_dpp v5, v1 quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0x6c,0x0a,0x7e,0x01,0x1b,0x00,0xff]
0 commit comments