@@ -196,39 +196,39 @@ define void @preserve_wwm_copy_dstreg(ptr %parg0, ptr %parg1, ptr %parg2) #0 {
196196; GFX906-NEXT: ;;#ASMSTART
197197; GFX906-NEXT: ; def s21
198198; GFX906-NEXT: ;;#ASMEND
199- ; GFX906-NEXT: v_writelane_b32 v39, s21, 24
199+ ; GFX906-NEXT: v_writelane_b32 v39, s21, 12
200200; GFX906-NEXT: ;;#ASMSTART
201201; GFX906-NEXT: ; def s22
202202; GFX906-NEXT: ;;#ASMEND
203- ; GFX906-NEXT: v_writelane_b32 v39, s22, 25
203+ ; GFX906-NEXT: v_writelane_b32 v39, s22, 13
204204; GFX906-NEXT: ;;#ASMSTART
205205; GFX906-NEXT: ; def s23
206206; GFX906-NEXT: ;;#ASMEND
207- ; GFX906-NEXT: v_writelane_b32 v39, s23, 26
207+ ; GFX906-NEXT: v_writelane_b32 v39, s23, 14
208208; GFX906-NEXT: ;;#ASMSTART
209209; GFX906-NEXT: ; def s24
210210; GFX906-NEXT: ;;#ASMEND
211- ; GFX906-NEXT: v_writelane_b32 v39, s24, 27
211+ ; GFX906-NEXT: v_writelane_b32 v39, s24, 15
212212; GFX906-NEXT: ;;#ASMSTART
213213; GFX906-NEXT: ; def s25
214214; GFX906-NEXT: ;;#ASMEND
215- ; GFX906-NEXT: v_writelane_b32 v39, s25, 28
215+ ; GFX906-NEXT: v_writelane_b32 v39, s25, 16
216216; GFX906-NEXT: ;;#ASMSTART
217217; GFX906-NEXT: ; def s26
218218; GFX906-NEXT: ;;#ASMEND
219- ; GFX906-NEXT: v_writelane_b32 v39, s26, 29
219+ ; GFX906-NEXT: v_writelane_b32 v39, s26, 17
220220; GFX906-NEXT: ;;#ASMSTART
221221; GFX906-NEXT: ; def s27
222222; GFX906-NEXT: ;;#ASMEND
223- ; GFX906-NEXT: v_writelane_b32 v39, s27, 30
223+ ; GFX906-NEXT: v_writelane_b32 v39, s27, 18
224224; GFX906-NEXT: ;;#ASMSTART
225225; GFX906-NEXT: ; def s28
226226; GFX906-NEXT: ;;#ASMEND
227- ; GFX906-NEXT: v_writelane_b32 v39, s28, 31
227+ ; GFX906-NEXT: v_writelane_b32 v39, s28, 19
228228; GFX906-NEXT: ;;#ASMSTART
229229; GFX906-NEXT: ; def s29
230230; GFX906-NEXT: ;;#ASMEND
231- ; GFX906-NEXT: v_writelane_b32 v39, s29, 32
231+ ; GFX906-NEXT: v_writelane_b32 v39, s29, 20
232232; GFX906-NEXT: s_or_saveexec_b64 s[34:35], -1
233233; GFX906-NEXT: buffer_store_dword v39, off, s[0:3], s33 offset:4 ; 4-byte Folded Spill
234234; GFX906-NEXT: s_mov_b64 exec, s[34:35]
@@ -267,39 +267,39 @@ define void @preserve_wwm_copy_dstreg(ptr %parg0, ptr %parg1, ptr %parg2) #0 {
267267; GFX906-NEXT: v_readlane_b32 s15, v39, 2
268268; GFX906-NEXT: v_mov_b32_e32 v31, v40
269269; GFX906-NEXT: v_readlane_b32 s17, v39, 23
270- ; GFX906-NEXT: v_readlane_b32 s21, v39, 24
270+ ; GFX906-NEXT: v_readlane_b32 s21, v39, 12
271271; GFX906-NEXT: ;;#ASMSTART
272272; GFX906-NEXT: ; use s21
273273; GFX906-NEXT: ;;#ASMEND
274- ; GFX906-NEXT: v_readlane_b32 s22, v39, 25
274+ ; GFX906-NEXT: v_readlane_b32 s22, v39, 13
275275; GFX906-NEXT: ;;#ASMSTART
276276; GFX906-NEXT: ; use s22
277277; GFX906-NEXT: ;;#ASMEND
278- ; GFX906-NEXT: v_readlane_b32 s23, v39, 26
278+ ; GFX906-NEXT: v_readlane_b32 s23, v39, 14
279279; GFX906-NEXT: ;;#ASMSTART
280280; GFX906-NEXT: ; use s23
281281; GFX906-NEXT: ;;#ASMEND
282- ; GFX906-NEXT: v_readlane_b32 s24, v39, 27
282+ ; GFX906-NEXT: v_readlane_b32 s24, v39, 15
283283; GFX906-NEXT: ;;#ASMSTART
284284; GFX906-NEXT: ; use s24
285285; GFX906-NEXT: ;;#ASMEND
286- ; GFX906-NEXT: v_readlane_b32 s25, v39, 28
286+ ; GFX906-NEXT: v_readlane_b32 s25, v39, 16
287287; GFX906-NEXT: ;;#ASMSTART
288288; GFX906-NEXT: ; use s25
289289; GFX906-NEXT: ;;#ASMEND
290- ; GFX906-NEXT: v_readlane_b32 s26, v39, 29
290+ ; GFX906-NEXT: v_readlane_b32 s26, v39, 17
291291; GFX906-NEXT: ;;#ASMSTART
292292; GFX906-NEXT: ; use s26
293293; GFX906-NEXT: ;;#ASMEND
294- ; GFX906-NEXT: v_readlane_b32 s27, v39, 30
294+ ; GFX906-NEXT: v_readlane_b32 s27, v39, 18
295295; GFX906-NEXT: ;;#ASMSTART
296296; GFX906-NEXT: ; use s27
297297; GFX906-NEXT: ;;#ASMEND
298- ; GFX906-NEXT: v_readlane_b32 s28, v39, 31
298+ ; GFX906-NEXT: v_readlane_b32 s28, v39, 19
299299; GFX906-NEXT: ;;#ASMSTART
300300; GFX906-NEXT: ; use s28
301301; GFX906-NEXT: ;;#ASMEND
302- ; GFX906-NEXT: v_readlane_b32 s29, v39, 32
302+ ; GFX906-NEXT: v_readlane_b32 s29, v39, 20
303303; GFX906-NEXT: ;;#ASMSTART
304304; GFX906-NEXT: ; use s29
305305; GFX906-NEXT: ;;#ASMEND
@@ -575,39 +575,39 @@ define void @preserve_wwm_copy_dstreg(ptr %parg0, ptr %parg1, ptr %parg2) #0 {
575575; GFX908-NEXT: ;;#ASMSTART
576576; GFX908-NEXT: ; def s21
577577; GFX908-NEXT: ;;#ASMEND
578- ; GFX908-NEXT: v_writelane_b32 v39, s21, 24
578+ ; GFX908-NEXT: v_writelane_b32 v39, s21, 12
579579; GFX908-NEXT: ;;#ASMSTART
580580; GFX908-NEXT: ; def s22
581581; GFX908-NEXT: ;;#ASMEND
582- ; GFX908-NEXT: v_writelane_b32 v39, s22, 25
582+ ; GFX908-NEXT: v_writelane_b32 v39, s22, 13
583583; GFX908-NEXT: ;;#ASMSTART
584584; GFX908-NEXT: ; def s23
585585; GFX908-NEXT: ;;#ASMEND
586- ; GFX908-NEXT: v_writelane_b32 v39, s23, 26
586+ ; GFX908-NEXT: v_writelane_b32 v39, s23, 14
587587; GFX908-NEXT: ;;#ASMSTART
588588; GFX908-NEXT: ; def s24
589589; GFX908-NEXT: ;;#ASMEND
590- ; GFX908-NEXT: v_writelane_b32 v39, s24, 27
590+ ; GFX908-NEXT: v_writelane_b32 v39, s24, 15
591591; GFX908-NEXT: ;;#ASMSTART
592592; GFX908-NEXT: ; def s25
593593; GFX908-NEXT: ;;#ASMEND
594- ; GFX908-NEXT: v_writelane_b32 v39, s25, 28
594+ ; GFX908-NEXT: v_writelane_b32 v39, s25, 16
595595; GFX908-NEXT: ;;#ASMSTART
596596; GFX908-NEXT: ; def s26
597597; GFX908-NEXT: ;;#ASMEND
598- ; GFX908-NEXT: v_writelane_b32 v39, s26, 29
598+ ; GFX908-NEXT: v_writelane_b32 v39, s26, 17
599599; GFX908-NEXT: ;;#ASMSTART
600600; GFX908-NEXT: ; def s27
601601; GFX908-NEXT: ;;#ASMEND
602- ; GFX908-NEXT: v_writelane_b32 v39, s27, 30
602+ ; GFX908-NEXT: v_writelane_b32 v39, s27, 18
603603; GFX908-NEXT: ;;#ASMSTART
604604; GFX908-NEXT: ; def s28
605605; GFX908-NEXT: ;;#ASMEND
606- ; GFX908-NEXT: v_writelane_b32 v39, s28, 31
606+ ; GFX908-NEXT: v_writelane_b32 v39, s28, 19
607607; GFX908-NEXT: ;;#ASMSTART
608608; GFX908-NEXT: ; def s29
609609; GFX908-NEXT: ;;#ASMEND
610- ; GFX908-NEXT: v_writelane_b32 v39, s29, 32
610+ ; GFX908-NEXT: v_writelane_b32 v39, s29, 20
611611; GFX908-NEXT: s_or_saveexec_b64 s[34:35], -1
612612; GFX908-NEXT: buffer_store_dword v39, off, s[0:3], s33 offset:12 ; 4-byte Folded Spill
613613; GFX908-NEXT: s_mov_b64 exec, s[34:35]
@@ -646,39 +646,39 @@ define void @preserve_wwm_copy_dstreg(ptr %parg0, ptr %parg1, ptr %parg2) #0 {
646646; GFX908-NEXT: v_readlane_b32 s15, v39, 2
647647; GFX908-NEXT: v_mov_b32_e32 v31, v40
648648; GFX908-NEXT: v_readlane_b32 s17, v39, 23
649- ; GFX908-NEXT: v_readlane_b32 s21, v39, 24
649+ ; GFX908-NEXT: v_readlane_b32 s21, v39, 12
650650; GFX908-NEXT: ;;#ASMSTART
651651; GFX908-NEXT: ; use s21
652652; GFX908-NEXT: ;;#ASMEND
653- ; GFX908-NEXT: v_readlane_b32 s22, v39, 25
653+ ; GFX908-NEXT: v_readlane_b32 s22, v39, 13
654654; GFX908-NEXT: ;;#ASMSTART
655655; GFX908-NEXT: ; use s22
656656; GFX908-NEXT: ;;#ASMEND
657- ; GFX908-NEXT: v_readlane_b32 s23, v39, 26
657+ ; GFX908-NEXT: v_readlane_b32 s23, v39, 14
658658; GFX908-NEXT: ;;#ASMSTART
659659; GFX908-NEXT: ; use s23
660660; GFX908-NEXT: ;;#ASMEND
661- ; GFX908-NEXT: v_readlane_b32 s24, v39, 27
661+ ; GFX908-NEXT: v_readlane_b32 s24, v39, 15
662662; GFX908-NEXT: ;;#ASMSTART
663663; GFX908-NEXT: ; use s24
664664; GFX908-NEXT: ;;#ASMEND
665- ; GFX908-NEXT: v_readlane_b32 s25, v39, 28
665+ ; GFX908-NEXT: v_readlane_b32 s25, v39, 16
666666; GFX908-NEXT: ;;#ASMSTART
667667; GFX908-NEXT: ; use s25
668668; GFX908-NEXT: ;;#ASMEND
669- ; GFX908-NEXT: v_readlane_b32 s26, v39, 29
669+ ; GFX908-NEXT: v_readlane_b32 s26, v39, 17
670670; GFX908-NEXT: ;;#ASMSTART
671671; GFX908-NEXT: ; use s26
672672; GFX908-NEXT: ;;#ASMEND
673- ; GFX908-NEXT: v_readlane_b32 s27, v39, 30
673+ ; GFX908-NEXT: v_readlane_b32 s27, v39, 18
674674; GFX908-NEXT: ;;#ASMSTART
675675; GFX908-NEXT: ; use s27
676676; GFX908-NEXT: ;;#ASMEND
677- ; GFX908-NEXT: v_readlane_b32 s28, v39, 31
677+ ; GFX908-NEXT: v_readlane_b32 s28, v39, 19
678678; GFX908-NEXT: ;;#ASMSTART
679679; GFX908-NEXT: ; use s28
680680; GFX908-NEXT: ;;#ASMEND
681- ; GFX908-NEXT: v_readlane_b32 s29, v39, 32
681+ ; GFX908-NEXT: v_readlane_b32 s29, v39, 20
682682; GFX908-NEXT: ;;#ASMSTART
683683; GFX908-NEXT: ; use s29
684684; GFX908-NEXT: ;;#ASMEND
0 commit comments