@@ -429,36 +429,36 @@ define ptr @gep_disjoint_or(ptr %base) {
429429
430430; Check that AssertAlign nodes between ptradd nodes don't block offset folding,
431431; taken from preload-implicit-kernargs.ll
432- define amdgpu_kernel void @random_incorrect_offset (ptr addrspace (1 ) inreg %out ) # 0 {
432+ define amdgpu_kernel void @random_incorrect_offset (ptr addrspace (1 ) inreg %out ) {
433433; GFX942_PTRADD-LABEL: random_incorrect_offset:
434434; GFX942_PTRADD: ; %bb.1:
435- ; GFX942_PTRADD-NEXT: s_load_dwordx2 s[2:3 ], s[0:1 ], 0x0
435+ ; GFX942_PTRADD-NEXT: s_load_dwordx2 s[8:9 ], s[4:5 ], 0x0
436436; GFX942_PTRADD-NEXT: s_waitcnt lgkmcnt(0)
437437; GFX942_PTRADD-NEXT: s_branch .LBB21_0
438438; GFX942_PTRADD-NEXT: .p2align 8
439439; GFX942_PTRADD-NEXT: ; %bb.2:
440440; GFX942_PTRADD-NEXT: .LBB21_0:
441- ; GFX942_PTRADD-NEXT: s_load_dword s0, s[0:1 ], 0xa
441+ ; GFX942_PTRADD-NEXT: s_load_dword s0, s[4:5 ], 0xa
442442; GFX942_PTRADD-NEXT: v_mov_b32_e32 v0, 0
443443; GFX942_PTRADD-NEXT: s_waitcnt lgkmcnt(0)
444444; GFX942_PTRADD-NEXT: v_mov_b32_e32 v1, s0
445- ; GFX942_PTRADD-NEXT: global_store_dword v0, v1, s[2:3 ]
445+ ; GFX942_PTRADD-NEXT: global_store_dword v0, v1, s[8:9 ]
446446; GFX942_PTRADD-NEXT: s_endpgm
447447;
448448; GFX942_LEGACY-LABEL: random_incorrect_offset:
449449; GFX942_LEGACY: ; %bb.1:
450- ; GFX942_LEGACY-NEXT: s_load_dwordx2 s[2:3 ], s[0:1 ], 0x0
450+ ; GFX942_LEGACY-NEXT: s_load_dwordx2 s[8:9 ], s[4:5 ], 0x0
451451; GFX942_LEGACY-NEXT: s_waitcnt lgkmcnt(0)
452452; GFX942_LEGACY-NEXT: s_branch .LBB21_0
453453; GFX942_LEGACY-NEXT: .p2align 8
454454; GFX942_LEGACY-NEXT: ; %bb.2:
455455; GFX942_LEGACY-NEXT: .LBB21_0:
456- ; GFX942_LEGACY-NEXT: s_mov_b32 s4 , 8
457- ; GFX942_LEGACY-NEXT: s_load_dword s0, s[0:1 ], s4 offset:0x2
456+ ; GFX942_LEGACY-NEXT: s_mov_b32 s0 , 8
457+ ; GFX942_LEGACY-NEXT: s_load_dword s0, s[4:5 ], s0 offset:0x2
458458; GFX942_LEGACY-NEXT: v_mov_b32_e32 v0, 0
459459; GFX942_LEGACY-NEXT: s_waitcnt lgkmcnt(0)
460460; GFX942_LEGACY-NEXT: v_mov_b32_e32 v1, s0
461- ; GFX942_LEGACY-NEXT: global_store_dword v0, v1, s[2:3 ]
461+ ; GFX942_LEGACY-NEXT: global_store_dword v0, v1, s[8:9 ]
462462; GFX942_LEGACY-NEXT: s_endpgm
463463 %imp_arg_ptr = call ptr addrspace (4 ) @llvm.amdgcn.implicitarg.ptr ()
464464 %gep = getelementptr i8 , ptr addrspace (4 ) %imp_arg_ptr , i32 2
@@ -470,5 +470,3 @@ define amdgpu_kernel void @random_incorrect_offset(ptr addrspace(1) inreg %out)
470470declare void @llvm.memcpy.p0.p4.i64 (ptr noalias nocapture writeonly , ptr addrspace (4 ) noalias nocapture readonly , i64 , i1 immarg)
471471
472472!0 = !{}
473-
474- attributes #0 = { "amdgpu-agpr-alloc" ="0" "amdgpu-no-completion-action" "amdgpu-no-default-queue" "amdgpu-no-dispatch-id" "amdgpu-no-dispatch-ptr" "amdgpu-no-heap-ptr" "amdgpu-no-hostcall-ptr" "amdgpu-no-lds-kernel-id" "amdgpu-no-multigrid-sync-arg" "amdgpu-no-queue-ptr" "amdgpu-no-workgroup-id-x" "amdgpu-no-workgroup-id-y" "amdgpu-no-workgroup-id-z" "amdgpu-no-workitem-id-x" "amdgpu-no-workitem-id-y" "amdgpu-no-workitem-id-z" "uniform-work-group-size" ="false" }
0 commit comments