@@ -430,36 +430,36 @@ define ptr @gep_disjoint_or(ptr %base) {
430430
431431; Check that AssertAlign nodes between ptradd nodes don't block offset folding,
432432; taken from preload-implicit-kernargs.ll
433- define amdgpu_kernel void @random_incorrect_offset (ptr addrspace (1 ) inreg %out ) # 0 {
433+ define amdgpu_kernel void @random_incorrect_offset (ptr addrspace (1 ) inreg %out ) {
434434; GFX942_PTRADD-LABEL: random_incorrect_offset:
435435; GFX942_PTRADD: ; %bb.1:
436- ; GFX942_PTRADD-NEXT: s_load_dwordx2 s[2:3 ], s[0:1 ], 0x0
436+ ; GFX942_PTRADD-NEXT: s_load_dwordx2 s[8:9 ], s[4:5 ], 0x0
437437; GFX942_PTRADD-NEXT: s_waitcnt lgkmcnt(0)
438438; GFX942_PTRADD-NEXT: s_branch .LBB21_0
439439; GFX942_PTRADD-NEXT: .p2align 8
440440; GFX942_PTRADD-NEXT: ; %bb.2:
441441; GFX942_PTRADD-NEXT: .LBB21_0:
442- ; GFX942_PTRADD-NEXT: s_load_dword s0, s[0:1 ], 0xa
442+ ; GFX942_PTRADD-NEXT: s_load_dword s0, s[4:5 ], 0xa
443443; GFX942_PTRADD-NEXT: v_mov_b32_e32 v0, 0
444444; GFX942_PTRADD-NEXT: s_waitcnt lgkmcnt(0)
445445; GFX942_PTRADD-NEXT: v_mov_b32_e32 v1, s0
446- ; GFX942_PTRADD-NEXT: global_store_dword v0, v1, s[2:3 ]
446+ ; GFX942_PTRADD-NEXT: global_store_dword v0, v1, s[8:9 ]
447447; GFX942_PTRADD-NEXT: s_endpgm
448448;
449449; GFX942_LEGACY-LABEL: random_incorrect_offset:
450450; GFX942_LEGACY: ; %bb.1:
451- ; GFX942_LEGACY-NEXT: s_load_dwordx2 s[2:3 ], s[0:1 ], 0x0
451+ ; GFX942_LEGACY-NEXT: s_load_dwordx2 s[8:9 ], s[4:5 ], 0x0
452452; GFX942_LEGACY-NEXT: s_waitcnt lgkmcnt(0)
453453; GFX942_LEGACY-NEXT: s_branch .LBB21_0
454454; GFX942_LEGACY-NEXT: .p2align 8
455455; GFX942_LEGACY-NEXT: ; %bb.2:
456456; GFX942_LEGACY-NEXT: .LBB21_0:
457- ; GFX942_LEGACY-NEXT: s_mov_b32 s4 , 8
458- ; GFX942_LEGACY-NEXT: s_load_dword s0, s[0:1 ], s4 offset:0x2
457+ ; GFX942_LEGACY-NEXT: s_mov_b32 s0 , 8
458+ ; GFX942_LEGACY-NEXT: s_load_dword s0, s[4:5 ], s0 offset:0x2
459459; GFX942_LEGACY-NEXT: v_mov_b32_e32 v0, 0
460460; GFX942_LEGACY-NEXT: s_waitcnt lgkmcnt(0)
461461; GFX942_LEGACY-NEXT: v_mov_b32_e32 v1, s0
462- ; GFX942_LEGACY-NEXT: global_store_dword v0, v1, s[2:3 ]
462+ ; GFX942_LEGACY-NEXT: global_store_dword v0, v1, s[8:9 ]
463463; GFX942_LEGACY-NEXT: s_endpgm
464464 %imp_arg_ptr = call ptr addrspace (4 ) @llvm.amdgcn.implicitarg.ptr ()
465465 %gep = getelementptr i8 , ptr addrspace (4 ) %imp_arg_ptr , i32 2
@@ -471,5 +471,3 @@ define amdgpu_kernel void @random_incorrect_offset(ptr addrspace(1) inreg %out)
471471declare void @llvm.memcpy.p0.p4.i64 (ptr noalias nocapture writeonly , ptr addrspace (4 ) noalias nocapture readonly , i64 , i1 immarg)
472472
473473!0 = !{}
474-
475- attributes #0 = { "amdgpu-agpr-alloc" ="0" "amdgpu-no-completion-action" "amdgpu-no-default-queue" "amdgpu-no-dispatch-id" "amdgpu-no-dispatch-ptr" "amdgpu-no-heap-ptr" "amdgpu-no-hostcall-ptr" "amdgpu-no-lds-kernel-id" "amdgpu-no-multigrid-sync-arg" "amdgpu-no-queue-ptr" "amdgpu-no-workgroup-id-x" "amdgpu-no-workgroup-id-y" "amdgpu-no-workgroup-id-z" "amdgpu-no-workitem-id-x" "amdgpu-no-workitem-id-y" "amdgpu-no-workitem-id-z" "uniform-work-group-size" ="false" }
0 commit comments