-
Notifications
You must be signed in to change notification settings - Fork 15.4k
[AMDGPU] Change handling of unsupported non-compute shaders with HSA #126798
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Changes from 3 commits
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -1,19 +1,174 @@ | ||
| ; RUN: not llc -mtriple=amdgcn-unknown-amdhsa < %s 2>&1 | FileCheck %s | ||
| ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --tool not --version 5 | ||
| ; RUN: not llc -mtriple=amdgcn-unknown-amdhsa -O0 -stop-after=amdgpu-isel -o - < %s 2>&1 | FileCheck %s | ||
|
|
||
| ; CHECK: in function pixel_s{{.*}}: unsupported non-compute shaders with HSA | ||
|
Contributor
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. We must maintain test coverage for error cases
Contributor
Author
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. I wanted to adapt the test, but FileCheck didn't seem to be able to check for the
Member
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Did you try
Contributor
Author
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Yeah, in the meantime, I found this by searching through similar tests (basically |
||
| define amdgpu_ps void @pixel_shader() #0 { | ||
| @I = global i32 42 | ||
| @P = global ptr @I | ||
|
|
||
| ; CHECK: error: <unknown>:0:0: in function pixel_shader_zero_args void (): unsupported non-compute shaders with HSA | ||
| ; CHECK: error: <unknown>:0:0: in function pixel_shader_one_arg void (ptr): unsupported non-compute shaders with HSA | ||
| ; CHECK: error: <unknown>:0:0: in function pixel_shader_two_args void (ptr, i32): unsupported non-compute shaders with HSA | ||
| ; CHECK: error: <unknown>:0:0: in function vertex_shader_zero_args void (): unsupported non-compute shaders with HSA | ||
| ; CHECK: error: <unknown>:0:0: in function vertex_shader_one_arg void (ptr): unsupported non-compute shaders with HSA | ||
| ; CHECK: error: <unknown>:0:0: in function vertex_shader_two_args void (ptr, i32): unsupported non-compute shaders with HSA | ||
| ; CHECK: error: <unknown>:0:0: in function geometry_shader_zero_args void (): unsupported non-compute shaders with HSA | ||
| ; CHECK: error: <unknown>:0:0: in function geometry_shader_one_arg void (ptr): unsupported non-compute shaders with HSA | ||
| ; CHECK: error: <unknown>:0:0: in function geometry_shader_two_args void (ptr, i32): unsupported non-compute shaders with HSA | ||
|
|
||
| ; CHECK-LABEL: name: pixel_shader_zero_args | ||
ro-i marked this conversation as resolved.
Outdated
Show resolved
Hide resolved
|
||
| ; CHECK: bb.0 (%ir-block.0): | ||
| ; CHECK-NEXT: %2:sreg_64 = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-gotprel32-lo) @I, target-flags(amdgpu-gotprel32-hi) @I, implicit-def dead $scc | ||
| ; CHECK-NEXT: %3:sreg_64_xexec = S_LOAD_DWORDX2_IMM killed %2, 0, 0 :: (dereferenceable invariant load (s64) from got, addrspace 4) | ||
| ; CHECK-NEXT: %5:vreg_64 = COPY %3 | ||
| ; CHECK-NEXT: %4:vgpr_32 = FLAT_LOAD_DWORD killed %5, 0, 0, implicit $exec, implicit $flat_scr :: (dereferenceable load (s32) from @I) | ||
| ; CHECK-NEXT: %6:sreg_64 = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-gotprel32-lo) @P, target-flags(amdgpu-gotprel32-hi) @P, implicit-def dead $scc | ||
| ; CHECK-NEXT: %7:sreg_64_xexec = S_LOAD_DWORDX2_IMM killed %6, 0, 0 :: (dereferenceable invariant load (s64) from got, addrspace 4) | ||
| ; CHECK-NEXT: %8:vreg_64 = COPY %7 | ||
| ; CHECK-NEXT: FLAT_STORE_DWORD killed %8, killed %4, 0, 0, implicit $exec, implicit $flat_scr :: (store (s32) into @P) | ||
| ; CHECK-NEXT: S_ENDPGM 0 | ||
| define amdgpu_ps void @pixel_shader_zero_args() { | ||
| %i = load i32, ptr @I | ||
| store i32 %i, ptr @P | ||
| ret void | ||
| } | ||
|
|
||
| ; CHECK-LABEL: name: pixel_shader_one_arg | ||
| ; CHECK: bb.0 (%ir-block.0): | ||
| ; CHECK-NEXT: %4:sreg_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %5:sreg_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %6:sreg_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %7:sreg_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %3:sreg_64 = REG_SEQUENCE %4, %subreg.sub0, %6, %subreg.sub1 | ||
| ; CHECK-NEXT: %2:vreg_64 = COPY %3 | ||
| ; CHECK-NEXT: %8:sreg_64 = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-gotprel32-lo) @I, target-flags(amdgpu-gotprel32-hi) @I, implicit-def dead $scc | ||
| ; CHECK-NEXT: %9:sreg_64_xexec = S_LOAD_DWORDX2_IMM killed %8, 0, 0 :: (dereferenceable invariant load (s64) from got, addrspace 4) | ||
| ; CHECK-NEXT: %11:vreg_64 = COPY %9 | ||
| ; CHECK-NEXT: %10:vgpr_32 = FLAT_LOAD_DWORD killed %11, 0, 0, implicit $exec, implicit $flat_scr :: (dereferenceable load (s32) from @I) | ||
| ; CHECK-NEXT: %12:vreg_64 = COPY %3 | ||
| ; CHECK-NEXT: FLAT_STORE_DWORD %12, killed %10, 0, 0, implicit $exec, implicit $flat_scr :: (store (s32) into %ir.p) | ||
| ; CHECK-NEXT: S_ENDPGM 0 | ||
| define amdgpu_ps void @pixel_shader_one_arg(ptr %p) { | ||
| %i = load i32, ptr @I | ||
| store i32 %i, ptr %p | ||
| ret void | ||
| } | ||
|
|
||
| ; CHECK: in function vertex_s{{.*}}: unsupported non-compute shaders with HSA | ||
| define amdgpu_vs void @vertex_shader() #0 { | ||
| ; CHECK-LABEL: name: pixel_shader_two_args | ||
| ; CHECK: bb.0 (%ir-block.0): | ||
| ; CHECK-NEXT: %5:sreg_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %6:sreg_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %7:sreg_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %8:sreg_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %4:sreg_64 = REG_SEQUENCE %5, %subreg.sub0, %7, %subreg.sub1 | ||
| ; CHECK-NEXT: %3:vgpr_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %2:vreg_64 = COPY %4 | ||
| ; CHECK-NEXT: S_ENDPGM 0 | ||
| define amdgpu_ps void @pixel_shader_two_args(ptr %p, i32 %i) { | ||
| store i32 %i, ptr %p | ||
| ret void | ||
| } | ||
|
|
||
| ; CHECK: in function geometry_s{{.*}}: unsupported non-compute shaders with HSA | ||
| define amdgpu_gs void @geometry_shader() #0 { | ||
| ; CHECK-LABEL: name: vertex_shader_zero_args | ||
| ; CHECK: bb.0 (%ir-block.0): | ||
| ; CHECK-NEXT: %2:sreg_64 = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-gotprel32-lo) @I, target-flags(amdgpu-gotprel32-hi) @I, implicit-def dead $scc | ||
| ; CHECK-NEXT: %3:sreg_64_xexec = S_LOAD_DWORDX2_IMM killed %2, 0, 0 :: (dereferenceable invariant load (s64) from got, addrspace 4) | ||
| ; CHECK-NEXT: %5:vreg_64 = COPY %3 | ||
| ; CHECK-NEXT: %4:vgpr_32 = FLAT_LOAD_DWORD killed %5, 0, 0, implicit $exec, implicit $flat_scr :: (dereferenceable load (s32) from @I) | ||
| ; CHECK-NEXT: %6:sreg_64 = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-gotprel32-lo) @P, target-flags(amdgpu-gotprel32-hi) @P, implicit-def dead $scc | ||
| ; CHECK-NEXT: %7:sreg_64_xexec = S_LOAD_DWORDX2_IMM killed %6, 0, 0 :: (dereferenceable invariant load (s64) from got, addrspace 4) | ||
| ; CHECK-NEXT: %8:vreg_64 = COPY %7 | ||
| ; CHECK-NEXT: FLAT_STORE_DWORD killed %8, killed %4, 0, 0, implicit $exec, implicit $flat_scr :: (store (s32) into @P) | ||
| ; CHECK-NEXT: S_ENDPGM 0 | ||
| define amdgpu_vs void @vertex_shader_zero_args() { | ||
| %i = load i32, ptr @I | ||
| store i32 %i, ptr @P | ||
| ret void | ||
| } | ||
|
|
||
| !llvm.module.flags = !{!0} | ||
| !0 = !{i32 1, !"amdhsa_code_object_version", i32 400} | ||
| ; CHECK-LABEL: name: vertex_shader_one_arg | ||
| ; CHECK: bb.0 (%ir-block.0): | ||
| ; CHECK-NEXT: %4:sreg_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %5:sreg_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %6:sreg_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %7:sreg_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %3:sreg_64 = REG_SEQUENCE %4, %subreg.sub0, %6, %subreg.sub1 | ||
| ; CHECK-NEXT: %2:vreg_64 = COPY %3 | ||
| ; CHECK-NEXT: %8:sreg_64 = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-gotprel32-lo) @I, target-flags(amdgpu-gotprel32-hi) @I, implicit-def dead $scc | ||
| ; CHECK-NEXT: %9:sreg_64_xexec = S_LOAD_DWORDX2_IMM killed %8, 0, 0 :: (dereferenceable invariant load (s64) from got, addrspace 4) | ||
| ; CHECK-NEXT: %11:vreg_64 = COPY %9 | ||
| ; CHECK-NEXT: %10:vgpr_32 = FLAT_LOAD_DWORD killed %11, 0, 0, implicit $exec, implicit $flat_scr :: (dereferenceable load (s32) from @I) | ||
| ; CHECK-NEXT: %12:vreg_64 = COPY %3 | ||
| ; CHECK-NEXT: FLAT_STORE_DWORD %12, killed %10, 0, 0, implicit $exec, implicit $flat_scr :: (store (s32) into %ir.p) | ||
| ; CHECK-NEXT: S_ENDPGM 0 | ||
| define amdgpu_vs void @vertex_shader_one_arg(ptr %p) { | ||
| %i = load i32, ptr @I | ||
| store i32 %i, ptr %p | ||
| ret void | ||
| } | ||
|
|
||
| ; CHECK-LABEL: name: vertex_shader_two_args | ||
| ; CHECK: bb.0 (%ir-block.0): | ||
| ; CHECK-NEXT: %5:sreg_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %6:sreg_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %7:sreg_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %8:sreg_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %4:sreg_64 = REG_SEQUENCE %5, %subreg.sub0, %7, %subreg.sub1 | ||
| ; CHECK-NEXT: %3:vgpr_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %2:vreg_64 = COPY %4 | ||
| ; CHECK-NEXT: S_ENDPGM 0 | ||
| define amdgpu_vs void @vertex_shader_two_args(ptr %p, i32 %i) { | ||
| store i32 %i, ptr %p | ||
| ret void | ||
| } | ||
|
|
||
| ; CHECK-LABEL: name: geometry_shader_zero_args | ||
| ; CHECK: bb.0 (%ir-block.0): | ||
| ; CHECK-NEXT: %2:sreg_64 = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-gotprel32-lo) @I, target-flags(amdgpu-gotprel32-hi) @I, implicit-def dead $scc | ||
| ; CHECK-NEXT: %3:sreg_64_xexec = S_LOAD_DWORDX2_IMM killed %2, 0, 0 :: (dereferenceable invariant load (s64) from got, addrspace 4) | ||
| ; CHECK-NEXT: %5:vreg_64 = COPY %3 | ||
| ; CHECK-NEXT: %4:vgpr_32 = FLAT_LOAD_DWORD killed %5, 0, 0, implicit $exec, implicit $flat_scr :: (dereferenceable load (s32) from @I) | ||
| ; CHECK-NEXT: %6:sreg_64 = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-gotprel32-lo) @P, target-flags(amdgpu-gotprel32-hi) @P, implicit-def dead $scc | ||
| ; CHECK-NEXT: %7:sreg_64_xexec = S_LOAD_DWORDX2_IMM killed %6, 0, 0 :: (dereferenceable invariant load (s64) from got, addrspace 4) | ||
| ; CHECK-NEXT: %8:vreg_64 = COPY %7 | ||
| ; CHECK-NEXT: FLAT_STORE_DWORD killed %8, killed %4, 0, 0, implicit $exec, implicit $flat_scr :: (store (s32) into @P) | ||
| ; CHECK-NEXT: S_ENDPGM 0 | ||
| define amdgpu_gs void @geometry_shader_zero_args() { | ||
| %i = load i32, ptr @I | ||
| store i32 %i, ptr @P | ||
| ret void | ||
| } | ||
|
|
||
| ; CHECK-LABEL: name: geometry_shader_one_arg | ||
| ; CHECK: bb.0 (%ir-block.0): | ||
| ; CHECK-NEXT: %4:sreg_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %5:sreg_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %6:sreg_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %7:sreg_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %3:sreg_64 = REG_SEQUENCE %4, %subreg.sub0, %6, %subreg.sub1 | ||
| ; CHECK-NEXT: %2:vreg_64 = COPY %3 | ||
| ; CHECK-NEXT: %8:sreg_64 = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-gotprel32-lo) @I, target-flags(amdgpu-gotprel32-hi) @I, implicit-def dead $scc | ||
| ; CHECK-NEXT: %9:sreg_64_xexec = S_LOAD_DWORDX2_IMM killed %8, 0, 0 :: (dereferenceable invariant load (s64) from got, addrspace 4) | ||
| ; CHECK-NEXT: %11:vreg_64 = COPY %9 | ||
| ; CHECK-NEXT: %10:vgpr_32 = FLAT_LOAD_DWORD killed %11, 0, 0, implicit $exec, implicit $flat_scr :: (dereferenceable load (s32) from @I) | ||
| ; CHECK-NEXT: %12:vreg_64 = COPY %3 | ||
| ; CHECK-NEXT: FLAT_STORE_DWORD %12, killed %10, 0, 0, implicit $exec, implicit $flat_scr :: (store (s32) into %ir.p) | ||
| ; CHECK-NEXT: S_ENDPGM 0 | ||
| define amdgpu_gs void @geometry_shader_one_arg(ptr %p) { | ||
| %i = load i32, ptr @I | ||
| store i32 %i, ptr %p | ||
| ret void | ||
| } | ||
|
|
||
| ; CHECK-LABEL: name: geometry_shader_two_args | ||
| ; CHECK: bb.0 (%ir-block.0): | ||
| ; CHECK-NEXT: %5:sreg_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %6:sreg_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %7:sreg_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %8:sreg_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %4:sreg_64 = REG_SEQUENCE %5, %subreg.sub0, %7, %subreg.sub1 | ||
| ; CHECK-NEXT: %3:vgpr_32 = IMPLICIT_DEF | ||
| ; CHECK-NEXT: %2:vreg_64 = COPY %4 | ||
| ; CHECK-NEXT: S_ENDPGM 0 | ||
| define amdgpu_gs void @geometry_shader_two_args(ptr %p, i32 %i) { | ||
| store i32 %i, ptr %p | ||
| ret void | ||
| } | ||
Uh oh!
There was an error while loading. Please reload this page.