|
1 | 1 | ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5 |
2 | | -; RUN: llc < %s | FileCheck -check-prefix=ENABLED %s |
3 | | -; RUN: llc -disable-nvptx-load-store-vectorizer < %s | FileCheck -check-prefix=DISABLED %s |
4 | | -; RUN: %if ptxas %{ llc < %s | %ptxas-verify %} |
5 | | -; RUN: %if ptxas %{ llc -disable-nvptx-load-store-vectorizer < %s | %ptxas-verify %} |
| 2 | +; RUN: llc -march=nvptx64 -mcpu=sm_90 -mattr=+ptx88 < %s | FileCheck -check-prefix=ENABLED %s |
| 3 | +; RUN: llc -march=nvptx64 -mcpu=sm_90 -mattr=+ptx88 -disable-nvptx-load-store-vectorizer < %s | FileCheck -check-prefix=DISABLED %s |
| 4 | +; RUN: %if ptxas-sm_90 && ptxas-isa-8.8 %{ llc -march=nvptx64 -mcpu=sm_90 -mattr=+ptx88 < %s | %ptxas-verify -arch=sm_90 %} |
| 5 | +; RUN: %if ptxas-sm_90 && ptxas-isa-8.8 %{ llc -march=nvptx64 -mcpu=sm_90 -mattr=+ptx88 -disable-nvptx-load-store-vectorizer < %s | %ptxas-verify -arch=sm_90 %} |
6 | 6 |
|
7 | 7 | target triple = "nvptx64-nvidia-cuda" |
8 | 8 |
|
@@ -52,7 +52,7 @@ define half @fh(ptr %p) { |
52 | 52 | ; ENABLED-NEXT: ld.param.b64 %rd1, [fh_param_0]; |
53 | 53 | ; ENABLED-NEXT: .pragma "used_bytes_mask 0x3ff"; |
54 | 54 | ; ENABLED-NEXT: ld.v4.b32 {%r1, %r2, %r3, %r4}, [%rd1]; |
55 | | -; ENABLED-NEXT: { .reg .b16 tmp; mov.b32 {%rs1, tmp}, %r3; } |
| 55 | +; ENABLED-NEXT: mov.b32 {%rs1, _}, %r3; |
56 | 56 | ; ENABLED-NEXT: mov.b32 {%rs2, %rs3}, %r2; |
57 | 57 | ; ENABLED-NEXT: mov.b32 {%rs4, %rs5}, %r1; |
58 | 58 | ; ENABLED-NEXT: cvt.f32.f16 %r5, %rs5; |
|
0 commit comments