|
1 | | -; RUN: llc -O0 < %s -mtriple=nvptx -mcpu=sm_20 | FileCheck %s -check-prefixes=ALL,CLS32,G32 |
2 | | -; RUN: llc -O0 < %s -mtriple=nvptx64 -mcpu=sm_20 | FileCheck %s -check-prefixes=ALL,NOPTRCONV,CLS64,G64 |
3 | | -; RUN: llc -O0 < %s -mtriple=nvptx64 -mcpu=sm_20 --nvptx-short-ptr| FileCheck %s -check-prefixes=ALL,PTRCONV,CLS64,G64 |
| 1 | +; RUN: llc -O0 < %s -mtriple=nvptx -mcpu=sm_20 | FileCheck %s -check-prefixes=ALL,CLS32 |
| 2 | +; RUN: llc -O0 < %s -mtriple=nvptx64 -mcpu=sm_20 | FileCheck %s -check-prefixes=ALL,NOPTRCONV,CLS64 |
| 3 | +; RUN: llc -O0 < %s -mtriple=nvptx64 -mcpu=sm_20 --nvptx-short-ptr | FileCheck %s -check-prefixes=ALL,PTRCONV,CLS64 |
4 | 4 | ; RUN: %if ptxas && !ptxas-12.0 %{ llc -O0 < %s -mtriple=nvptx -mcpu=sm_20 | %ptxas-verify %} |
5 | 5 | ; RUN: %if ptxas %{ llc -O0 < %s -mtriple=nvptx64 -mcpu=sm_20 | %ptxas-verify %} |
6 | 6 | ; RUN: %if ptxas %{ llc -O0 < %s -mtriple=nvptx64 -mcpu=sm_20 --nvptx-short-ptr | %ptxas-verify %} |
7 | 7 |
|
8 | 8 | ; ALL-LABEL: conv1 |
9 | 9 | define i32 @conv1(ptr addrspace(1) %ptr) { |
10 | | -; G32: cvta.global.u32 |
| 10 | +; CLS32: cvta.global.u32 |
11 | 11 | ; ALL-NOT: cvt.u64.u32 |
12 | | -; G64: cvta.global.u64 |
| 12 | +; CLS64: cvta.global.u64 |
13 | 13 | ; ALL: ld.u32 |
14 | 14 | %genptr = addrspacecast ptr addrspace(1) %ptr to ptr |
15 | 15 | %val = load i32, ptr %genptr |
@@ -101,13 +101,10 @@ define i32 @conv8(ptr %ptr) { |
101 | 101 |
|
102 | 102 | ; ALL-LABEL: conv9 |
103 | 103 | define i32 @conv9(ptr addrspace(1) %ptr) { |
104 | | -; CLS32: cvta.global.u32 |
105 | | -; CLS32: cvta.to.shared.u32 |
106 | | -; CLS64: cvta.global.u64 |
107 | | -; CLS64: cvta.to.shared.u64 |
108 | | -; PTRCONV: cvt.u32.u64 |
109 | | -; NOPTRCONV-NOT: cvt.u32.u64 |
110 | | -; ALL: ld.shared.u32 |
| 104 | +; CLS32: // implicit-def: %[[ADDR:r[0-9]+]] |
| 105 | +; PTRCONV: // implicit-def: %[[ADDR:r[0-9]+]] |
| 106 | +; NOPTRCONV: // implicit-def: %[[ADDR:rd[0-9]+]] |
| 107 | +; ALL: ld.shared.u32 %r{{[0-9]+}}, [%[[ADDR]]] |
111 | 108 | %specptr = addrspacecast ptr addrspace(1) %ptr to ptr addrspace(3) |
112 | 109 | %val = load i32, ptr addrspace(3) %specptr |
113 | 110 | ret i32 %val |
|
0 commit comments