44
55target triple = "nvptx64-nvidia-cuda"
66
7- declare void @llvm.nvvm.prefetch.local.L1.evictnormal (ptr addrspace (5 ) %local_ptr )
8- declare void @llvm.nvvm.prefetch.local.L2.evictnormal (ptr addrspace (5 ) %local_ptr )
7+ declare void @llvm.nvvm.prefetch.global.L1 (ptr addrspace (1 ) %global_ptr )
8+ declare void @llvm.nvvm.prefetch.global.L2 (ptr addrspace (1 ) %global_ptr )
9+ declare void @llvm.nvvm.prefetch.local.L1 (ptr addrspace (5 ) %local_ptr )
10+ declare void @llvm.nvvm.prefetch.local.L2 (ptr addrspace (5 ) %local_ptr )
911
10- declare void @llvm.nvvm.prefetch.global.L1.evictnormal (ptr addrspace (1 ) %global_ptr )
11- declare void @llvm.nvvm.prefetch.global.L2.evictnormal (ptr addrspace (1 ) %global_ptr )
12- declare void @llvm.nvvm.prefetch.global.L1.evictlast (ptr addrspace (1 ) %global_ptr )
13- declare void @llvm.nvvm.prefetch.global.L2.evictlast (ptr addrspace (1 ) %global_ptr )
12+ declare void @llvm.nvvm.prefetch.L1 (ptr %ptr )
13+ declare void @llvm.nvvm.prefetch.L2 (ptr %ptr )
1414
15- declare void @llvm.nvvm.prefetch.L1.evictnormal (ptr %ptr )
16- declare void @llvm.nvvm.prefetch.L2.evictnormal (ptr %ptr )
15+ declare void @llvm.nvvm.prefetch.global.L2.evict.normal (ptr addrspace ( 1 ) %global_ptr )
16+ declare void @llvm.nvvm.prefetch.global.L2.evict.last (ptr addrspace ( 1 ) %global_ptr )
1717
18- declare void @llvm.nvvm.prefetchu.L1.evictnormal (ptr %ptr )
18+ declare void @llvm.nvvm.prefetchu.L1 (ptr %ptr )
1919
2020define void @prefetch_local (ptr addrspace (5 ) %local_ptr ) {
2121; CHECK-PTX64-LABEL: prefetch_local(
@@ -24,11 +24,11 @@ define void @prefetch_local(ptr addrspace(5) %local_ptr) {
2424; CHECK-PTX64-EMPTY:
2525; CHECK-PTX64-NEXT: // %bb.0:
2626; CHECK-PTX64-NEXT: ld.param.u64 %rd1, [prefetch_local_param_0];
27- ; CHECK-PTX64-NEXT: prefetch.local.L1.evictnormal [%rd1];
28- ; CHECK-PTX64-NEXT: prefetch.local.L2.evictnormal [%rd1];
27+ ; CHECK-PTX64-NEXT: prefetch.local.L1 [%rd1];
28+ ; CHECK-PTX64-NEXT: prefetch.local.L2 [%rd1];
2929; CHECK-PTX64-NEXT: ret;
30- tail call void @llvm.nvvm.prefetch.local.L1.evictnormal (ptr addrspace (5 ) %local_ptr )
31- tail call void @llvm.nvvm.prefetch.local.L2.evictnormal (ptr addrspace (5 ) %local_ptr )
30+ tail call void @llvm.nvvm.prefetch.local.L1 (ptr addrspace (5 ) %local_ptr )
31+ tail call void @llvm.nvvm.prefetch.local.L2 (ptr addrspace (5 ) %local_ptr )
3232 ret void
3333}
3434
@@ -39,15 +39,15 @@ define void @prefetch_global(ptr addrspace(1) %global_ptr) {
3939; CHECK-PTX64-EMPTY:
4040; CHECK-PTX64-NEXT: // %bb.0:
4141; CHECK-PTX64-NEXT: ld.param.u64 %rd1, [prefetch_global_param_0];
42- ; CHECK-PTX64-NEXT: prefetch.global.L1.evictnormal [%rd1];
43- ; CHECK-PTX64-NEXT: prefetch.global.L2.evictnormal [%rd1];
44- ; CHECK-PTX64-NEXT: prefetch.global.L1.evictlast [%rd1];
45- ; CHECK-PTX64-NEXT: prefetch.global.L2.evictlast [%rd1];
42+ ; CHECK-PTX64-NEXT: prefetch.global.L1 [%rd1];
43+ ; CHECK-PTX64-NEXT: prefetch.global.L2 [%rd1];
44+ ; CHECK-PTX64-NEXT: prefetch.global.L2::evict_normal [%rd1];
45+ ; CHECK-PTX64-NEXT: prefetch.global.L2::evict_last [%rd1];
4646; CHECK-PTX64-NEXT: ret;
47- tail call void @llvm.nvvm.prefetch.global.L1.evictnormal (ptr addrspace (1 ) %global_ptr )
48- tail call void @llvm.nvvm.prefetch.global.L2.evictnormal (ptr addrspace (1 ) %global_ptr )
49- tail call void @llvm.nvvm.prefetch.global.L1.evictlast (ptr addrspace (1 ) %global_ptr )
50- tail call void @llvm.nvvm.prefetch.global.L2.evictlast (ptr addrspace (1 ) %global_ptr )
47+ tail call void @llvm.nvvm.prefetch.global.L1 (ptr addrspace (1 ) %global_ptr )
48+ tail call void @llvm.nvvm.prefetch.global.L2 (ptr addrspace (1 ) %global_ptr )
49+ tail call void @llvm.nvvm.prefetch.global.L2.evict.normal (ptr addrspace (1 ) %global_ptr )
50+ tail call void @llvm.nvvm.prefetch.global.L2.evict.last (ptr addrspace (1 ) %global_ptr )
5151 ret void
5252}
5353
@@ -59,11 +59,11 @@ define void @prefetch_(ptr %ptr) {
5959; CHECK-PTX64-EMPTY:
6060; CHECK-PTX64-NEXT: // %bb.0:
6161; CHECK-PTX64-NEXT: ld.param.u64 %rd1, [prefetch__param_0];
62- ; CHECK-PTX64-NEXT: prefetch.L1.evictnormal [%rd1];
63- ; CHECK-PTX64-NEXT: prefetch.L2.evictnormal [%rd1];
62+ ; CHECK-PTX64-NEXT: prefetch.L1 [%rd1];
63+ ; CHECK-PTX64-NEXT: prefetch.L2 [%rd1];
6464; CHECK-PTX64-NEXT: ret;
65- tail call void @llvm.nvvm.prefetch.L1.evictnormal (ptr %ptr )
66- tail call void @llvm.nvvm.prefetch.L2.evictnormal (ptr %ptr )
65+ tail call void @llvm.nvvm.prefetch.L1 (ptr %ptr )
66+ tail call void @llvm.nvvm.prefetch.L2 (ptr %ptr )
6767 ret void
6868}
6969
@@ -74,8 +74,8 @@ define void @prefetchu_l1(ptr %ptr) {
7474; CHECK-PTX64-EMPTY:
7575; CHECK-PTX64-NEXT: // %bb.0:
7676; CHECK-PTX64-NEXT: ld.param.u64 %rd1, [prefetchu_l1_param_0];
77- ; CHECK-PTX64-NEXT: prefetchu.L1.evictnormal [%rd1];
77+ ; CHECK-PTX64-NEXT: prefetchu.L1 [%rd1];
7878; CHECK-PTX64-NEXT: ret;
79- tail call void @llvm.nvvm.prefetchu.L1.evictnormal (ptr %ptr )
79+ tail call void @llvm.nvvm.prefetchu.L1 (ptr %ptr )
8080 ret void
8181}
0 commit comments