@@ -33,14 +33,12 @@ gpu.module @kernels {
3333 // CHECK-SUB: %[[V2:.+]] = vector.insert %[[R2]], %[[V1]] [4] : f16 into vector<5xf16>
3434 // CHECK-SUB: "test.consume"(%[[V2]]) : (vector<5xf16>) -> ()
3535 // CHECK-DPP-COUNT-6: amdgpu.dpp
36- // CHECK-DPP: rocdl.readlane
3736 %sum0 = gpu.subgroup_reduce add %arg0 : (vector <5 xf16 >) -> (vector <5 xf16 >)
3837 " test.consume" (%sum0 ) : (vector <5 xf16 >) -> ()
3938
4039 // CHECK-SUB-COUNT-3: gpu.subgroup_reduce mul {{.+}} uniform
4140 // CHECK-SUB: "test.consume"
4241 // CHECK-DPP-COUNT-6: amdgpu.dpp
43- // CHECK-DPP: rocdl.readlane
4442 %sum1 = gpu.subgroup_reduce mul %arg0 uniform : (vector <5 xf16 >) -> (vector <5 xf16 >)
4543 " test.consume" (%sum1 ) : (vector <5 xf16 >) -> ()
4644
@@ -71,14 +69,12 @@ gpu.module @kernels {
7169 // CHECK-SUB: %[[V0:.+]] = vector.broadcast %[[R0]] : f32 to vector<1xf32>
7270 // CHECK-SUB: "test.consume"(%[[V0]]) : (vector<1xf32>) -> ()
7371 // CHECK-DPP-COUNT-6: amdgpu.dpp
74- // CHECK-DPP: rocdl.readlane
7572 %sum0 = gpu.subgroup_reduce add %arg0 : (vector <1 xf32 >) -> (vector <1 xf32 >)
7673 " test.consume" (%sum0 ) : (vector <1 xf32 >) -> ()
7774
7875 // CHECK-SUB: gpu.subgroup_reduce add {{.+}} uniform : (f32) -> f32
7976 // CHECK-SUB: "test.consume"
8077 // CHECK-DPP-COUNT-6: amdgpu.dpp
81- // CHECK-DPP: rocdl.readlane
8278 %sum1 = gpu.subgroup_reduce add %arg0 uniform : (vector <1 xf32 >) -> (vector <1 xf32 >)
8379 " test.consume" (%sum1 ) : (vector <1 xf32 >) -> ()
8480
@@ -148,7 +144,6 @@ gpu.module @kernels {
148144 // CHECK-SHFL: "test.consume"(%[[A4]]) : (i32) -> ()
149145
150146 // CHECK-DPP-COUNT-6: amdgpu.dpp
151- // CHECK-DPP: rocdl.readlane
152147 %sum0 = gpu.subgroup_reduce add %arg0 : (i32 ) -> i32
153148 " test.consume" (%sum0 ) : (i32 ) -> ()
154149
@@ -282,7 +277,6 @@ gpu.module @kernels {
282277 // CHECK-SHFL: %[[AL:.+]] = arith.addi {{.+}} : i16
283278 // CHECK-SHFL: "test.consume"(%[[AL]]) : (i16) -> ()
284279 // CHECK-DPP-COUNT-6: amdgpu.dpp
285- // CHECK-DPP: rocdl.readlane
286280 %sum0 = gpu.subgroup_reduce add %arg0 : (i16 ) -> i16
287281 " test.consume" (%sum0 ) : (i16 ) -> ()
288282
0 commit comments