Skip to content

Commit 199df0e

Browse files
committed
Putting ntload back and removing the missed barrier
1 parent 2efba3c commit 199df0e

File tree

1 file changed

+1
-3
lines changed

1 file changed

+1
-3
lines changed

algorithms/sycl/Reduction.cpp

Lines changed: 1 addition & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -101,12 +101,10 @@ namespace {
101 101
for (std::size_t i = 0; i < itemsPerWorkItem*workGroupSize; i += workGroupSize) {
102 102
const auto id = baseIdx + i;
103 103
if(id < size){
104 -
threadAcc = operation(threadAcc, static_cast<AccT>(&buffer[id]));
104 +
threadAcc = operation(threadAcc, static_cast<AccT>(ntload(&buffer[id])));
105 105
}
106 106
}
107 107

108 -
idx.barrier(sycl::access::fence_space::local_space);
109 -
110 108
const auto reducedValue = sycl::reduce_over_group(idx.get_group(), threadAcc, operation);
111 109

112 110
if(localId == 0){

0 commit comments

Comments
 (0)