We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 2efba3c, commit 199df0e. Copy full SHA for 199df0e
algorithms/sycl/Reduction.cpp
@@ -101,12 +101,10 @@ namespace {
101
for (std::size_t i = 0; i < itemsPerWorkItem*workGroupSize; i += workGroupSize) {
102
const auto id = baseIdx + i;
103
if(id < size){
104
- threadAcc = operation(threadAcc, static_cast<AccT>(&buffer[id]));
+ threadAcc = operation(threadAcc, static_cast<AccT>(ntload(&buffer[id])));
105
}
106
107
108
- idx.barrier(sycl::access::fence_space::local_space);
109
-
110
const auto reducedValue = sycl::reduce_over_group(idx.get_group(), threadAcc, operation);
111
112
if(localId == 0){
0 commit comments