@@ -185,38 +185,37 @@ UR_APIEXPORT ur_result_t UR_APICALL urEnqueueKernelLaunch(
185185 rangeEnd[1 ] = (rangeEnd[3 ] / numWG0) % numWG1;
186186 rangeEnd[2 ] = rangeEnd[3 ] / (numWG0 * numWG1);
187187 Tasks.schedule ([ndr, InEvents, &kernel = *kernel, rangeStart,
188- rangeEnd = rangeEnd[3 ], numWG0, numWG1,
189- numParallelThreads](size_t threadId) {
190- auto state = getState (ndr);
191- InEvents.wait ();
192- for (size_t g0 = rangeStart[0 ], g1 = rangeStart[1 ],
193- g2 = rangeStart[ 2 ], g3 = rangeStart[3 ];
194- g3 < rangeEnd; ++g3) {
188+ rangeEnd = rangeEnd[3 ], numWG0, numWG1,
189+ numParallelThreads](size_t threadId) {
190+ auto state = getState (ndr);
191+ InEvents.wait ();
192+ for (size_t g0 = rangeStart[0 ], g1 = rangeStart[1 ], g2 = rangeStart[ 2 ],
193+ g3 = rangeStart[3 ];
194+ g3 < rangeEnd; ++g3) {
195195#ifdef NATIVECPU_USE_OCK
196- state.update (g0, g1, g2);
197- kernel._subhandler (
198- kernel. getArgs (numParallelThreads, threadId). data (), &state);
196+ state.update (g0, g1, g2);
197+ kernel._subhandler (kernel. getArgs (numParallelThreads, threadId). data (),
198+ &state);
199199#else
200- for (size_t local2 = 0 ; local2 < ndr.LocalSize [2 ]; ++local2) {
201- for (size_t local1 = 0 ; local1 < ndr.LocalSize [1 ]; ++local1) {
202- for (size_t local0 = 0 ; local0 < ndr.LocalSize [0 ]; ++local0) {
203- state.update (g0, g1, g2, local0, local1, local2);
204- kernel._subhandler (
205- kernel.getArgs (numParallelThreads, threadId).data (),
206- &state);
207- }
208- }
200+ for (size_t local2 = 0 ; local2 < ndr.LocalSize [2 ]; ++local2) {
201+ for (size_t local1 = 0 ; local1 < ndr.LocalSize [1 ]; ++local1) {
202+ for (size_t local0 = 0 ; local0 < ndr.LocalSize [0 ]; ++local0) {
203+ state.update (g0, g1, g2, local0, local1, local2);
204+ kernel._subhandler (
205+ kernel.getArgs (numParallelThreads, threadId).data (), &state);
209206 }
207+ }
208+ }
210209#endif
211- if (++g0 == numWG0) {
212- g0 = 0 ;
213- if (++g1 == numWG1) {
214- g1 = 0 ;
215- ++g2;
216- }
217- }
210+ if (++g0 == numWG0) {
211+ g0 = 0 ;
212+ if (++g1 == numWG1) {
213+ g1 = 0 ;
214+ ++g2;
218215 }
219- });
216+ }
217+ }
218+ });
220219 rangeStart = rangeEnd;
221220 }
222221 event->set_futures (Tasks.getTaskInfo ());
0 commit comments