@@ -73,8 +73,8 @@ class device_kernel_w_linear {
7373 constexpr auto PADDING_SIZE_uz = static_cast <std::size_t >(PADDING_SIZE);
7474
7575 // calculate the indices used in the current work-item
76- const auto feature_idx = (idx.get_id (1 ) + grid_x_offset_ * THREAD_BLOCK_SIZE_uz) * INTERNAL_BLOCK_SIZE_uz; // num_features
77- const auto class_idx = (idx.get_id (0 ) + grid_y_offset_ * THREAD_BLOCK_SIZE_uz) * INTERNAL_BLOCK_SIZE_uz; // num_classes
76+ const auto feature_idx = (idx.get_id (1 ) + grid_y_offset_ * THREAD_BLOCK_SIZE_uz) * INTERNAL_BLOCK_SIZE_uz; // num_features
77+ const auto class_idx = (idx.get_id (0 ) + grid_x_offset_ * THREAD_BLOCK_SIZE_uz) * INTERNAL_BLOCK_SIZE_uz; // num_classes
7878
7979 // create a work-item private array used for internal caching
8080 std::array<std::array<real_type, INTERNAL_BLOCK_SIZE_uz>, INTERNAL_BLOCK_SIZE_uz> temp{};
@@ -185,8 +185,8 @@ class device_kernel_predict_linear {
185185 constexpr auto PADDING_SIZE_uz = static_cast <std::size_t >(PADDING_SIZE);
186186
187187 // calculate the indices used in the current work-item
188- const auto pp_idx = (idx.get_id (1 ) + grid_x_offset_ * THREAD_BLOCK_SIZE_uz) * INTERNAL_BLOCK_SIZE_uz; // num_predict_points
189- const auto class_idx = (idx.get_id (0 ) + grid_y_offset_ * THREAD_BLOCK_SIZE_uz) * INTERNAL_BLOCK_SIZE_uz; // num_classes
188+ const auto pp_idx = (idx.get_id (1 ) + grid_y_offset_ * THREAD_BLOCK_SIZE_uz) * INTERNAL_BLOCK_SIZE_uz; // num_predict_points
189+ const auto class_idx = (idx.get_id (0 ) + grid_x_offset_ * THREAD_BLOCK_SIZE_uz) * INTERNAL_BLOCK_SIZE_uz; // num_classes
190190
191191 // create a work-item private array used for internal caching
192192 std::array<std::array<real_type, INTERNAL_BLOCK_SIZE_uz>, INTERNAL_BLOCK_SIZE_uz> temp{};
@@ -305,8 +305,8 @@ class device_kernel_predict {
305305 constexpr auto PADDING_SIZE_uz = static_cast <std::size_t >(PADDING_SIZE);
306306
307307 // calculate the indices used in the current work-item
308- const auto pp_idx = (idx.get_id (1 ) + grid_x_offset_ * THREAD_BLOCK_SIZE_uz) * INTERNAL_BLOCK_SIZE_uz; // num_predict_points
309- const auto sv_idx = (idx.get_id (0 ) + grid_y_offset_ * THREAD_BLOCK_SIZE_uz) * INTERNAL_BLOCK_SIZE_uz; // num_support_vectors
308+ const auto pp_idx = (idx.get_id (1 ) + grid_y_offset_ * THREAD_BLOCK_SIZE_uz) * INTERNAL_BLOCK_SIZE_uz; // num_predict_points
309+ const auto sv_idx = (idx.get_id (0 ) + grid_x_offset_ * THREAD_BLOCK_SIZE_uz) * INTERNAL_BLOCK_SIZE_uz; // num_support_vectors
310310
311311 // create a work-item private array used for internal caching
312312 std::array<std::array<real_type, INTERNAL_BLOCK_SIZE_uz>, INTERNAL_BLOCK_SIZE_uz> temp{};
0 commit comments