@@ -62,8 +62,8 @@ class device_kernel_w_linear {
6262 template <typename T>
6363 void operator ()(T group) const {
6464 ::sycl::memory_environment (group,
65- ::sycl::require_local_mem<real_type[FEATURE_BLOCK_SIZE ][INTERNAL_BLOCK_SIZE * THREAD_BLOCK_SIZE]>(),
66- ::sycl::require_local_mem<real_type[FEATURE_BLOCK_SIZE ][INTERNAL_BLOCK_SIZE * THREAD_BLOCK_SIZE]>(),
65+ ::sycl::require_local_mem<real_type[THREAD_BLOCK_SIZE ][INTERNAL_BLOCK_SIZE * THREAD_BLOCK_SIZE]>(),
66+ ::sycl::require_local_mem<real_type[THREAD_BLOCK_SIZE ][INTERNAL_BLOCK_SIZE * THREAD_BLOCK_SIZE]>(),
6767 ::sycl::require_private_mem<std::size_t>(),
6868 ::sycl::require_private_mem<std::size_t>(),
6969 ::sycl::require_private_mem<std::size_t>(),
@@ -104,8 +104,8 @@ class device_kernel_w_linear {
104104 const auto global_class_idx = class_idx_linear (idx) + static_cast <std::size_t >(internal) * THREAD_BLOCK_SIZE_uz;
105105 const auto global_feature_idx = feature_idx_linear (idx) + static_cast <std::size_t >(internal) * THREAD_BLOCK_SIZE_uz;
106106
107- data_cache_feature[local_id_0][internal * THREAD_BLOCK_SIZE + local_id_1] = sv_d_[global_feature_idx * (device_specific_num_sv_ + PADDING_SIZE_uz) + sv + sv_offset_ + threadIdx_x]; // SoA
108- data_cache_alpha[local_id_0][internal * THREAD_BLOCK_SIZE + local_id_1] = alpha_d_[global_class_idx * (num_sv_ + PADDING_SIZE_uz) + sv + threadIdx_x]; // AoS
107+ data_cache_feature[local_id_0][internal * THREAD_BLOCK_SIZE + local_id_1] = sv_d_[global_feature_idx * (device_specific_num_sv_ + PADDING_SIZE_uz) + sv + threadIdx_x]; // SoA
108+ data_cache_alpha[local_id_0][internal * THREAD_BLOCK_SIZE + local_id_1] = alpha_d_[global_class_idx * (num_sv_ + PADDING_SIZE_uz) + sv + sv_offset_ + threadIdx_x]; // AoS
109109 }
110110 });
111111
0 commit comments