We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent c87dd7e, commit dfc5c0b. Copy full SHA for dfc5c0b
ggml/src/ggml-sycl/set_rows.cpp
@@ -68,10 +68,10 @@ static void set_rows_sycl(
68
const size_t src_type_size, const size_t dst_type_size,
69
queue_ptr stream) {
70
71
- const int max_threads_per_row = 128; // KEEPING 128 for now
+ const int max_threads_per_row = 256; // KEEPING 256 for now
72
const int threads_per_row = std::min((int)ne00, max_threads_per_row);
73
74
- const int max_threads_per_block = 128;
+ const int max_threads_per_block = 256;
75
const int rows_per_block = std::max(1, max_threads_per_block / threads_per_row);
76
77
const sycl::range<3> block_size(1, rows_per_block, threads_per_row);
0 commit comments