We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 75520d6, commit 7e559f3 (Copy full SHA for 7e559f3)
ggml/src/ggml-cuda/ssm-scan.cu
@@ -10,7 +10,7 @@ using namespace cub;
10
#include "ssm-scan.cuh"
11
12
template <size_t splitD, size_t N, size_t L_template>
13
-__global__ void __launch_bounds__(splitD, 2)
+__global__ void __launch_bounds__(splitD, 1)
14
ssm_scan_f32(const float *__restrict__ src0, const float *__restrict__ src1, const float *__restrict__ src2,
15
const float *__restrict__ src3, const float *__restrict__ src4, const float *__restrict__ src5,
16
const int src0_nb1, const int src0_nb2, const int src1_nb1, const int src1_nb2,
0 commit comments