We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 0441ccb · commit aba30d6 (Copy full SHA for aba30d6)
src/llama-model.cpp
@@ -11906,7 +11906,7 @@ struct llm_graph_context_mamba : public llm_graph_context {
11906
for (auto chunk_i = 0; chunk_i < n_seq_tokens; chunk_i += chunk_size) {
11907
11908
// chunk views
11909
- const auto chunk_size_i = std::min(chunk_size, uint32_t(n_seq_tokens - chunk_i * chunk_size));
+ const auto chunk_size_i = std::min(chunk_size, uint32_t(n_seq_tokens - chunk_i));
11910
// slice dtA on dim 1
11911
ggml_tensor * dtA_chunk = ggml_view_3d(ctx, dtA,
11912
dtA->ne[0], chunk_size_i, dtA->ne[2],
0 commit comments