2 files changed: +6 -2 lines changed
lines changed Original file line number Diff line number Diff line change @@ -73,7 +73,9 @@ llama_memory_context_ptr llama_memory_hybrid::init_batch(llama_batch_allocr & ba
73
73
// if all tokens are output, split by sequence
74
74
ubatch = balloc.split_seq (n_ubatch);
75
75
} else {
76
- ubatch = balloc.split_equal (n_ubatch, false );
76
+ // TODO: non-sequential equal split can be done if using unified KV cache
77
+ // for simplicity, we always use sequential equal split for now
78
+ ubatch = balloc.split_equal (n_ubatch, true );
77
79
}
78
80
79
81
if (ubatch.n_tokens == 0 ) {
Original file line number Diff line number Diff line change @@ -382,7 +382,9 @@ llama_memory_context_ptr llama_memory_recurrent::init_batch(llama_batch_allocr &
382
382
// if all tokens are output, split by sequence
383
383
ubatch = balloc.split_seq (n_ubatch);
384
384
} else {
385
- ubatch = balloc.split_equal (n_ubatch, false );
385
+ // TODO: non-sequential equal split can be done if using unified KV cache
386
+ // for simplicity, we always use sequential equal split for now
387
+ ubatch = balloc.split_equal (n_ubatch, true );
386
388
}
387
389
388
390
if (ubatch.n_tokens == 0 ) {
You can’t perform that action at this time.
0 commit comments