Skip to content

Commit 7e8e1a0

Browse files
committed
re-added cacheless logic
1 parent 04167d9 commit 7e8e1a0

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

src/llama-model.cpp

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -8221,7 +8221,7 @@ struct llm_build_modern_bert : public llm_graph_context {
8221 8221

8222 8222
ggml_tensor * inp_out_ids = build_inp_out_ids();
8223 8223

8224-
auto * inp_attn = build_attn_inp_kv_iswa(); // TODO: support cacheless iSWA embeddings [TAG_NO_CACHE_ISWA]
8224+
auto * inp_attn = build_attn_inp_no_cache();
8225 8225

8226 8226
for (int il = 0; il < n_layer; ++il) {
8227 8227
ggml_tensor * cur = inpL;
@@ -19831,7 +19831,7 @@ llama_memory_i * llama_model::create_memory(const llama_memory_params & params,
19831 19831
case LLM_ARCH_NOMIC_BERT_MOE:
19832 19832
case LLM_ARCH_NEO_BERT:
19833 19833
case LLM_ARCH_WAVTOKENIZER_DEC:
19834-
//case LLM_ARCH_MODERN_BERT: // TODO: disabled until cacheless SWA logic is fixed [TAG_NO_CACHE_ISWA]
19834+
case LLM_ARCH_MODERN_BERT:
19835 19835
case LLM_ARCH_GEMMA_EMBEDDING:
19836 19836
case LLM_ARCH_DREAM:
19837 19837
case LLM_ARCH_LLADA:

0 commit comments

Comments
 (0)