1 parent adea1c9 commit cfebb6e
src/llama-graph.cpp
@@ -1243,8 +1243,9 @@ llm_graph_input_attn_no_cache * llm_graph_context::build_attn_inp_no_cache() const
 }
 
 llm_graph_input_attn_no_cache * llm_graph_context::build_attn_inp_no_cache_iswa() const {
-    // Default sliding window size - can be made configurable via cparams
-    const int n_swa = 128;
+    // Use the sliding window size from hyperparameters
+    // If hparams.n_swa is 0, use a default value (128)
+    const int n_swa = hparams.n_swa > 0 ? hparams.n_swa : 128;
 
     auto inp = std::make_unique<llm_graph_input_attn_no_cache>(hparams, cparams, n_swa);
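For context, below is a minimal, self-contained sketch of the idea behind this change: resolve a sliding-window size from a hyperparameter with a fallback default, then use it to restrict which positions a token can attend to. The helper names (resolve_n_swa, build_swa_mask) are illustrative only and are not part of llama.cpp's actual API.

// Illustrative sketch; helper names are hypothetical, not llama.cpp functions.
#include <cstdint>
#include <vector>

// Prefer the model hyperparameter; fall back to a default of 128 when it is 0.
static int resolve_n_swa(uint32_t hparams_n_swa) {
    return hparams_n_swa > 0 ? (int) hparams_n_swa : 128;
}

// Build a causal sliding-window mask: token i may attend to token j only if
// j <= i (causality) and i - j < n_swa (within the window).
static std::vector<std::vector<bool>> build_swa_mask(int n_tokens, int n_swa) {
    std::vector<std::vector<bool>> mask(n_tokens, std::vector<bool>(n_tokens, false));
    for (int i = 0; i < n_tokens; ++i) {
        for (int j = 0; j <= i; ++j) {
            if (i - j < n_swa) {
                mask[i][j] = true;
            }
        }
    }
    return mask;
}

int main() {
    const int n_swa = resolve_n_swa(0);          // hyperparameter unset: falls back to 128
    const auto mask = build_swa_mask(8, n_swa);  // with n_swa >= 8, all causal positions are visible
    return mask[7][0] ? 0 : 1;
}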