
Commit 11b0b54

fix(llama.cu): fix compilation issues caused by dependency updates
Signed-off-by: PanZezhong <[email protected]>
1 parent 137c398 commit 11b0b54

3 files changed: 16 additions, 12 deletions


Cargo.lock

Lines changed: 12 additions & 11 deletions
Diff not rendered (generated file).

README.md

Lines changed: 2 additions & 1 deletion
@@ -129,7 +129,8 @@ Options:
 path = "model-path"
 gpus = [0, 1, 2, 3]
 max-tokens = 4096
-think = true
 temperature = 0.9
 top-p = 0.6
+repetition_penalty = 1.02
+think = true
 ```
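
Read together, the part of the README's example configuration covered by this hunk ends up as follows after the commit (a sketch showing only the keys visible in the diff; surrounding lines of the config block are unchanged and not shown):

```toml
path = "model-path"
gpus = [0, 1, 2, 3]
max-tokens = 4096
temperature = 0.9
top-p = 0.6
repetition_penalty = 1.02
think = true
```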

llama.cu/src/model/qw2vl_mmproj.rs

Lines changed: 2 additions & 0 deletions
@@ -52,6 +52,8 @@ impl GGufModel<'_> {
                 get(&format!("v.blk.{iblk}.attn_qkv.weight")),
                 Some((dt_norm, get(&format!("v.blk.{iblk}.attn_qkv.bias")))),
             ),
+            q_norm: None,
+            k_norm: None,
             rope: Some(RoPE {
                 multimodal: true,
                 nctx: 34, // todo: from image
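
The two added lines point at the nature of the compile break: a struct coming from an updated dependency gained `q_norm` and `k_norm` fields, and a Rust struct literal must supply every field, so the existing initializer in `qw2vl_mmproj.rs` stopped compiling until the new fields were filled in. A minimal, self-contained sketch of that failure mode and the fix (hypothetical `Attention`/`Normalization` types, not the actual types used by llama.cu or its dependency):

```rust
// Hypothetical stand-ins for the dependency's types; every name and field
// other than q_norm/k_norm is an assumption for illustration only.
#[allow(dead_code)]
struct Normalization;

#[allow(dead_code)]
struct Attention {
    qkv_bias: bool,
    q_norm: Option<Normalization>, // newly added by the dependency update
    k_norm: Option<Normalization>, // newly added by the dependency update
}

fn main() {
    // Before the fix this literal omitted q_norm/k_norm and failed with
    // "missing fields `q_norm` and `k_norm` in initializer of `Attention`".
    let _attn = Attention {
        qkv_bias: true,
        q_norm: None, // presumably no separate Q-norm tensor in these vision blocks
        k_norm: None, // likewise for K-norm
    };
}
```

Setting both fields to `None` keeps the previous behavior while satisfying the updated struct definition.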
