Skip to content

Commit 525978f

Browse files
committed
build(llama.cu): 更新 InfiniNN
Signed-off-by: YdrMaster <ydrml@hotmail.com>
1 parent 5e8be04 commit 525978f

File tree

3 files changed

+8
-6
lines changed

3 files changed

+8
-6
lines changed

Cargo.lock

Lines changed: 5 additions & 5 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

llama.cu/Cargo.toml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -7,7 +7,7 @@ edition.workspace = true
 operators = { git = "https://github.com/YdrMaster/operators-rs", rev = "01b39e8", default-features = false, features = [
 "nvidia-gpu",
 ] }
-nn = { git = "https://github.com/YdrMaster/InfiniNN", rev = "7b01a0e" }
+nn = { git = "https://github.com/YdrMaster/InfiniNN", rev = "e3061d6" }
 ggus = { git = "https://github.com/InfiniTensor/gguf", rev = "23c362f" }
 tokeneer = { git = "https://github.com/InfiniTensor/tokeneer", rev = "c48f39f" }

llama.cu/src/model/llama.rs

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -68,6 +68,8 @@ impl GGufModel<'_> {
 get(&format!("blk.{iblk}.attn_qkv.weight")),
 dt_bias.map(|dt| (dt, get(&format!("blk.{iblk}.attn_qkv.bias")))),
 ),
+q_norm: None,
+k_norm: None,
 rope: Some(RoPE {
 multimodal: false,
 nctx,

0 commit comments

Comments
 (0)