Skip to content

Commit 54bb6f1

Browse files
committed
argh again
1 parent 20424d8 commit 54bb6f1

File tree

2 files changed

+7 -5 lines changed

2 files changed

+7 -5 lines changed
Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,3 @@
1+
export MODEL_PATH=/devel/tools/llama.cpp/reference/theo77186_Qwen3-Next-70M-TinyStories
2+
export CONVERTED_MODEL=/devel/tools/llama.cpp/reference/theo77186_Qwen3-Next-70M-TinyStories/theo77186_Qwen3-Next-70M-TinyStories.gguf
3+
make causal-verify-logits

src/models/llm_build_qwen3next.cpp

Lines changed: 4 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -279,14 +279,13 @@ struct ggml_tensor * llm_build_qwen3next::delta_net(
279 279
cb(q, "q_postscale", il);
280 280
cb(beta, "beta_sigmoid", il);
281 281

282-
// Pad first along the token dimension
283-
q = ggml_pad(ctx, q, 0, 0, pad_size, 0);
284-
k = ggml_pad(ctx, k, 0, 0, pad_size, 0);
285-
v = ggml_pad(ctx, v, 0, 0, pad_size, 0);
286-
287 282
q = ggml_cont(ctx, ggml_permute(ctx, q, 0, 2, 1, 3));
288 283
k = ggml_cont(ctx, ggml_permute(ctx, k, 0, 2, 1, 3));
289 284
v = ggml_cont(ctx, ggml_permute(ctx, v, 0, 2, 1, 3));
285+
286+
q = ggml_pad(ctx, q, 0, pad_size, 0, 0);
287+
k = ggml_pad(ctx, k, 0, pad_size, 0, 0);
288+
v = ggml_pad(ctx, v, 0, pad_size, 0, 0);
290 289

291 290
beta = ggml_cont(ctx, ggml_permute(ctx, beta, 1, 2, 0, 3));
292 291
cb(beta, "beta_reshape", il);

0 commit comments

Comments (0)