Skip to content

Commit 5a161d9

Browse files
committed
Remove unnecessary transposes/reshapes
1 parent 5728642 commit 5a161d9

File tree

1 file changed

+1
-8
lines changed

1 file changed

+1
-8
lines changed

src/models/llm_build_qwen3next.cpp

Lines changed: 1 addition & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -715,18 +715,11 @@ ggml_tensor * llm_build_qwen3next::build_qwen3next_linear_attn_layer(llm_graph_i
715715
// cb(conv_output_proper, "conv_output_proper", il);
716716

717717
conv_output_proper = ggml_transpose(ctx0, conv_output_proper);
718-
conv_output_proper = ggml_cont_4d(ctx0, conv_output_proper, qkv_dim, 1, n_seq_tokens, n_seqs);
719718

720719
ggml_tensor * conv_output_silu = ggml_silu(ctx0, conv_output_proper);
721720
cb(conv_output_silu, "conv_output_silu", il);
722721

723-
conv_output_proper = ggml_reshape_2d(ctx0, conv_output_silu, n_seq_tokens * n_seqs, qkv_dim);
724-
cb(conv_output_proper, "conv_output_final", il);
725-
726-
ggml_tensor * conv_transposed = ggml_transpose(ctx0, conv_output_proper);
727-
cb(conv_transposed, "conv_transposed", il);
728-
729-
ggml_tensor * conv_qkv_mix = ggml_cont_2d(ctx0, conv_transposed, qkv_dim, n_seq_tokens * n_seqs);
722+
ggml_tensor * conv_qkv_mix = ggml_cont_2d(ctx0, conv_output_silu, qkv_dim, n_seq_tokens * n_seqs);
730723
cb(conv_qkv_mix, "conv_qkv_mix", il);
731724

732725
// Extract the convolved Q, K, V from conv_output

0 commit comments

Comments
 (0)