@@ -715,18 +715,11 @@ ggml_tensor * llm_build_qwen3next::build_qwen3next_linear_attn_layer(llm_graph_i
715715 // cb(conv_output_proper, "conv_output_proper", il);
716716
717717 conv_output_proper = ggml_transpose (ctx0, conv_output_proper);
718- conv_output_proper = ggml_cont_4d (ctx0, conv_output_proper, qkv_dim, 1 , n_seq_tokens, n_seqs);
719718
720719 ggml_tensor * conv_output_silu = ggml_silu (ctx0, conv_output_proper);
721720 cb (conv_output_silu, " conv_output_silu" , il);
722721
723- conv_output_proper = ggml_reshape_2d (ctx0, conv_output_silu, n_seq_tokens * n_seqs, qkv_dim);
724- cb (conv_output_proper, " conv_output_final" , il);
725-
726- ggml_tensor * conv_transposed = ggml_transpose (ctx0, conv_output_proper);
727- cb (conv_transposed, " conv_transposed" , il);
728-
729- ggml_tensor * conv_qkv_mix = ggml_cont_2d (ctx0, conv_transposed, qkv_dim, n_seq_tokens * n_seqs);
722+ ggml_tensor * conv_qkv_mix = ggml_cont_2d (ctx0, conv_output_silu, qkv_dim, n_seq_tokens * n_seqs);
730723 cb (conv_qkv_mix, " conv_qkv_mix" , il);
731724
732725 // Extract the convolved Q, K, V from conv_output
0 commit comments