@@ -1856,18 +1856,15 @@ llm_graph_input_mem_hybrid * llm_graph_context::build_inp_mem_hybrid() const {
18561856void llm_graph_context::build_dense_out (
18571857 ggml_tensor * dense_2,
18581858 ggml_tensor * dense_3) const {
1859- if (!cparams.embeddings ) {
1859+ if (!cparams.embeddings || dense_2 == nullptr || dense_3 == nullptr ) {
18601860 return ;
18611861 }
1862- ggml_tensor * cur = res->get_embd_pooled ();
1863- if (dense_2 != nullptr ) {
1864- cur = ggml_mul_mat (ctx0, dense_2, cur);
1865- cb (cur, " result_embd_pooled" , -1 );
1866- }
1867- if (dense_3 != nullptr ) {
1868- cur = ggml_mul_mat (ctx0, dense_3, cur);
1869- cb (cur, " result_embd_pooled" , -1 );
1870- }
1862+ ggml_tensor * cur = res->t_embd_pooled != nullptr ? res->t_embd_pooled : res->t_embd ;
1863+ GGML_ASSERT (cur != nullptr && " missing t_embd_pooled/t_embd" );
1864+
1865+ cur = ggml_mul_mat (ctx0, dense_2, cur);
1866+ cur = ggml_mul_mat (ctx0, dense_3, cur);
1867+ cb (cur, " result_embd_pooled" , -1 );
18711868 res->t_embd_pooled = cur;
18721869 ggml_build_forward_expand (gf, cur);
18731870}
0 commit comments