@@ -53,28 +53,37 @@ static void batch_decode(llama_context * ctx, llama_batch & batch, float * outpu
         }
     }
 
-    for (int i = 0; i < batch.n_tokens; i++) {
-        if (!batch.logits[i]) {
-            continue;
-        }
+    const float * embd = nullptr;
+    int embd_pos = 0;
 
-        const float * embd = nullptr;
-        int embd_pos = 0;
+    if (pooling_type == LLAMA_POOLING_TYPE_NONE)
+    {
+        for (int i = 0; i < batch.n_tokens; i++)
+        {
+            if (!batch.logits[i]) {
+                continue;
+            }
 
-        if (pooling_type == LLAMA_POOLING_TYPE_NONE) {
-            // try to get token embeddings
             embd = llama_get_embeddings_ith(ctx, i);
             embd_pos = i;
             GGML_ASSERT(embd != NULL && "failed to get token embeddings");
-        } else {
-            // try to get sequence embeddings - supported only when pooling_type is not NONE
-            embd = llama_get_embeddings_seq(ctx, batch.seq_id[i][0]);
-            embd_pos = batch.seq_id[i][0];
-            GGML_ASSERT(embd != NULL && "failed to get sequence embeddings");
+
+            float * out = output + embd_pos * n_embd;
+            common_embd_normalize(embd, out, n_embd, embd_norm);
         }
+    }
 
-        float * out = output + embd_pos * n_embd;
-        common_embd_normalize(embd, out, n_embd, embd_norm);
+    else
+    {
+        for (int i = 0; i < n_seq; i++)
+        {
+            embd = llama_get_embeddings_seq(ctx, i);
+            embd_pos = i;
+            GGML_ASSERT(embd != NULL && "failed to get sequence embeddings");
+
+            float * out = output + embd_pos * n_embd;
+            common_embd_normalize(embd, out, n_embd, embd_norm);
+        }
     }
 }
 
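A minimal caller-side sketch of what the reworked loop implies for output sizing. This is not part of the commit; the parameter names n_seq, n_embd, and embd_norm are assumptions taken from the function body, since the hunk header truncates the signature:

#include <vector>
#include "llama.h"

// Hypothetical helper, not part of this commit. With pooling enabled the
// reworked loop writes one embedding per sequence; with
// LLAMA_POOLING_TYPE_NONE it still writes one embedding per output token,
// so the output buffer is sized accordingly before calling batch_decode.
static std::vector<float> decode_embeddings(llama_context * ctx, llama_batch & batch,
                                            int n_seq, int n_embd, int embd_norm) {
    const bool no_pooling = llama_pooling_type(ctx) == LLAMA_POOLING_TYPE_NONE;
    const size_t n_rows   = no_pooling ? (size_t) batch.n_tokens : (size_t) n_seq;

    std::vector<float> output(n_rows * n_embd);
    batch_decode(ctx, batch, output.data(), n_seq, n_embd, embd_norm);
    return output;
}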