zilliztech
diff --git a/packages/core/src/embedding/gemini-embedding.test.ts b/packages/core/src/embedding/gemini-embedding.test.ts
Lines changed: 305 additions & 0 deletions
@@ -0,0 +1,305 @@
+import { GoogleGenAI } from '@google/genai';
+import { GeminiEmbedding } from './gemini-embedding';
+import type { EmbeddingVector } from './base-embedding';
+
+// Shared stub standing in for `models.embedContent` on every mocked client.
+// Keep the `mock` name prefix: Jest's hoisting of jest.mock() only permits the
+// factory to reference outer variables whose names start with `mock`.
+const mockEmbedContent = jest.fn();
+
+// Replace the SDK with a constructor mock whose instances expose only
+// `models.embedContent`, wired to the shared stub above.
+jest.mock('@google/genai', () => ({
+  GoogleGenAI: jest.fn().mockImplementation(() => {
+    const models = { embedContent: mockEmbedContent };
+    return { models };
+  }),
+}));
+
+// Typed handle on the mocked constructor so the suite can clear its call history.
+const MockGoogleGenAI = GoogleGenAI as unknown as jest.Mock;
+
+describe('GeminiEmbedding Retry Mechanism', () => {
+  let consoleLogSpy: jest.SpyInstance;
+
+  // Runs before every test: returns the shared mocks to a known state and
+  // silences console.log while recording calls so tests can assert on log output.
+  beforeEach(() => {
+    jest.resetModules();
+    // mockReset (not mockClear): mockClear only wipes call history, so a
+    // persistent mockResolvedValue/mockRejectedValue or an unconsumed
+    // ...Once value from an earlier test would otherwise leak into this one.
+    mockEmbedContent.mockReset();
+    // mockClear on purpose: mockReset would also drop the constructor
+    // implementation installed by the jest.mock factory.
+    MockGoogleGenAI.mockClear();
+    consoleLogSpy = jest.spyOn(console, 'log').mockImplementation(() => {});
+  });
+
+  // Put the real console.log back once each test has finished.
+  afterEach(() => consoleLogSpy.mockRestore());
+
+  describe('Single Embedding with Retry', () => {
+    // Builds the client under test with the retry settings a scenario needs.
+    const createClient = (maxRetries: number, baseDelay: number) =>
+      new GeminiEmbedding({
+        model: 'gemini-embedding-001',
+        apiKey: 'test-key',
+        maxRetries,
+        baseDelay,
+      });
+
+    // Fresh single-embedding payload in the shape the mocked embedContent resolves with.
+    const singlePayload = () => ({ embeddings: [{ values: [0.1, 0.2, 0.3] }] });
+
+    // What embed() is expected to return for singlePayload().
+    const expectedEmbedding = () => ({ vector: [0.1, 0.2, 0.3], dimension: 3 });
+
+    // Error whose message the scenarios below expect to trigger a retry.
+    const overloadedError = () =>
+      new Error('503 Service Unavailable: The model is overloaded. Please try again later.');
+
+    it('should succeed on first attempt', async () => {
+      const client = createClient(3, 100);
+      mockEmbedContent.mockResolvedValue(singlePayload());
+
+      const embedded = await client.embed('test text');
+
+      expect(embedded).toEqual(expectedEmbedding());
+      expect(mockEmbedContent).toHaveBeenCalledTimes(1);
+      expect(consoleLogSpy).not.toHaveBeenCalledWith(expect.stringContaining('retrying'));
+    });
+
+    it('should retry on 503 error and eventually succeed', async () => {
+      // Small base delay keeps the backoff short for the test run.
+      const client = createClient(3, 10);
+
+      // Two overloaded failures, then a success on the third call.
+      const failure = overloadedError();
+      const success = singlePayload();
+      mockEmbedContent.mockRejectedValueOnce(failure);
+      mockEmbedContent.mockRejectedValueOnce(failure);
+      mockEmbedContent.mockResolvedValueOnce(success);
+
+      const embedded = await client.embed('test text');
+
+      expect(embedded).toEqual(expectedEmbedding());
+      expect(mockEmbedContent).toHaveBeenCalledTimes(3);
+      expect(consoleLogSpy).toHaveBeenCalledWith(expect.stringContaining('Single embed attempt 1 failed, retrying'));
+      expect(consoleLogSpy).toHaveBeenCalledWith(expect.stringContaining('Single embed attempt 2 failed, retrying'));
+    });
+
+    it('should throw after exhausting all retries', async () => {
+      const client = createClient(2, 10);
+
+      // Every call fails, so the attempt budget must run out.
+      mockEmbedContent.mockRejectedValue(overloadedError());
+
+      const pending = client.embed('test text');
+      await expect(pending).rejects.toThrow('503 Service Unavailable');
+      expect(mockEmbedContent).toHaveBeenCalledTimes(2);
+    });
+
+    it('should not retry on non-retryable errors', async () => {
+      const client = createClient(3, 10);
+
+      const unauthorized = new Error('401 Unauthorized: Invalid API key');
+      mockEmbedContent.mockRejectedValue(unauthorized);
+
+      const pending = client.embed('test text');
+      await expect(pending).rejects.toThrow('401 Unauthorized');
+      // A single call means no retry was attempted.
+      expect(mockEmbedContent).toHaveBeenCalledTimes(1);
+      expect(consoleLogSpy).not.toHaveBeenCalledWith(expect.stringContaining('retrying'));
+    });
+  });
+
+  describe('Batch Embedding with Retry and Fallback', () => {
+    // Builds the client under test; omitting `retry` leaves the retry options unset.
+    const createClient = (retry: { maxRetries?: number; baseDelay?: number } = {}) =>
+      new GeminiEmbedding({
+        model: 'gemini-embedding-001',
+        apiKey: 'test-key',
+        ...retry,
+      });
+
+    // The two inputs every scenario in this group embeds.
+    const inputs = () => ['text1', 'text2'];
+
+    // Fresh two-embedding payload in the shape the mocked embedContent resolves with.
+    const pairPayload = () => ({
+      embeddings: [
+        { values: [0.1, 0.2, 0.3] },
+        { values: [0.4, 0.5, 0.6] },
+      ],
+    });
+
+    // What embedBatch() is expected to return for the two inputs.
+    const expectedPair = () => [
+      { vector: [0.1, 0.2, 0.3], dimension: 3 },
+      { vector: [0.4, 0.5, 0.6], dimension: 3 },
+    ];
+
+    // Error whose message the scenarios below expect to trigger a retry.
+    const overloadedError = () =>
+      new Error('503 Service Unavailable: The model is overloaded. Please try again later.');
+
+    it('should succeed batch processing on first attempt', async () => {
+      const client = createClient({ maxRetries: 3, baseDelay: 100 });
+      mockEmbedContent.mockResolvedValue(pairPayload());
+
+      const embedded = await client.embedBatch(inputs());
+
+      expect(embedded).toEqual(expectedPair());
+      expect(mockEmbedContent).toHaveBeenCalledTimes(1);
+    });
+
+    it('should retry batch processing and eventually succeed', async () => {
+      const client = createClient({ maxRetries: 3, baseDelay: 10 });
+
+      // One overloaded failure, then the batch call succeeds.
+      const failure = overloadedError();
+      const success = pairPayload();
+      mockEmbedContent.mockRejectedValueOnce(failure);
+      mockEmbedContent.mockResolvedValueOnce(success);
+
+      const embedded = await client.embedBatch(inputs());
+
+      expect(embedded).toEqual(expectedPair());
+      expect(mockEmbedContent).toHaveBeenCalledTimes(2);
+      expect(consoleLogSpy).toHaveBeenCalledWith(expect.stringContaining('Attempt 1 failed with retryable error, retrying'));
+    });
+
+    it('should fallback to individual requests when batch consistently fails', async () => {
+      const client = createClient({ maxRetries: 2, baseDelay: 10 });
+
+      const batchFailure = overloadedError();
+      const firstSingle = { embeddings: [{ values: [0.1, 0.2, 0.3] }] };
+      const secondSingle = { embeddings: [{ values: [0.4, 0.5, 0.6] }] };
+
+      // Both batch attempts fail...
+      mockEmbedContent.mockRejectedValueOnce(batchFailure);
+      mockEmbedContent.mockRejectedValueOnce(batchFailure);
+      // ...then each text is answered by its own single-item response.
+      mockEmbedContent.mockResolvedValueOnce(firstSingle);
+      mockEmbedContent.mockResolvedValueOnce(secondSingle);
+
+      const embedded = await client.embedBatch(inputs());
+
+      expect(embedded).toEqual(expectedPair());
+      // 2 batch attempts + 2 individual requests.
+      expect(mockEmbedContent).toHaveBeenCalledTimes(4);
+      expect(consoleLogSpy).toHaveBeenCalledWith(expect.stringContaining('falling back to individual requests'));
+      expect(consoleLogSpy).toHaveBeenCalledWith(expect.stringContaining('Using fallback: processing 2 texts individually'));
+    });
+
+    it('should validate response array length matches input length', async () => {
+      const client = createClient();
+
+      // Only one embedding comes back for two inputs; the second is missing.
+      const shortPayload = { embeddings: [{ values: [0.1, 0.2, 0.3] }] };
+      mockEmbedContent.mockResolvedValue(shortPayload);
+
+      const pending = client.embedBatch(inputs());
+      await expect(pending).rejects.toThrow(
+        'Gemini API returned 1 embeddings but expected 2'
+      );
+    });
+  });
+
+  describe('Error Classification', () => {
+    // Client with no retry options; these tests only exercise the classifier.
+    const createClient = () =>
+      new GeminiEmbedding({
+        model: 'gemini-embedding-001',
+        apiKey: 'test-key',
+      });
+
+    it('should correctly identify retryable errors', async () => {
+      const client = createClient();
+
+      // Messages the classifier is expected to report as retryable.
+      const transientMessages = [
+        'Error: 503 Service Unavailable',
+        'Error: 429 Too Many Requests',
+        'The model is overloaded. Please try again later.',
+        'Status: UNAVAILABLE',
+        'Server is busy, please try again',
+        'Rate limit exceeded',
+        'Temporarily unavailable',
+        'Network timeout error',
+      ];
+
+      // Bracket access reaches the non-public method without a type error.
+      transientMessages.forEach((message) => {
+        expect(client['isRetryableError'](message)).toBe(true);
+      });
+    });
+
+    it('should correctly identify non-retryable errors', async () => {
+      const client = createClient();
+
+      // Messages the classifier is expected to report as not retryable.
+      const permanentMessages = [
+        'Error: 401 Unauthorized',
+        'Error: 403 Forbidden',
+        'Invalid API key provided',
+        'Model not found',
+        'Invalid request format',
+        'Quota exceeded',
+      ];
+
+      permanentMessages.forEach((message) => {
+        expect(client['isRetryableError'](message)).toBe(false);
+      });
+    });
+  });
+
+  describe('Configuration Options', () => {
+    // Makes every embedContent call fail with a 503 so the full attempt budget is used.
+    const failEveryCall = () => {
+      const unavailable = new Error('503 Service Unavailable');
+      mockEmbedContent.mockRejectedValue(unavailable);
+    };
+
+    it('should use custom retry configuration', async () => {
+      const client = new GeminiEmbedding({
+        model: 'gemini-embedding-001',
+        apiKey: 'test-key',
+        maxRetries: 5,
+        baseDelay: 50,
+      });
+      failEveryCall();
+
+      const pending = client.embed('test');
+      await expect(pending).rejects.toThrow();
+      // Call count should match the custom maxRetries.
+      expect(mockEmbedContent).toHaveBeenCalledTimes(5);
+    });
+
+    it('should use default retry configuration when not specified', async () => {
+      // Retry options deliberately left out.
+      const client = new GeminiEmbedding({
+        model: 'gemini-embedding-001',
+        apiKey: 'test-key',
+      });
+      failEveryCall();
+
+      const pending = client.embed('test');
+      await expect(pending).rejects.toThrow();
+      // The test expects the default budget to be 3 attempts.
+      expect(mockEmbedContent).toHaveBeenCalledTimes(3);
+    });
+  });
+});