@@ -529,9 +529,8 @@ export const BedrockChatCompleteResponseTransform: (
   }

   if ('output' in response) {
-    const shouldSendCacheUsage =
-      response.usage.cacheWriteInputTokens ||
-      response.usage.cacheReadInputTokens;
+    const cacheReadInputTokens = response.usage?.cacheReadInputTokens || 0;
+    const cacheWriteInputTokens = response.usage?.cacheWriteInputTokens || 0;

     let content: string = '';
     content = response.output.message.content
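A note on the `|| 0` defaulting above: Bedrock only reports the cache token fields when prompt caching is in play, so they can be `undefined`, and the later hunks add them into `prompt_tokens`. A minimal, self-contained sketch of the failure mode this avoids (the `BedrockUsage` interface and the numbers are invented for illustration; only the optional cache fields are taken from the diff):

```ts
// Hypothetical slice of Bedrock's usage object; the cache fields are
// optional because Bedrock omits them when prompt caching is not used.
interface BedrockUsage {
  inputTokens: number;
  cacheReadInputTokens?: number;
  cacheWriteInputTokens?: number;
}

const usage: BedrockUsage = { inputTokens: 120 }; // no caching on this request

// Without defaulting, the later sum is poisoned: 120 + undefined === NaN.
const broken = usage.inputTokens + usage.cacheReadInputTokens!; // NaN

// The pattern the diff adopts: default missing cache counts to 0.
const cacheReadInputTokens = usage.cacheReadInputTokens || 0;
const safe = usage.inputTokens + cacheReadInputTokens; // 120

console.log(broken, safe); // NaN 120
```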
@@ -565,12 +564,19 @@ export const BedrockChatCompleteResponseTransform: (
         },
       ],
       usage: {
-        prompt_tokens: response.usage.inputTokens,
+        prompt_tokens:
+          response.usage.inputTokens +
+          cacheReadInputTokens +
+          cacheWriteInputTokens,
         completion_tokens: response.usage.outputTokens,
         total_tokens: response.usage.totalTokens, // contains the cache usage as well
-        ...(shouldSendCacheUsage && {
-          cache_read_input_tokens: response.usage.cacheReadInputTokens,
-          cache_creation_input_tokens: response.usage.cacheWriteInputTokens,
+        prompt_tokens_details: {
+          cached_tokens: cacheReadInputTokens,
+        },
+        // we only want to be sending this for anthropic models and this is not openai compliant
+        ...((cacheReadInputTokens > 0 || cacheWriteInputTokens > 0) && {
+          cache_read_input_tokens: cacheReadInputTokens,
+          cache_creation_input_tokens: cacheWriteInputTokens,
         }),
       },
     };
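For reference, here is a sketch of what this mapping produces, with invented token counts (the input shape follows the fields the diff reads; every number is hypothetical). `cached_tokens` follows the OpenAI `prompt_tokens_details` convention, while the two `cache_*_input_tokens` fields are the Anthropic-style extras the comment flags as non-OpenAI-compliant:

```ts
// Hypothetical Bedrock usage for a cached request (values invented).
const response = {
  usage: {
    inputTokens: 100, // non-cached input tokens only
    outputTokens: 50,
    totalTokens: 250, // per the diff's comment, already contains cache usage
    cacheReadInputTokens: 80,
    cacheWriteInputTokens: 20,
  },
};

const cacheReadInputTokens = response.usage?.cacheReadInputTokens || 0;
const cacheWriteInputTokens = response.usage?.cacheWriteInputTokens || 0;

// Mirrors the mapping in the hunk above.
const usage = {
  prompt_tokens:
    response.usage.inputTokens + cacheReadInputTokens + cacheWriteInputTokens, // 200
  completion_tokens: response.usage.outputTokens, // 50
  total_tokens: response.usage.totalTokens, // 250
  prompt_tokens_details: { cached_tokens: cacheReadInputTokens }, // OpenAI-style
  ...((cacheReadInputTokens > 0 || cacheWriteInputTokens > 0) && {
    cache_read_input_tokens: cacheReadInputTokens, // Anthropic-style,
    cache_creation_input_tokens: cacheWriteInputTokens, // not OpenAI compliant
  }),
};

console.log(JSON.stringify(usage, null, 2));
```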
@@ -663,9 +669,9 @@ export const BedrockChatCompleteStreamChunkTransform: (

   // final chunk
   if (parsedChunk.usage) {
-    const shouldSendCacheUsage =
-      parsedChunk.usage.cacheWriteInputTokens ||
-      parsedChunk.usage.cacheReadInputTokens;
+    const cacheReadInputTokens = parsedChunk.usage?.cacheReadInputTokens || 0;
+    const cacheWriteInputTokens = parsedChunk.usage?.cacheWriteInputTokens || 0;
+
     return [
       `data: ${JSON.stringify({
         id: fallbackId,
@@ -684,10 +690,17 @@ export const BedrockChatCompleteStreamChunkTransform: (
         },
       ],
       usage: {
-        prompt_tokens: parsedChunk.usage.inputTokens,
+        prompt_tokens:
+          parsedChunk.usage.inputTokens +
+          cacheReadInputTokens +
+          cacheWriteInputTokens,
         completion_tokens: parsedChunk.usage.outputTokens,
         total_tokens: parsedChunk.usage.totalTokens,
-        ...(shouldSendCacheUsage && {
+        prompt_tokens_details: {
+          cached_tokens: cacheReadInputTokens,
+        },
+        // we only want to be sending this for anthropic models and this is not openai compliant
+        ...((cacheReadInputTokens > 0 || cacheWriteInputTokens > 0) && {
           cache_read_input_tokens: parsedChunk.usage.cacheReadInputTokens,
           cache_creation_input_tokens:
             parsedChunk.usage.cacheWriteInputTokens,
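The stream transform applies the same arithmetic to the final chunk. A quick sanity check of the invariant both hunks now share (all numbers invented; the invariant itself comes from the diff's own comment that Bedrock's `totalTokens` already contains the cache usage):

```ts
// Invented final-chunk usage, shaped like the fields the diff reads.
const parsedChunk = {
  usage: {
    inputTokens: 40,
    outputTokens: 10,
    totalTokens: 150,
    cacheReadInputTokens: 100,
    cacheWriteInputTokens: 0,
  },
};

const cacheReadInputTokens = parsedChunk.usage?.cacheReadInputTokens || 0;
const cacheWriteInputTokens = parsedChunk.usage?.cacheWriteInputTokens || 0;

const prompt_tokens =
  parsedChunk.usage.inputTokens + cacheReadInputTokens + cacheWriteInputTokens; // 140

// prompt + completion should equal Bedrock's cache-inclusive total.
console.assert(
  prompt_tokens + parsedChunk.usage.outputTokens ===
    parsedChunk.usage.totalTokens,
  'prompt_tokens + completion_tokens should equal totalTokens'
);
```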