Merge branch 'main' into fix-readme

siddharthsambharia-portkey · web-flow · commit 7988e9ec0ee2 · 2025-06-25T13:41:06.000+05:30
diff --git a/plugins/default/webhook.ts b/plugins/default/webhook.ts
@@ -4,7 +4,7 @@ import {
   PluginHandler,
   PluginParameters,
 } from '../types';
-import { post } from '../utils';
+import { post, TimeoutError } from '../utils';
 
 function parseHeaders(headers: unknown): Record<string, string> {
   try {
@@ -107,20 +107,30 @@ export const handler: PluginHandler = async (
       responseData: response.data,
       requestContext: {
         headers,
-        timeout: 3000,
+        timeout: parameters.timeout || 3000,
       },
     };
   } catch (e: any) {
     error = e;
     delete error.stack;
 
+    const isTimeoutError = e instanceof TimeoutError;
+
+    const responseData = !isTimeoutError && e.response?.body;
+    const responseDataContentType = e.response?.headers?.get('content-type');
+
     data = {
       explanation: `Webhook error: ${e.message}`,
       webhookUrl: parameters.webhookURL || 'No URL provided',
       requestContext: {
         headers: parameters.headers || {},
-        timeout: 3000,
+        timeout: parameters.timeout || 3000,
       },
+      // include the parsed response body when the error is not a timeout and the body is JSON
+      ...(responseData &&
+        responseDataContentType === 'application/json' && {
+          responseData: JSON.parse(responseData),
+        }),
     };
   }
 
diff --git a/plugins/utils.ts b/plugins/utils.ts
@@ -9,6 +9,7 @@ export interface ErrorResponse {
   status: number;
   statusText: string;
   body: string;
+  headers?: Headers;
 }
 
 export class HttpError extends Error {
@@ -21,7 +22,7 @@ export class HttpError extends Error {
   }
 }
 
-class TimeoutError extends Error {
+export class TimeoutError extends Error {
   url: string;
   timeout: number;
   method: string;
@@ -222,6 +223,7 @@ export async function post<T = any>(
         status: response.status,
         statusText: response.statusText,
         body: errorBody,
+        headers: response.headers,
       };
 
       throw new HttpError(
diff --git a/src/middlewares/hooks/index.ts b/src/middlewares/hooks/index.ts
@@ -306,6 +306,8 @@ export class HooksManager {
         transformed: result.transformed || false,
         created_at: createdAt,
         log: result.log || null,
+        fail_on_error:
+          (check.parameters as Record<string, any>)?.failOnError || false,
       };
     } catch (err: any) {
       console.error(`Error executing check "${check.id}":`, err);
@@ -390,7 +392,10 @@ export class HooksManager {
     }
 
     hookResult = {
-      verdict: checkResults.every((result) => result.verdict || result.error),
+      // an errored check fails the verdict only when fail_on_error is set; otherwise errors pass
+      verdict: checkResults.every(
+        (result) => result.verdict || (result.error && !result.fail_on_error)
+      ),
       id: hook.id,
       transformed: checkResults.some((result) => result.transformed),
       checks: checkResults,
diff --git a/src/middlewares/hooks/types.ts b/src/middlewares/hooks/types.ts
@@ -80,6 +80,7 @@ export interface GuardrailCheckResult {
     };
   };
   log?: any;
+  fail_on_error?: boolean;
 }
 
 export interface GuardrailResult {
diff --git a/src/providers/azure-ai-inference/api.ts b/src/providers/azure-ai-inference/api.ts
@@ -5,9 +5,28 @@ import {
 } from '../azure-openai/utils';
 import { ProviderAPIConfig } from '../types';
 
+const NON_INFERENCE_ENDPOINTS = [
+  'createBatch',
+  'retrieveBatch',
+  'cancelBatch',
+  'getBatchOutput',
+  'listBatches',
+  'uploadFile',
+  'listFiles',
+  'retrieveFile',
+  'deleteFile',
+  'retrieveFileContent',
+];
+
 const AzureAIInferenceAPI: ProviderAPIConfig = {
-  getBaseURL: ({ providerOptions }) => {
+  getBaseURL: ({ providerOptions, fn }) => {
     const { provider, azureFoundryUrl } = providerOptions;
+
+    // Azure Foundry URL includes `/deployments/<deployment>`; keep only the origin and append `/openai` for batch and file endpoints
+    if (fn && NON_INFERENCE_ENDPOINTS.includes(fn)) {
+      return new URL(azureFoundryUrl ?? '').origin + '/openai';
+    }
+
     if (provider === GITHUB) {
       return 'https://models.inference.ai.azure.com';
     }
@@ -17,7 +36,7 @@ const AzureAIInferenceAPI: ProviderAPIConfig = {
 
     return '';
   },
-  headers: async ({ providerOptions }) => {
+  headers: async ({ providerOptions, fn }) => {
     const {
       apiKey,
       azureExtraParams,
@@ -31,6 +50,13 @@ const AzureAIInferenceAPI: ProviderAPIConfig = {
       ...(azureDeploymentName && {
         'azureml-model-deployment': azureDeploymentName,
       }),
+      ...(['createTranscription', 'createTranslation', 'uploadFile'].includes(
+        fn
+      )
+        ? {
+            'Content-Type': 'multipart/form-data',
+          }
+        : {}),
     };
     if (azureAdToken) {
       headers['Authorization'] =
@@ -70,14 +96,37 @@ const AzureAIInferenceAPI: ProviderAPIConfig = {
     }
     return headers;
   },
-  getEndpoint: ({ providerOptions, fn }) => {
+  getEndpoint: ({ providerOptions, fn, gatewayRequestURL }) => {
     const { azureApiVersion, urlToFetch } = providerOptions;
     let mappedFn = fn;
 
+    const urlObj = new URL(gatewayRequestURL);
+    const path = urlObj.pathname.replace('/v1', '');
+    const searchParams = urlObj.searchParams;
+
+    if (azureApiVersion) {
+      searchParams.set('api-version', azureApiVersion);
+    }
+
     const ENDPOINT_MAPPING: Record<string, string> = {
       complete: '/completions',
       chatComplete: '/chat/completions',
       embed: '/embeddings',
+      realtime: '/realtime',
+      imageGenerate: '/images/generations',
+      createSpeech: '/audio/speech',
+      createTranscription: '/audio/transcriptions',
+      createTranslation: '/audio/translations',
+      uploadFile: path,
+      retrieveFile: path,
+      listFiles: path,
+      deleteFile: path,
+      retrieveFileContent: path,
+      listBatches: path,
+      retrieveBatch: path,
+      cancelBatch: path,
+      getBatchOutput: path,
+      createBatch: path,
     };
 
     const isGithub = providerOptions.provider === GITHUB;
@@ -92,23 +141,40 @@ const AzureAIInferenceAPI: ProviderAPIConfig = {
       }
     }
 
-    const apiVersion = azureApiVersion ? `?api-version=${azureApiVersion}` : '';
+    const searchParamsString = searchParams.toString();
     switch (mappedFn) {
       case 'complete': {
         return isGithub
           ? ENDPOINT_MAPPING[mappedFn]
-          : `${ENDPOINT_MAPPING[mappedFn]}${apiVersion}`;
+          : `${ENDPOINT_MAPPING[mappedFn]}?${searchParamsString}`;
       }
       case 'chatComplete': {
         return isGithub
           ? ENDPOINT_MAPPING[mappedFn]
-          : `${ENDPOINT_MAPPING[mappedFn]}${apiVersion}`;
+          : `${ENDPOINT_MAPPING[mappedFn]}?${searchParamsString}`;
       }
       case 'embed': {
         return isGithub
           ? ENDPOINT_MAPPING[mappedFn]
-          : `${ENDPOINT_MAPPING[mappedFn]}${apiVersion}`;
+          : `${ENDPOINT_MAPPING[mappedFn]}?${searchParamsString}`;
       }
+      case 'realtime':
+      case 'imageGenerate':
+      case 'createSpeech':
+      case 'createTranscription':
+      case 'createTranslation':
+      case 'cancelBatch':
+      case 'createBatch':
+      case 'getBatchOutput':
+      case 'retrieveBatch':
+      case 'listBatches':
+      case 'retrieveFile':
+      case 'listFiles':
+      case 'deleteFile':
+      case 'retrieveFileContent': {
+        return `${ENDPOINT_MAPPING[mappedFn]}?${searchParamsString}`;
+      }
+
       default:
         return '';
     }
diff --git a/src/providers/azure-ai-inference/getBatchOutput.ts b/src/providers/azure-ai-inference/getBatchOutput.ts
@@ -0,0 +1,124 @@
+import { Context } from 'hono';
+import AzureAIInferenceAPI from './api';
+import { Options } from '../../types/requestBody';
+import { RetrieveBatchResponse } from '../types';
+import { AZURE_OPEN_AI } from '../../globals';
+
+/**
+ * Returns the provider response carrying a batch's output file content.
+ *
+ * Retrieves the batch, picks `output_file_id` (falling back to
+ * `error_file_id`), then fetches that file's content from the provider.
+ *
+ * @param c - Hono context, passed through to the provider config helpers.
+ * @param providerOptions - Options used to build the base URL and headers.
+ * @param requestURL - Gateway request URL; `/output` is stripped to address the batch.
+ * @returns The file-content response, or a JSON error response on failure.
+ */
+export const AzureAIInferenceGetBatchOutputRequestHandler = async ({
+  c,
+  providerOptions,
+  requestURL,
+}: {
+  c: Context;
+  providerOptions: Options;
+  requestURL: string;
+}) => {
+  const baseUrl = AzureAIInferenceAPI.getBaseURL({
+    providerOptions,
+    fn: 'retrieveBatch',
+    c,
+    gatewayRequestURL: requestURL,
+  });
+  const retrieveBatchRequestURL = requestURL.replace('/output', '');
+  const retrieveBatchURL =
+    baseUrl +
+    AzureAIInferenceAPI.getEndpoint({
+      providerOptions,
+      fn: 'retrieveBatch',
+      gatewayRequestURL: retrieveBatchRequestURL,
+      c,
+      gatewayRequestBodyJSON: {},
+      gatewayRequestBody: {},
+    });
+  const retrieveBatchesHeaders = await AzureAIInferenceAPI.headers({
+    c,
+    providerOptions,
+    fn: 'retrieveBatch',
+    transformedRequestBody: {},
+    transformedRequestUrl: retrieveBatchURL,
+    gatewayRequestBody: {},
+  });
+  try {
+    const retrieveBatchesResponse = await fetch(retrieveBatchURL, {
+      method: 'GET',
+      headers: retrieveBatchesHeaders,
+    });
+
+    if (!retrieveBatchesResponse.ok) {
+      const error = await retrieveBatchesResponse.text();
+      return new Response(
+        JSON.stringify({
+          error: error || 'error fetching batch output',
+          provider: AZURE_OPEN_AI,
+          param: null,
+        }),
+        { status: 500 }
+      );
+    }
+
+    const batchDetails: RetrieveBatchResponse =
+      await retrieveBatchesResponse.json();
+
+    const outputFileId =
+      batchDetails.output_file_id || batchDetails.error_file_id;
+    if (!outputFileId) {
+      const errors = batchDetails.errors;
+      if (errors) {
+        return new Response(JSON.stringify(errors), { status: 200 });
+      }
+      return new Response(
+        JSON.stringify({
+          error: 'invalid response output format',
+          provider_response: batchDetails,
+          provider: AZURE_OPEN_AI,
+        }),
+        { status: 400 }
+      );
+    }
+    const retrieveFileContentRequestURL = `https://api.portkey.ai/v1/files/${outputFileId}/content`; // absolute URL (not just a path) because getEndpoint parses it with new URL()
+    const retrieveFileContentURL =
+      baseUrl +
+      AzureAIInferenceAPI.getEndpoint({
+        providerOptions,
+        fn: 'retrieveFileContent',
+        gatewayRequestURL: retrieveFileContentRequestURL,
+        c,
+        gatewayRequestBodyJSON: {},
+        gatewayRequestBody: {},
+      });
+    const retrieveFileContentHeaders = await AzureAIInferenceAPI.headers({
+      c,
+      providerOptions,
+      fn: 'retrieveFileContent',
+      transformedRequestBody: {},
+      transformedRequestUrl: retrieveFileContentURL,
+      gatewayRequestBody: {},
+    });
+    // Await inside the try block so a rejected fetch is handled by the catch
+    // below instead of propagating to the caller as a rejected promise.
+    return await fetch(retrieveFileContentURL, {
+      method: 'GET',
+      headers: retrieveFileContentHeaders,
+    });
+  } catch (e) {
+    return new Response(
+      JSON.stringify({
+        error: 'error fetching batch output',
+        provider: AZURE_OPEN_AI,
+        param: null,
+      }),
+      { status: 500 }
+    );
+  }
+};
diff --git a/src/providers/azure-ai-inference/index.ts b/src/providers/azure-ai-inference/index.ts
diff --git a/src/providers/azure-ai-inference/utils.ts b/src/providers/azure-ai-inference/utils.ts

Original file line number	Diff line number	Diff line change
`@@ -80,6 +80,7 @@ export interface GuardrailCheckResult {`
`80`	`80`	`};`
`81`	`81`	`};`
`82`	`82`	`log?: any;`
	`83`	`+ fail_on_error?: boolean;`
`83`	`84`	`}`
`84`	`85`
`85`	`86`	`export interface GuardrailResult {`