Skip to content

Commit 7feec50

Browse files
improve error handling when on-demand throughput is not available for a foundation model
1 parent 170bea2 commit 7feec50

File tree

1 file changed

+15
-5
lines changed

1 file changed

+15
-5
lines changed

src/api/providers/bedrock.ts

Lines changed: 15 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -840,16 +840,20 @@ export class AwsBedrockHandler extends BaseProvider implements SingleCompletionH
840840
> = {
841841
ACCESS_DENIED: {
842842
patterns: ["access", "denied", "permission"],
843-
messageTemplate: `You don't have access to the model with the specified ARN. Please verify:
844-
1. The ARN is correct and points to a valid model
845-
2. Your AWS credentials have permission to access this model (check IAM policies)
846-
3. The region in the ARN {regionInfo} matches the region where the model is deployed
847-
4. If using a provisioned model, ensure it's active and not in a failed state {customModelInfo}`,
843+
messageTemplate: `You don't have access to the model specified.
844+
845+
Please verify:
846+
1. Try cross-region inference if you're using a foundation model
847+
2. If using an ARN, verify the ARN is correct and points to a valid model
848+
3. Your AWS credentials have permission to access this model (check IAM policies)
849+
4. The region in the ARN matches the region where the model is deployed
850+
5. If using a provisioned model, ensure it's active and not in a failed state`,
848851
logLevel: "error",
849852
},
850853
NOT_FOUND: {
851854
patterns: ["not found", "does not exist"],
852855
messageTemplate: `The specified ARN does not exist or is invalid. Please check:
856+
853857
1. The ARN format is correct (arn:aws:bedrock:region:account-id:resource-type/resource-name)
854858
2. The model exists in the specified region
855859
3. The account ID in the ARN is correct`,
@@ -880,6 +884,12 @@ Suggestions:
880884
5. Check your AWS Bedrock quotas and limits`,
881885
logLevel: "error",
882886
},
887+
ON_DEMAND_NOT_SUPPORTED: {
888+
patterns: ["with on-demand throughput isn’t supported."],
889+
messageTemplate: `1. Try enabling cross-region inference in settings.
890+
2. Or, create an inference profile and then leverage the "Use custom ARN..." option of the model selector in settings.`,
891+
logLevel: "error",
892+
},
883893
ABORT: {
884894
patterns: ["aborterror"], // This will match error.name.toLowerCase() for AbortError
885895
messageTemplate: `Request was aborted: The operation timed out or was manually cancelled. Please try again or check your network connection.`,

0 commit comments

Comments
 (0)