Skip to content

Commit 939bd22

Browse files
This release adds support for on-demand custom model inference through CustomModelDeployment APIs for Amazon Bedrock.
1 parent a455d97 commit 939bd22

34 files changed

Lines changed: 5573 additions & 10 deletions

generator/ServiceModels/bedrock/bedrock-2023-04-20.api.json

Lines changed: 259 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -39,7 +39,7 @@
3939
"http":{
4040
"method":"POST",
4141
"requestUri":"/custom-models/create-custom-model",
42-
"responseCode":200
42+
"responseCode":202
4343
},
4444
"input":{"shape":"CreateCustomModelRequest"},
4545
"output":{"shape":"CreateCustomModelResponse"},
@@ -52,7 +52,28 @@
5252
{"shape":"TooManyTagsException"},
5353
{"shape":"ServiceQuotaExceededException"},
5454
{"shape":"ThrottlingException"}
55-
]
55+
],
56+
"idempotent":true
57+
},
58+
"CreateCustomModelDeployment":{
59+
"name":"CreateCustomModelDeployment",
60+
"http":{
61+
"method":"POST",
62+
"requestUri":"/model-customization/custom-model-deployments",
63+
"responseCode":202
64+
},
65+
"input":{"shape":"CreateCustomModelDeploymentRequest"},
66+
"output":{"shape":"CreateCustomModelDeploymentResponse"},
67+
"errors":[
68+
{"shape":"ResourceNotFoundException"},
69+
{"shape":"AccessDeniedException"},
70+
{"shape":"ValidationException"},
71+
{"shape":"InternalServerException"},
72+
{"shape":"TooManyTagsException"},
73+
{"shape":"ServiceQuotaExceededException"},
74+
{"shape":"ThrottlingException"}
75+
],
76+
"idempotent":true
5677
},
5778
"CreateEvaluationJob":{
5879
"name":"CreateEvaluationJob",
@@ -310,6 +331,25 @@
310331
],
311332
"idempotent":true
312333
},
334+
"DeleteCustomModelDeployment":{
335+
"name":"DeleteCustomModelDeployment",
336+
"http":{
337+
"method":"DELETE",
338+
"requestUri":"/model-customization/custom-model-deployments/{customModelDeploymentIdentifier}",
339+
"responseCode":200
340+
},
341+
"input":{"shape":"DeleteCustomModelDeploymentRequest"},
342+
"output":{"shape":"DeleteCustomModelDeploymentResponse"},
343+
"errors":[
344+
{"shape":"ResourceNotFoundException"},
345+
{"shape":"AccessDeniedException"},
346+
{"shape":"ValidationException"},
347+
{"shape":"ConflictException"},
348+
{"shape":"InternalServerException"},
349+
{"shape":"ThrottlingException"}
350+
],
351+
"idempotent":true
352+
},
313353
"DeleteFoundationModelAgreement":{
314354
"name":"DeleteFoundationModelAgreement",
315355
"http":{
@@ -491,6 +531,23 @@
491531
{"shape":"ThrottlingException"}
492532
]
493533
},
534+
"GetCustomModelDeployment":{
535+
"name":"GetCustomModelDeployment",
536+
"http":{
537+
"method":"GET",
538+
"requestUri":"/model-customization/custom-model-deployments/{customModelDeploymentIdentifier}",
539+
"responseCode":200
540+
},
541+
"input":{"shape":"GetCustomModelDeploymentRequest"},
542+
"output":{"shape":"GetCustomModelDeploymentResponse"},
543+
"errors":[
544+
{"shape":"ResourceNotFoundException"},
545+
{"shape":"AccessDeniedException"},
546+
{"shape":"ValidationException"},
547+
{"shape":"InternalServerException"},
548+
{"shape":"ThrottlingException"}
549+
]
550+
},
494551
"GetEvaluationJob":{
495552
"name":"GetEvaluationJob",
496553
"http":{
@@ -743,6 +800,22 @@
743800
{"shape":"ThrottlingException"}
744801
]
745802
},
803+
"ListCustomModelDeployments":{
804+
"name":"ListCustomModelDeployments",
805+
"http":{
806+
"method":"GET",
807+
"requestUri":"/model-customization/custom-model-deployments",
808+
"responseCode":200
809+
},
810+
"input":{"shape":"ListCustomModelDeploymentsRequest"},
811+
"output":{"shape":"ListCustomModelDeploymentsResponse"},
812+
"errors":[
813+
{"shape":"AccessDeniedException"},
814+
{"shape":"ValidationException"},
815+
{"shape":"InternalServerException"},
816+
{"shape":"ThrottlingException"}
817+
]
818+
},
746819
"ListCustomModels":{
747820
"name":"ListCustomModels",
748821
"http":{
@@ -1459,6 +1532,30 @@
14591532
"type":"string",
14601533
"pattern":".*[a-z]{1,20}/.{1,20}.*"
14611534
},
1535+
"CreateCustomModelDeploymentRequest":{
1536+
"type":"structure",
1537+
"required":[
1538+
"modelDeploymentName",
1539+
"modelArn"
1540+
],
1541+
"members":{
1542+
"modelDeploymentName":{"shape":"ModelDeploymentName"},
1543+
"modelArn":{"shape":"CustomModelArn"},
1544+
"description":{"shape":"CustomModelDeploymentDescription"},
1545+
"tags":{"shape":"TagList"},
1546+
"clientRequestToken":{
1547+
"shape":"IdempotencyToken",
1548+
"idempotencyToken":true
1549+
}
1550+
}
1551+
},
1552+
"CreateCustomModelDeploymentResponse":{
1553+
"type":"structure",
1554+
"required":["customModelDeploymentArn"],
1555+
"members":{
1556+
"customModelDeploymentArn":{"shape":"CustomModelDeploymentArn"}
1557+
}
1558+
},
14621559
"CreateCustomModelRequest":{
14631560
"type":"structure",
14641561
"required":[
@@ -1870,6 +1967,55 @@
18701967
"min":20,
18711968
"pattern":"arn:aws(-[^:]+)?:bedrock:[a-z0-9-]{1,20}:[0-9]{12}:custom-model/(imported|[a-z0-9-]{1,63}[.]{1}[a-z0-9-]{1,63}([a-z0-9-]{1,63}[.]){0,2}[a-z0-9-]{1,63}([:][a-z0-9-]{1,63}){0,2})/[a-z0-9]{12}"
18721969
},
1970+
"CustomModelDeploymentArn":{
1971+
"type":"string",
1972+
"max":1011,
1973+
"min":0,
1974+
"pattern":"arn:aws(-[^:]+)?:bedrock:[a-z0-9-]{1,20}:[0-9]{12}:custom-model-deployment/[a-z0-9]{12}"
1975+
},
1976+
"CustomModelDeploymentDescription":{
1977+
"type":"string",
1978+
"max":2048,
1979+
"min":1,
1980+
"pattern":".*"
1981+
},
1982+
"CustomModelDeploymentIdentifier":{
1983+
"type":"string",
1984+
"max":93,
1985+
"min":1,
1986+
"pattern":"(arn:aws(|-us-gov|-cn|-iso|-iso-b):bedrock:[a-z0-9-]{1,20}:[0-9]{12}:custom-model-deployment/[a-z0-9]{12})|^([0-9a-zA-Z][_-]?){1,63}"
1987+
},
1988+
"CustomModelDeploymentStatus":{
1989+
"type":"string",
1990+
"enum":[
1991+
"Creating",
1992+
"Active",
1993+
"Failed"
1994+
]
1995+
},
1996+
"CustomModelDeploymentSummary":{
1997+
"type":"structure",
1998+
"required":[
1999+
"customModelDeploymentArn",
2000+
"customModelDeploymentName",
2001+
"modelArn",
2002+
"createdAt",
2003+
"status"
2004+
],
2005+
"members":{
2006+
"customModelDeploymentArn":{"shape":"CustomModelDeploymentArn"},
2007+
"customModelDeploymentName":{"shape":"ModelDeploymentName"},
2008+
"modelArn":{"shape":"ModelArn"},
2009+
"createdAt":{"shape":"Timestamp"},
2010+
"status":{"shape":"CustomModelDeploymentStatus"},
2011+
"lastUpdatedAt":{"shape":"Timestamp"},
2012+
"failureMessage":{"shape":"ErrorMessage"}
2013+
}
2014+
},
2015+
"CustomModelDeploymentSummaryList":{
2016+
"type":"list",
2017+
"member":{"shape":"CustomModelDeploymentSummary"}
2018+
},
18732019
"CustomModelName":{
18742020
"type":"string",
18752021
"max":63,
@@ -1935,6 +2081,22 @@
19352081
"lastModifiedTime":{"shape":"Timestamp"}
19362082
}
19372083
},
2084+
"DeleteCustomModelDeploymentRequest":{
2085+
"type":"structure",
2086+
"required":["customModelDeploymentIdentifier"],
2087+
"members":{
2088+
"customModelDeploymentIdentifier":{
2089+
"shape":"CustomModelDeploymentIdentifier",
2090+
"location":"uri",
2091+
"locationName":"customModelDeploymentIdentifier"
2092+
}
2093+
}
2094+
},
2095+
"DeleteCustomModelDeploymentResponse":{
2096+
"type":"structure",
2097+
"members":{
2098+
}
2099+
},
19382100
"DeleteCustomModelRequest":{
19392101
"type":"structure",
19402102
"required":["modelIdentifier"],
@@ -2643,6 +2805,37 @@
26432805
"additionalModelRequestFields":{"shape":"AdditionalModelRequestFields"}
26442806
}
26452807
},
2808+
"GetCustomModelDeploymentRequest":{
2809+
"type":"structure",
2810+
"required":["customModelDeploymentIdentifier"],
2811+
"members":{
2812+
"customModelDeploymentIdentifier":{
2813+
"shape":"CustomModelDeploymentIdentifier",
2814+
"location":"uri",
2815+
"locationName":"customModelDeploymentIdentifier"
2816+
}
2817+
}
2818+
},
2819+
"GetCustomModelDeploymentResponse":{
2820+
"type":"structure",
2821+
"required":[
2822+
"customModelDeploymentArn",
2823+
"modelDeploymentName",
2824+
"modelArn",
2825+
"createdAt",
2826+
"status"
2827+
],
2828+
"members":{
2829+
"customModelDeploymentArn":{"shape":"CustomModelDeploymentArn"},
2830+
"modelDeploymentName":{"shape":"ModelDeploymentName"},
2831+
"modelArn":{"shape":"CustomModelArn"},
2832+
"createdAt":{"shape":"Timestamp"},
2833+
"status":{"shape":"CustomModelDeploymentStatus"},
2834+
"description":{"shape":"CustomModelDeploymentDescription"},
2835+
"failureMessage":{"shape":"ErrorMessage"},
2836+
"lastUpdatedAt":{"shape":"Timestamp"}
2837+
}
2838+
},
26462839
"GetCustomModelRequest":{
26472840
"type":"structure",
26482841
"required":["modelIdentifier"],
@@ -4262,6 +4455,63 @@
42624455
"url":{"shape":"String"}
42634456
}
42644457
},
4458+
"ListCustomModelDeploymentsRequest":{
4459+
"type":"structure",
4460+
"members":{
4461+
"createdBefore":{
4462+
"shape":"Timestamp",
4463+
"location":"querystring",
4464+
"locationName":"createdBefore"
4465+
},
4466+
"createdAfter":{
4467+
"shape":"Timestamp",
4468+
"location":"querystring",
4469+
"locationName":"createdAfter"
4470+
},
4471+
"nameContains":{
4472+
"shape":"ModelDeploymentName",
4473+
"location":"querystring",
4474+
"locationName":"nameContains"
4475+
},
4476+
"maxResults":{
4477+
"shape":"MaxResults",
4478+
"location":"querystring",
4479+
"locationName":"maxResults"
4480+
},
4481+
"nextToken":{
4482+
"shape":"PaginationToken",
4483+
"location":"querystring",
4484+
"locationName":"nextToken"
4485+
},
4486+
"sortBy":{
4487+
"shape":"SortModelsBy",
4488+
"location":"querystring",
4489+
"locationName":"sortBy"
4490+
},
4491+
"sortOrder":{
4492+
"shape":"SortOrder",
4493+
"location":"querystring",
4494+
"locationName":"sortOrder"
4495+
},
4496+
"statusEquals":{
4497+
"shape":"CustomModelDeploymentStatus",
4498+
"location":"querystring",
4499+
"locationName":"statusEquals"
4500+
},
4501+
"modelArnEquals":{
4502+
"shape":"CustomModelArn",
4503+
"location":"querystring",
4504+
"locationName":"modelArnEquals"
4505+
}
4506+
}
4507+
},
4508+
"ListCustomModelDeploymentsResponse":{
4509+
"type":"structure",
4510+
"members":{
4511+
"nextToken":{"shape":"PaginationToken"},
4512+
"modelDeploymentSummaries":{"shape":"CustomModelDeploymentSummaryList"}
4513+
}
4514+
},
42654515
"ListCustomModelsRequest":{
42664516
"type":"structure",
42674517
"members":{
@@ -5140,6 +5390,12 @@
51405390
},
51415391
"union":true
51425392
},
5393+
"ModelDeploymentName":{
5394+
"type":"string",
5395+
"max":63,
5396+
"min":1,
5397+
"pattern":"([0-9a-zA-Z][_-]?){1,63}"
5398+
},
51435399
"ModelId":{
51445400
"type":"string",
51455401
"max":2048,
@@ -6068,7 +6324,7 @@
60686324
"type":"string",
60696325
"max":1011,
60706326
"min":20,
6071-
"pattern":".*(^[a-zA-Z0-9][a-zA-Z0-9\\-]*$)|(^arn:aws(-[^:]+)?:bedrock:[a-z0-9-]{1,20}:[0-9]{12}:custom-model/([a-z0-9-]{1,63}[.][a-z0-9-]{1,63}(([:][a-z0-9-]{1,63}){0,2})?|imported)/[a-z0-9]{12}$)|(^arn:aws(-[^:]+)?:bedrock:[a-z0-9-]{1,20}:([0-9]{12}|)((:(fine-tuning-job|model-customization-job)/[a-z0-9-]{1,63}[.]{1}[a-z0-9-]{1,63}([a-z0-9-]{1,63}[.]){0,2}[a-z0-9-]{1,63}([:][a-z0-9-]{1,63}){0,2}(/[a-z0-9]{12})$)|(:guardrail/[a-z0-9]+$)|(:automated-reasoning-policy/[a-zA-Z0-9]+(:[a-zA-Z0-9]+)?$)|(:(inference-profile|application-inference-profile)/[a-zA-Z0-9-:.]+$)|(:(provisioned-model|model-invocation-job|model-evaluation-job|evaluation-job|model-import-job|imported-model|async-invoke|provisioned-model-v2|provisioned-model-reservation|prompt-router|custom-model-deployment)/[a-z0-9]{12}$))).*"
6327+
"pattern":".*(^[a-zA-Z0-9][a-zA-Z0-9\\-]*$)|(^arn:aws(-[^:]+)?:bedrock:[a-z0-9-]{1,20}:[0-9]{12}:custom-model/(imported)/[a-z0-9]{12}$)|(^arn:aws(-[^:]+)?:bedrock:[a-z0-9-]{1,20}:([0-9]{12}|)((:(fine-tuning-job|model-customization-job|custom-model)/[a-z0-9-]{1,63}[.]{1}[a-z0-9-]{1,63}([a-z0-9-]{1,63}[.]){0,2}[a-z0-9-]{1,63}([:][a-z0-9-]{1,63}){0,2}(/[a-z0-9]{12})$)|(:guardrail/[a-z0-9]+$)|(:automated-reasoning-policy/[a-zA-Z0-9]+(:[a-zA-Z0-9]+)?$)|(:(inference-profile|application-inference-profile)/[a-zA-Z0-9-:.]+$)|(:(provisioned-model|model-invocation-job|model-evaluation-job|evaluation-job|model-import-job|imported-model|async-invoke|provisioned-model-v2|provisioned-model-reservation|prompt-router|custom-model-deployment)/[a-z0-9]{12}$))).*"
60726328
},
60736329
"TeacherModelConfig":{
60746330
"type":"structure",

0 commit comments

Comments
 (0)