Skip to content

Commit 16129d1

Browse files
author
AWS
committed
Amazon SageMaker Service Update: SageMaker Inference Recommender now supports a new API, ListInferenceRecommendationsJobSteps, which returns the details of all the benchmarks created for an inference recommendation job.
1 parent 2a402e9 commit 16129d1

File tree

3 files changed

+113
-1
lines changed

3 files changed

+113
-1
lines changed
Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,6 @@
1+
{
2+
"type": "feature",
3+
"category": "Amazon SageMaker Service",
4+
"contributor": "",
5+
"description": "SageMaker Inference Recommender now supports a new API ListInferenceRecommendationJobSteps to return the details of all the benchmark we create for an inference recommendation job."
6+
}

services/sagemaker/src/main/resources/codegen-resources/paginators-1.json

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -156,6 +156,12 @@
156156
"limit_key": "MaxResults",
157157
"result_key": "Images"
158158
},
159+
"ListInferenceRecommendationsJobSteps": {
160+
"input_token": "NextToken",
161+
"output_token": "NextToken",
162+
"limit_key": "MaxResults",
163+
"result_key": "Steps"
164+
},
159165
"ListInferenceRecommendationsJobs": {
160166
"input_token": "NextToken",
161167
"output_token": "NextToken",

services/sagemaker/src/main/resources/codegen-resources/service-2.json

Lines changed: 101 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2170,6 +2170,16 @@
21702170
"output":{"shape":"ListImagesResponse"},
21712171
"documentation":"<p>Lists the images in your account and their properties. The list can be filtered by creation time or modified time, and whether the image name contains a specified string.</p>"
21722172
},
2173+
"ListInferenceRecommendationsJobSteps":{
2174+
"name":"ListInferenceRecommendationsJobSteps",
2175+
"http":{
2176+
"method":"POST",
2177+
"requestUri":"/"
2178+
},
2179+
"input":{"shape":"ListInferenceRecommendationsJobStepsRequest"},
2180+
"output":{"shape":"ListInferenceRecommendationsJobStepsResponse"},
2181+
"documentation":"<p>Returns a list of the subtasks for an Inference Recommender job.</p> <p>The supported subtasks are benchmarks, which evaluate the performance of your model on different instance types.</p>"
2182+
},
21732183
"ListInferenceRecommendationsJobs":{
21742184
"name":"ListInferenceRecommendationsJobs",
21752185
"http":{
@@ -4540,7 +4550,8 @@
45404550
"PrecisionMacro",
45414551
"Recall",
45424552
"RecallMacro",
4543-
"LogLoss"
4553+
"LogLoss",
4554+
"InferenceLatency"
45444555
]
45454556
},
45464557
"AutoMLMode":{
@@ -16258,6 +16269,37 @@
1625816269
},
1625916270
"documentation":"<p>A structure that contains a list of recommendation jobs.</p>"
1626016271
},
16272+
"InferenceRecommendationsJobStep":{
16273+
"type":"structure",
16274+
"required":[
16275+
"StepType",
16276+
"JobName",
16277+
"Status"
16278+
],
16279+
"members":{
16280+
"StepType":{
16281+
"shape":"RecommendationStepType",
16282+
"documentation":"<p>The type of the subtask.</p> <p> <code>BENCHMARK</code>: Evaluate the performance of your model on different instance types.</p>"
16283+
},
16284+
"JobName":{
16285+
"shape":"RecommendationJobName",
16286+
"documentation":"<p>The name of the Inference Recommender job.</p>"
16287+
},
16288+
"Status":{
16289+
"shape":"RecommendationJobStatus",
16290+
"documentation":"<p>The current status of the benchmark.</p>"
16291+
},
16292+
"InferenceBenchmark":{
16293+
"shape":"RecommendationJobInferenceBenchmark",
16294+
"documentation":"<p>The details for a specific benchmark.</p>"
16295+
}
16296+
},
16297+
"documentation":"<p>A returned array object for the <code>Steps</code> response field in the <a href=\"https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_InferenceRecommendationsJobStep.html\">ListInferenceRecommendationsJobSteps</a> API command.</p>"
16298+
},
16299+
"InferenceRecommendationsJobSteps":{
16300+
"type":"list",
16301+
"member":{"shape":"InferenceRecommendationsJobStep"}
16302+
},
1626116303
"InferenceRecommendationsJobs":{
1626216304
"type":"list",
1626316305
"member":{"shape":"InferenceRecommendationsJob"}
@@ -18470,6 +18512,45 @@
1847018512
}
1847118513
}
1847218514
},
18515+
"ListInferenceRecommendationsJobStepsRequest":{
18516+
"type":"structure",
18517+
"required":["JobName"],
18518+
"members":{
18519+
"JobName":{
18520+
"shape":"RecommendationJobName",
18521+
"documentation":"<p>The name for the Inference Recommender job.</p>"
18522+
},
18523+
"Status":{
18524+
"shape":"RecommendationJobStatus",
18525+
"documentation":"<p>A filter to return benchmarks of a specified status. If this field is left empty, then all benchmarks are returned.</p>"
18526+
},
18527+
"StepType":{
18528+
"shape":"RecommendationStepType",
18529+
"documentation":"<p>A filter to return details about the specified type of subtask.</p> <p> <code>BENCHMARK</code>: Evaluate the performance of your model on different instance types.</p>"
18530+
},
18531+
"MaxResults":{
18532+
"shape":"MaxResults",
18533+
"documentation":"<p>The maximum number of results to return.</p>"
18534+
},
18535+
"NextToken":{
18536+
"shape":"NextToken",
18537+
"documentation":"<p>A token that you can specify to return more results from the list. Specify this field if you have a token that was returned from a previous request.</p>"
18538+
}
18539+
}
18540+
},
18541+
"ListInferenceRecommendationsJobStepsResponse":{
18542+
"type":"structure",
18543+
"members":{
18544+
"Steps":{
18545+
"shape":"InferenceRecommendationsJobSteps",
18546+
"documentation":"<p>A list of all subtask details in Inference Recommender.</p>"
18547+
},
18548+
"NextToken":{
18549+
"shape":"NextToken",
18550+
"documentation":"<p>A token that you can specify in your next request to return more results from the list.</p>"
18551+
}
18552+
}
18553+
},
1847318554
"ListInferenceRecommendationsJobsRequest":{
1847418555
"type":"structure",
1847518556
"members":{
@@ -24597,6 +24678,7 @@
2459724678
"type":"list",
2459824679
"member":{"shape":"ProductionVariantInstanceType"}
2459924680
},
24681+
"RecommendationFailureReason":{"type":"string"},
2460024682
"RecommendationJobArn":{
2460124683
"type":"string",
2460224684
"max":256,
@@ -24650,6 +24732,20 @@
2465024732
"type":"string",
2465124733
"max":128
2465224734
},
24735+
"RecommendationJobInferenceBenchmark":{
24736+
"type":"structure",
24737+
"required":["ModelConfiguration"],
24738+
"members":{
24739+
"Metrics":{"shape":"RecommendationMetrics"},
24740+
"EndpointConfiguration":{"shape":"EndpointOutputConfiguration"},
24741+
"ModelConfiguration":{"shape":"ModelConfiguration"},
24742+
"FailureReason":{
24743+
"shape":"RecommendationFailureReason",
24744+
"documentation":"<p>The reason why a benchmark failed.</p>"
24745+
}
24746+
},
24747+
"documentation":"<p>The details for a specific benchmark from an Inference Recommender job.</p>"
24748+
},
2465324749
"RecommendationJobInputConfig":{
2465424750
"type":"structure",
2465524751
"required":["ModelPackageVersionArn"],
@@ -24805,6 +24901,10 @@
2480524901
},
2480624902
"documentation":"<p>The metrics of recommendations.</p>"
2480724903
},
24904+
"RecommendationStepType":{
24905+
"type":"string",
24906+
"enum":["BENCHMARK"]
24907+
},
2480824908
"RecordWrapper":{
2480924909
"type":"string",
2481024910
"enum":[

0 commit comments

Comments
 (0)