Skip to content

Commit 0bc5eb4

Browse files
authored
feat(inference): add modelId and quantization to updateDeploymentRequest (scaleway#2473)
1 parent ba26a9f commit 0bc5eb4

File tree

1 file changed

+6
-0
lines changed

1 file changed

+6
-0
lines changed

api/inference/v1/inference_sdk.go

Lines changed: 6 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -773,6 +773,12 @@ type UpdateDeploymentRequest struct {
773773

774774
// MaxSize: defines the new maximum size of the pool.
775775
MaxSize *uint32 `json:"max_size,omitempty"`
776+
777+
// ModelID: ID of the model to set for the deployment.
778+
ModelID *string `json:"model_id,omitempty"`
779+
780+
// Quantization: quantization to use for the deployment.
781+
Quantization *DeploymentQuantization `json:"quantization,omitempty"`
776782
}
777783

778784
// UpdateEndpointRequest: update endpoint request.

0 commit comments

Comments
 (0)