We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent ba26a9f commit 0bc5eb4Copy full SHA for 0bc5eb4
api/inference/v1/inference_sdk.go
@@ -773,6 +773,12 @@ type UpdateDeploymentRequest struct {
773
774
// MaxSize: defines the new maximum size of the pool.
775
MaxSize *uint32 `json:"max_size,omitempty"`
776
+
777
+ // ModelID: ID of the model to set on the deployment.
778
+ ModelID *string `json:"model_id,omitempty"`
779
780
+ // Quantization: quantization to use for the deployment.
781
+ Quantization *DeploymentQuantization `json:"quantization,omitempty"`
782
}
783
784
// UpdateEndpointRequest: update endpoint request.
0 commit comments