4949 LiveStreamingModelEndpointInferenceGateway ,
5050 LiveSyncModelEndpointInferenceGateway ,
5151 ModelEndpointInfraGateway ,
52+ RedisInferenceAutoscalingMetricsGateway ,
5253 S3FilesystemGateway ,
5354 S3LLMArtifactGateway ,
5455)
@@ -179,6 +180,9 @@ def _get_external_interfaces(
179180 model_endpoints_schema_gateway = LiveModelEndpointsSchemaGateway (
180181 filesystem_gateway = filesystem_gateway
181182 )
183+ inference_autoscaling_metrics_gateway = RedisInferenceAutoscalingMetricsGateway (
184+ redis_client = redis_client
185+ ) # we can just reuse the existing redis client, we shouldn't get key collisions because of the prefix
182186 model_endpoint_service = LiveModelEndpointService (
183187 model_endpoint_record_repository = model_endpoint_record_repo ,
184188 model_endpoint_infra_gateway = model_endpoint_infra_gateway ,
@@ -187,6 +191,7 @@ def _get_external_interfaces(
187191 streaming_model_endpoint_inference_gateway = streaming_model_endpoint_inference_gateway ,
188192 sync_model_endpoint_inference_gateway = sync_model_endpoint_inference_gateway ,
189193 model_endpoints_schema_gateway = model_endpoints_schema_gateway ,
194+ inference_autoscaling_metrics_gateway = inference_autoscaling_metrics_gateway ,
190195 )
191196 llm_model_endpoint_service = LiveLLMModelEndpointService (
192197 model_endpoint_record_repository = model_endpoint_record_repo ,
0 commit comments