diff --git a/src/sagemaker/serve/builder/jumpstart_builder.py b/src/sagemaker/serve/builder/jumpstart_builder.py index e689f41839..cfb43b813a 100644 --- a/src/sagemaker/serve/builder/jumpstart_builder.py +++ b/src/sagemaker/serve/builder/jumpstart_builder.py @@ -121,6 +121,7 @@ def __init__(self): self.is_compiled = False self.is_quantized = False self.speculative_decoding_draft_model_source = None + self.deployment_config_name = None self.name = None @abstractmethod @@ -515,6 +516,7 @@ def set_deployment_config(self, config_name: str, instance_type: str) -> None: raise Exception("Cannot set deployment config to an uninitialized model.") self.pysdk_model.set_deployment_config(config_name, instance_type) + self.deployment_config_name = config_name self.instance_type = instance_type diff --git a/src/sagemaker/serve/utils/telemetry_logger.py b/src/sagemaker/serve/utils/telemetry_logger.py index 0ea6ec3f26..6a1228ba40 100644 --- a/src/sagemaker/serve/utils/telemetry_logger.py +++ b/src/sagemaker/serve/utils/telemetry_logger.py @@ -165,6 +165,10 @@ def wrapper(self, *args, **kwargs): model_provider_value = SD_DRAFT_MODEL_SOURCE_TO_CODE[str(model_provider_enum)] extra += f"&x-sdDraftModelSource={model_provider_value}" + if getattr(self, "deployment_config_name", False): + config_name_code = self.deployment_config_name.lower() + extra += f"&x-configName={config_name_code}" + extra += f"&x-latency={round(elapsed, 2)}" if not self.serve_settings.telemetry_opt_out: