feature: Added automatic dashboard feature for DefaultModelMonitor create_monitoring_schedule with error handling, TODO: modify update_monitoring_schedule accordingly and add unit tests

Sushanth Sathish Kumar · sushanthkumar2004 · commit 14dad53997cb · 2024-08-22T23:31:14.000-07:00
diff --git a/src/sagemaker/model_monitor/dashboards.py b/src/sagemaker/model_monitor/dashboards.py
@@ -0,0 +1,215 @@
+import json 
+
+class Variable:
+    def __init__(self, variable_type, variable_property, inputType, id, label, search, populateFrom):
+        self.variable_type = variable_type
+        self.variable_property = variable_property 
+        self.inputType = inputType
+        self.id = id
+        self.label = label
+        self.search = search
+        self.populateFrom = populateFrom
+    
+    def to_dict(self):
+        variable_properties_dict = {}
+        if self.variable_type != None:
+            variable_properties_dict["type"] = self.variable_type
+        if self.variable_property != None:
+            variable_properties_dict["property"] = self.variable_property
+        if self.inputType != None:
+            variable_properties_dict["inputType"] = self.inputType
+        if self.id != None:
+            variable_properties_dict["id"] = self.id
+        if self.label != None:
+            variable_properties_dict["label"] = self.label
+        if self.search != None:
+            variable_properties_dict["search"] = self.search
+        if self.populateFrom != None:
+            variable_properties_dict["populateFrom"] = self.populateFrom
+        return variable_properties_dict
+
+    def to_json(self):
+        json.dumps(self.to_dict(), indent=4)
+
+class WidgetProperties:
+    def __init__(self, view=None, stacked=None, metrics=None, region=None, period=None, title=None, markdown=None):
+        self.view = view
+        self.stacked = stacked
+        self.metrics = metrics
+        self.region = region
+        self.period = period
+        self.title = title
+        self.markdown = markdown
+
+    def to_dict(self):
+        widget_properties_dict = {}
+        if self.view != None:
+            widget_properties_dict["view"] = self.view
+        if self.period != None:
+            widget_properties_dict["period"] = self.period
+        if self.markdown != None:
+            widget_properties_dict["markdown"] = self.markdown
+        if self.stacked != None:
+            widget_properties_dict["stacked"] = self.stacked
+        if self.region != None:
+            widget_properties_dict["region"] = self.region
+        if self.metrics != None:
+            widget_properties_dict["metrics"] = self.metrics
+        if self.title != None:
+            widget_properties_dict["title"] = self.title
+        return widget_properties_dict
+    
+    def to_json(self):
+        json.dumps(self.to_dict(), indent=4)
+
+class Widget:
+    def __init__(self, height, width, widget_type, properties=None):
+        self.height = height
+        self.width = width
+        self.type = widget_type
+        self.properties = properties if properties else WidgetProperties(None, False, [], None, None, None)
+
+    def to_dict(self):
+        return {
+            "height": self.height,
+            "width": self.width,
+            "type": self.type,
+            "properties": self.properties.to_dict()
+        }
+    
+    def to_json(self):
+        return json.dumps(self.to_dict(), indent=4)
+
+class AutomaticDataQualityDashboard:
+    DATA_QUALITY_METRICS_ENDPOINT_NAMESPACE = "{aws/sagemaker/Endpoints/data-metrics,Endpoint,Feature,MonitoringSchedule}"
+    DATA_QUALITY_METRICS_BATCH_NAMESPACE = "{aws/sagemaker/ModelMonitoring/data-metrics,Feature,MonitoringSchedule}"
+    
+    def __init__(self, endpoint_name, monitoring_schedule_name, batch_transform_input, region_name):
+        self.endpoint = endpoint_name
+        self.monitoring_schedule = monitoring_schedule_name
+        self.batch_transform = batch_transform_input
+        self.region = region_name
+                
+        variables = self._generate_variables()
+        type_counts_widget = self._generate_type_counts_widget()
+        null_counts_widget = self._generate_null_counts_widget()
+        estimated_unique_values_widget = self._generate_estimated_unique_values_widget()
+        completeness_widget = self._generate_completeness_widget()
+        baseline_drift_widget = self._generate_baseline_drift_widget()
+        
+        self.dashboard = {"variables" : variables, "widgets": [type_counts_widget, null_counts_widget, estimated_unique_values_widget, completeness_widget, baseline_drift_widget]}
+    
+    def _generate_variables(self):
+        if self.batch_transform:
+            return [Variable(variable_type="property", 
+                            variable_property="Feature",
+                            inputType="select",
+                            id="Feature",
+                            label="Feature",
+                            search=AutomaticDataQualityDashboard.DATA_QUALITY_METRICS_BATCH_NAMESPACE,
+                            populateFrom="Feature")]
+        else:
+            return [Variable(variable_type="property", 
+                            variable_property="Feature",
+                            inputType="select",
+                            id="Feature",
+                            label="Feature",
+                            search=AutomaticDataQualityDashboard.DATA_QUALITY_METRICS_ENDPOINT_NAMESPACE,
+                            populateFrom="Feature")]
+            
+    def _generate_type_counts_widget(self):
+        if self.batch_transform:
+            type_counts_widget_properties = WidgetProperties(view="timeSeries", 
+                                                            stacked=False, 
+                                                            metrics=[[{ "expression": f"SEARCH( '{AutomaticDataQualityDashboard.DATA_QUALITY_METRICS_BATCH_NAMESPACE} feature_(fractional OR boolean OR integral OR string OR unknown)_counts_ Feature=\"_\" MonitoringSchedule=\"{self.monitoring_schedule}\" ', 'Average')"}]],
+                                                            region=self.region,
+                                                            title="Type Counts")
+        else:
+            type_counts_widget_properties = WidgetProperties(view="timeSeries", 
+                                                            stacked=False, 
+                                                            metrics=[[{ "expression": f"SEARCH( '{AutomaticDataQualityDashboard.DATA_QUALITY_METRICS_ENDPOINT_NAMESPACE} feature_(fractional OR boolean OR integral OR string OR unknown)_counts_ Endpoint=\"{self.endpoint}\" Feature=\"_\" MonitoringSchedule=\"{self.monitoring_schedule}\" ', 'Average')"}]],
+                                                            region=self.region,
+                                                            title="Type Counts")
+        return Widget(height=8, width=12, widget_type="metric", properties=type_counts_widget_properties)
+
+    def _generate_null_counts_widget(self):
+        if self.batch_transform:
+            null_counts_widget_properties = WidgetProperties(view="timeSeries", 
+                                                            stacked=False, 
+                                                            metrics=[[{ "expression": f"SEARCH( '{AutomaticDataQualityDashboard.DATA_QUALITY_METRICS_BATCH_NAMESPACE} feature_null_ OR feature_non_null_ Feature=\"_\" MonitoringSchedule=\"{self.monitoring_schedule}\" ', 'Average')"}]],
+                                                            region=self.region,
+                                                            title="Missing Data Counts")
+        else:
+            null_counts_widget_properties = WidgetProperties(view="timeSeries", 
+                                                            stacked=False, 
+                                                            metrics=[[{ "expression": f"SEARCH( '{AutomaticDataQualityDashboard.DATA_QUALITY_METRICS_ENDPOINT_NAMESPACE} feature_null_ OR feature_non_null_ Endpoint=\"{self.endpoint}\" Feature=\"_\" MonitoringSchedule=\"{self.monitoring_schedule}\" ', 'Average')"}]],
+                                                            region=self.region,
+                                                            title="Missing Data Counts")
+        return Widget(height=8, width=12, widget_type="metric", properties=null_counts_widget_properties)
+            
+    def _generate_estimated_unique_values_widget(self):
+        if self.batch_transform:
+            estimated_unique_vals_widget_properties = WidgetProperties(view="timeSeries", 
+                                                            stacked=False, 
+                                                            metrics=[[{ "expression": f"SEARCH( '{AutomaticDataQualityDashboard.DATA_QUALITY_METRICS_BATCH_NAMESPACE} feature_estimated_unique_values_ Feature=\"_\" MonitoringSchedule=\"{self.monitoring_schedule}\" ', 'Average')"}]],
+                                                            region=self.region,
+                                                            title="Estimated Unique Values")
+        else:
+            estimated_unique_vals_widget_properties = WidgetProperties(view="timeSeries", 
+                                                            stacked=False, 
+                                                            metrics=[[{ "expression": f"SEARCH( '{AutomaticDataQualityDashboard.DATA_QUALITY_METRICS_ENDPOINT_NAMESPACE} feature_estimated_unique_values_ Endpoint=\"{self.endpoint}\" Feature=\"_\" MonitoringSchedule=\"{self.monitoring_schedule}\" ', 'Average')"}]],
+                                                            region=self.region,
+                                                            title="Estimated Unique Values")
+            
+        return Widget(height=8, width=12, widget_type="metric", properties=estimated_unique_vals_widget_properties)
+
+    def _generate_completeness_widget(self):
+        if self.batch_transform:
+            completeness_widget_properties = WidgetProperties(view="timeSeries", 
+                                                            stacked=False, 
+                                                            metrics=[[{ "expression": f"SEARCH( '{AutomaticDataQualityDashboard.DATA_QUALITY_METRICS_BATCH_NAMESPACE} feature_completeness_ Feature=\"_\" MonitoringSchedule=\"{self.monitoring_schedule}\" ', 'Average')"}]],
+                                                            region=self.region,
+                                                            title="Completeness")
+        else:
+            completeness_widget_properties = WidgetProperties(view="timeSeries", 
+                                                            stacked=False, 
+                                                            metrics=[[{ "expression": f"SEARCH( '{AutomaticDataQualityDashboard.DATA_QUALITY_METRICS_ENDPOINT_NAMESPACE} feature_completeness_ Endpoint=\"{self.endpoint}\" Feature=\"_\" MonitoringSchedule=\"{self.monitoring_schedule}\" ', 'Average')"}]],
+                                                            region=self.region,
+                                                            title="Completeness")
+        return Widget(height=8, width=12, widget_type="metric", properties=completeness_widget_properties)
+
+    def _generate_baseline_drift_widget(self):
+        if self.batch_transform:
+            baseline_drift_widget_properties = WidgetProperties(view="timeSeries", 
+                                                            stacked=False, 
+                                                            metrics=[[{ "expression": f"SEARCH( '{AutomaticDataQualityDashboard.DATA_QUALITY_METRICS_BATCH_NAMESPACE} feature_baseline_drift_ Feature=\"_\" MonitoringSchedule=\"{self.monitoring_schedule}\" ', 'Average')"}]],
+                                                            region=self.region,
+                                                            title="Baseline Drift")
+        else:
+            baseline_drift_widget_properties = WidgetProperties(view="timeSeries", 
+                                                            stacked=False, 
+                                                            metrics=[[{ "expression": f"SEARCH( '{AutomaticDataQualityDashboard.DATA_QUALITY_METRICS_ENDPOINT_NAMESPACE} feature_baseline_drift_ Endpoint=\"{self.endpoint}\" Feature=\"_\" MonitoringSchedule=\"{self.monitoring_schedule}\" ', 'Average')"}]],
+                                                            region=self.region,
+                                                            title="Baseline Drift")
+        return Widget(height=8, width=12, widget_type="metric", properties=baseline_drift_widget_properties)
+                
+    def to_dict(self):
+        return {"variables" : [var.to_dict() for var in self.dashboard["variables"]], "widgets" : [widget.to_dict() for widget in self.dashboard["widgets"]]}    
+    
+    def to_json(self):
+        return json.dumps(self.to_dict(), indent=4)
+
+# # The above code is a Python script that uses the boto3 library to interact with AWS CloudWatch
+# service. It seems to be related to creating and managing CloudWatch dashboards.
+import boto3 
+# dashboard_body = AutomaticDataQualityDashboard("DEMO-xgb-churn-pred-model-monitor-2024-07-09-17-54-38", "DEMO-xgb-churn-pred-model-monitor-schedule-2024-07-09-18-30-14", None, "us-west-2").to_json()
+# print(dashboard_body)
+# response = boto3.client('cloudwatch').put_dashboard(
+#             DashboardName="New",
+#             DashboardBody=dashboard_body
+#         )
+# print(response)
+
+
+# resp = boto3.client('cloudwatch').get_dashboard(DashboardName="Old")
+# print(resp)
diff --git a/src/sagemaker/model_monitor/model_monitoring.py b/src/sagemaker/model_monitor/model_monitoring.py
@@ -25,6 +25,7 @@
 import uuid
 from typing import Union, Optional, Dict, List
 import attr
+import re
 
 from six import string_types
 from six.moves.urllib.parse import urlparse
@@ -67,6 +68,8 @@
 from sagemaker.lineage._utils import get_resource_name_from_arn
 from sagemaker.model_monitor.cron_expression_generator import CronExpressionGenerator
 
+from sagemaker.model_monitor.dashboards import AutomaticDataQualityDashboard
+
 DEFAULT_REPOSITORY_NAME = "sagemaker-model-monitor-analyzer"
 
 STATISTICS_JSON_DEFAULT_FILE_NAME = "statistics.json"
@@ -1945,6 +1948,8 @@ def create_monitoring_schedule(
         monitor_schedule_name=None,
         schedule_cron_expression=None,
         enable_cloudwatch_metrics=True,
+        enable_automatic_dashboard=False,
+        dashboard_name=None,
         batch_transform_input=None,
         data_analysis_start_time=None,
         data_analysis_end_time=None,
@@ -1988,6 +1993,8 @@ def create_monitoring_schedule(
             data_analysis_end_time (str): End time for the data analysis window
                 for the one time monitoring schedule (NOW), e.g. "-PT1H" (default: None)
         """
+        cw_client = self.sagemaker_session.boto_session.client('cloudwatch')
+        
         if self.job_definition_name is not None or self.monitoring_schedule_name is not None:
             message = (
                 "It seems that this object was already used to create an Amazon Model "
@@ -2005,6 +2012,45 @@ def create_monitoring_schedule(
             )
             logger.error(message)
             raise ValueError(message)
+        
+        # error checking and validation logic for dashboard name
+        if (enable_cloudwatch_metrics == False and enable_automatic_dashboard == True):
+            message = (
+                "Could not create automatic dashboard. Please set enable_cloudwatch_metrics to True."
+            )
+            logger.error(message)
+            raise ValueError(message)
+        
+        if (enable_automatic_dashboard == True):
+            # verify that the provided dashboard name is not taken 
+            dashboard_name = monitor_schedule_name if dashboard_name is None else dashboard_name
+            
+            dashboard_name_validation = bool(re.match(r'^[0-9A-Za-z\-_]{1,255}$', dashboard_name))
+            if dashboard_name_validation == False:
+                message = (
+                    f"Dashboard name {dashboard_name} is not a valid dashboard name. "
+                    "Dashboard name can be at most 255 characters long "
+                    "and valid characters in dashboard names include '0-9A-Za-z-_'."
+                )
+                logger.error(message)
+                raise ValueError(message)
+            
+            try:
+                # try to access dashboard name to see if it exists 
+                cw_client.get_dashboard(DashboardName=dashboard_name)
+                message = (
+                    f"Dashboard name {dashboard_name} is already in use. "
+                    "Please provide a different dashboard name, or delete the already "
+                    "existing dashboard."
+                )
+                logger.error(message)
+                raise ValueError(message)
+            except Exception as e:
+                # in this case, the dashboard name is not in use
+                # and we are free to write to it without overwriting any 
+                # customer data. 
+                pass
+            
 
         self._check_monitoring_schedule_cron_validity(
             schedule_cron_expression=schedule_cron_expression,
@@ -2068,6 +2114,11 @@ def create_monitoring_schedule(
                 message = "Failed to delete job definition {}.".format(new_job_definition_name)
                 logger.exception(message)
             raise
+                
+        cw_client.put_dashboard(
+            DashboardName=dashboard_name,
+            DashboardBody=AutomaticDataQualityDashboard(endpoint_name=endpoint_input, monitoring_schedule_name=monitor_schedule_name, batch_transform_input=batch_transform_input, region_name=self.sagemaker_session.boto_region_name)
+        )
 
     def update_monitoring_schedule(
         self,