Fix all format issues (#623)

claytonparnell · web-flow · commit 505c5e0a52ea · 2025-04-23T15:43:37.000-07:00
diff --git a/template/v2/dirs/etc/sagemaker-ui/jupyter/server/jupyter_server_config.py b/template/v2/dirs/etc/sagemaker-ui/jupyter/server/jupyter_server_config.py
@@ -1,15 +1,10 @@
 import os
 
 c.ServerApp.terminado_settings = {"shell_command": ["/bin/bash"]}
-region = os.environ.get('AWS_REGION')
-csp_rule = os.environ.get('JUPYTERSERVER_CSP_RULE')
+region = os.environ.get("AWS_REGION")
+csp_rule = os.environ.get("JUPYTERSERVER_CSP_RULE")
 
-c.ServerApp.tornado_settings = {
-    "compress_response": True,
-    'headers': {
-        'Content-Security-Policy': csp_rule
-    }
-}
+c.ServerApp.tornado_settings = {"compress_response": True, "headers": {"Content-Security-Policy": csp_rule}}
 
 # Do not delete files to trash. Instead, permanently delete files.
 c.FileContentsManager.delete_to_trash = False
diff --git a/template/v2/dirs/etc/sagemaker-ui/workflows/sample_dag.py b/template/v2/dirs/etc/sagemaker-ui/workflows/sample_dag.py
@@ -1,21 +1,18 @@
 from airflow.decorators import dag
-from airflow.utils.dates import days_ago
 from airflow.operators.bash import BashOperator
 
-
 default_args = {
-    'owner': 'airflow',
+    "owner": "airflow",
 }
 
-@dag(default_args=default_args, tags=['sample'])
+
+@dag(default_args=default_args, tags=["sample"])
 def sample_dag():
     def sample_task():
-        _task = BashOperator(
-            task_id="hello_world",
-            bash_command="echo 'hello world!'"
-        )
+        _task = BashOperator(task_id="hello_world", bash_command="echo 'hello world!'")
         return _task
 
     task = sample_task()
 
+
 sample_dag = sample_dag()
diff --git a/template/v2/dirs/etc/sagemaker-ui/workflows/workflow_client.py b/template/v2/dirs/etc/sagemaker-ui/workflows/workflow_client.py
@@ -1,26 +1,24 @@
 import argparse
-import boto3
+from datetime import datetime, timezone
 from typing import Optional
+
+import boto3
 import requests
-from datetime import datetime, timezone
 
 JUPYTERLAB_URL = "http://default:8888/jupyterlab/default/"
 WORKFLOWS_API_ENDPOINT = "api/sagemaker/workflows"
 TIMESTAMP_FORMAT = "%Y-%m-%d %H:%M:%S.%f%z"
 DZ_CLIENT = boto3.client("datazone")
 
+
 def _validate_response(function_name: str, response: requests.Response):
     if response.status_code == 200:
         return response
     else:
-        raise RuntimeError(
-            f"{function_name} returned {response.status_code}: {str(response.content)}"
-        )
+        raise RuntimeError(f"{function_name} returned {response.status_code}: {str(response.content)}")
 
 
-def update_local_runner_status(
-    session: requests.Session, status: str, detailed_status: Optional[str] = None, **kwargs
-):
+def update_local_runner_status(session: requests.Session, status: str, detailed_status: Optional[str] = None, **kwargs):
     response = session.post(
         url=JUPYTERLAB_URL + WORKFLOWS_API_ENDPOINT + "/update-local-runner-status",
         headers={"X-Xsrftoken": session.cookies.get_dict()["_xsrf"]},
@@ -50,38 +48,41 @@ def stop_local_runner(session: requests.Session, **kwargs):
     )
     return _validate_response("StopLocalRunner", response)
 
+
 def check_blueprint(domain_id: str, **kwargs):
     try:
-        workflow_blueprint = DZ_CLIENT.list_environment_blueprints(domainIdentifier=domain_id, name='Workflows')['items']
+        workflow_blueprint = DZ_CLIENT.list_environment_blueprints(domainIdentifier=domain_id, name="Workflows")[
+            "items"
+        ]
         print(str(bool(workflow_blueprint)))
     except:
         print("False")
 
+
 COMMAND_REGISTRY = {
     "update-local-runner-status": update_local_runner_status,
     "start-local-runner": start_local_runner,
     "stop-local-runner": stop_local_runner,
-    "check-blueprint": check_blueprint
+    "check-blueprint": check_blueprint,
 }
 
+
 def main():
     parser = argparse.ArgumentParser(description="Workflow local runner client")
     subparsers = parser.add_subparsers(dest="command", help="Available commands")
 
-    update_status_parser = subparsers.add_parser(
-        "update-local-runner-status", help="Update status of local runner"
-    )
+    update_status_parser = subparsers.add_parser("update-local-runner-status", help="Update status of local runner")
     update_status_parser.add_argument("--status", type=str, required=True, help="Status to update")
-    update_status_parser.add_argument(
-        "--detailed-status", type=str, required=False, help="Detailed status text"
-    )
+    update_status_parser.add_argument("--detailed-status", type=str, required=False, help="Detailed status text")
 
     start_parser = subparsers.add_parser("start-local-runner", help="Start local runner")
 
     stop_parser = subparsers.add_parser("stop-local-runner", help="Stop local runner")
 
     check_blueprint_parser = subparsers.add_parser("check-blueprint", help="Check Workflows blueprint")
-    check_blueprint_parser.add_argument("--domain-id", type=str, required=True, help="Datazone Domain ID for blueprint check")
+    check_blueprint_parser.add_argument(
+        "--domain-id", type=str, required=True, help="Datazone Domain ID for blueprint check"
+    )
 
     args = parser.parse_args()
 
diff --git a/template/v2/dirs/etc/sagemaker/sm_pysdk_default_config.py b/template/v2/dirs/etc/sagemaker/sm_pysdk_default_config.py
@@ -1,152 +1,122 @@
-import yaml
-import os
-import sys
 import json
+import os
 import re
 
+import yaml
+
+
 def generate_intelligent_default_config(metadata: str) -> dict:
     config = {
-        'SchemaVersion': '1.0',
-        'SageMaker': {
-            'PythonSDK': {
-                'Modules': {
-                    'Session': {
-                        'DefaultS3Bucket': metadata['S3Bucket'],
-                        'DefaultS3ObjectKeyPrefix': metadata['S3ObjectKeyPrefix']
+        "SchemaVersion": "1.0",
+        "SageMaker": {
+            "PythonSDK": {
+                "Modules": {
+                    "Session": {
+                        "DefaultS3Bucket": metadata["S3Bucket"],
+                        "DefaultS3ObjectKeyPrefix": metadata["S3ObjectKeyPrefix"],
                     },
-                    'RemoteFunction': {
-                        'IncludeLocalWorkDir': True,
-                        'VpcConfig': {
-                            'SecurityGroupIds': metadata['SecurityGroupIds'],
-                            'Subnets': metadata['Subnets']
-                        }
+                    "RemoteFunction": {
+                        "IncludeLocalWorkDir": True,
+                        "VpcConfig": {"SecurityGroupIds": metadata["SecurityGroupIds"], "Subnets": metadata["Subnets"]},
                     },
-                    'NotebookJob': {
-                        'RoleArn': metadata['UserRoleArn'],
-                        'S3RootUri': f"s3://{metadata['S3Bucket']}/{metadata['S3ObjectKeyPrefix']}",
-                        'VpcConfig': {
-                            'SecurityGroupIds': metadata['SecurityGroupIds'],
-                            'Subnets': metadata['Subnets']
-                        }
+                    "NotebookJob": {
+                        "RoleArn": metadata["UserRoleArn"],
+                        "S3RootUri": f"s3://{metadata['S3Bucket']}/{metadata['S3ObjectKeyPrefix']}",
+                        "VpcConfig": {"SecurityGroupIds": metadata["SecurityGroupIds"], "Subnets": metadata["Subnets"]},
                     },
-                    'Serve': {
-                        'S3ModelDataUri': f"s3://{metadata['S3Bucket']}/{metadata['S3ObjectKeyPrefix']}"
-                    }
+                    "Serve": {"S3ModelDataUri": f"s3://{metadata['S3Bucket']}/{metadata['S3ObjectKeyPrefix']}"},
                 }
             },
-            'MonitoringSchedule': {
-                'MonitoringScheduleConfig': {
-                    'MonitoringJobDefinition': {
-                        'NetworkConfig': {
-                            'VpcConfig': {
-                                'SecurityGroupIds': metadata['SecurityGroupIds'],
-                                'Subnets': metadata['Subnets']
+            "MonitoringSchedule": {
+                "MonitoringScheduleConfig": {
+                    "MonitoringJobDefinition": {
+                        "NetworkConfig": {
+                            "VpcConfig": {
+                                "SecurityGroupIds": metadata["SecurityGroupIds"],
+                                "Subnets": metadata["Subnets"],
                             }
                         }
                     }
                 }
             },
-            'AutoMLJob': {
-                'AutoMLJobConfig': {
-                    'SecurityConfig': {
-                        'VpcConfig': {
-                            'SecurityGroupIds': metadata['SecurityGroupIds'],
-                            'Subnets': metadata['Subnets']
-                        }
+            "AutoMLJob": {
+                "AutoMLJobConfig": {
+                    "SecurityConfig": {
+                        "VpcConfig": {"SecurityGroupIds": metadata["SecurityGroupIds"], "Subnets": metadata["Subnets"]}
                     }
                 }
             },
-            'AutoMLJobV2': {
-                'SecurityConfig': {
-                    'VpcConfig': {
-                        'SecurityGroupIds': metadata['SecurityGroupIds'],
-                        'Subnets': metadata['Subnets']
-                    }
+            "AutoMLJobV2": {
+                "SecurityConfig": {
+                    "VpcConfig": {"SecurityGroupIds": metadata["SecurityGroupIds"], "Subnets": metadata["Subnets"]}
                 }
             },
-            'CompilationJob': {
-                'VpcConfig': {
-                    'SecurityGroupIds': metadata['SecurityGroupIds'],
-                    'Subnets': metadata['Subnets']
-                }
+            "CompilationJob": {
+                "VpcConfig": {"SecurityGroupIds": metadata["SecurityGroupIds"], "Subnets": metadata["Subnets"]}
             },
-            'Pipeline': {
-                'RoleArn': metadata['UserRoleArn']
+            "Pipeline": {"RoleArn": metadata["UserRoleArn"]},
+            "Model": {
+                "VpcConfig": {"SecurityGroupIds": metadata["SecurityGroupIds"], "Subnets": metadata["Subnets"]},
+                "ExecutionRoleArn": metadata["UserRoleArn"],
             },
-            'Model': {
-                'VpcConfig': {
-                    'SecurityGroupIds': metadata['SecurityGroupIds'],
-                    'Subnets': metadata['Subnets']
+            "ModelPackage": {"ValidationSpecification": {"ValidationRole": metadata["UserRoleArn"]}},
+            "ProcessingJob": {
+                "NetworkConfig": {
+                    "VpcConfig": {"SecurityGroupIds": metadata["SecurityGroupIds"], "Subnets": metadata["Subnets"]}
                 },
-                'ExecutionRoleArn': metadata['UserRoleArn']
-            },
-            'ModelPackage': {
-                'ValidationSpecification': {
-                    'ValidationRole': metadata['UserRoleArn']
-                }
+                "RoleArn": metadata["UserRoleArn"],
             },
-            'ProcessingJob': {
-                'NetworkConfig': {
-                    'VpcConfig': {
-                        'SecurityGroupIds': metadata['SecurityGroupIds'],
-                        'Subnets': metadata['Subnets']
-                    }
-                },
-                'RoleArn': metadata['UserRoleArn']
+            "TrainingJob": {
+                "RoleArn": metadata["UserRoleArn"],
+                "VpcConfig": {"SecurityGroupIds": metadata["SecurityGroupIds"], "Subnets": metadata["Subnets"]},
             },
-            'TrainingJob': {
-                'RoleArn': metadata['UserRoleArn'],
-                'VpcConfig': {
-                    'SecurityGroupIds': metadata['SecurityGroupIds'],
-                    'Subnets': metadata['Subnets']
-                }
-            }
-        }
+        },
     }
     return config
 
-if __name__=='__main__':   
-    try: 
+
+if __name__ == "__main__":
+    try:
         config = {}
-        resource_metadata = '/opt/ml/metadata/resource-metadata.json'
+        resource_metadata = "/opt/ml/metadata/resource-metadata.json"
 
-        PROJECT_S3_PATH = 'ProjectS3Path'
-        SECURITY_GROUP = 'SecurityGroup'
-        PRIVATE_SUBNETS = 'PrivateSubnets'
-        META_DATA = 'AdditionalMetadata'
-        EXECUTION_ROLE_ARN = 'ExecutionRoleArn'
-        CONFIG_FILE_NAME = 'config.yaml'
-        CONFIG_DIR = '/etc/xdg/sagemaker/'
+        PROJECT_S3_PATH = "ProjectS3Path"
+        SECURITY_GROUP = "SecurityGroup"
+        PRIVATE_SUBNETS = "PrivateSubnets"
+        META_DATA = "AdditionalMetadata"
+        EXECUTION_ROLE_ARN = "ExecutionRoleArn"
+        CONFIG_FILE_NAME = "config.yaml"
+        CONFIG_DIR = "/etc/xdg/sagemaker/"
 
         if os.path.exists(resource_metadata):
-            with open(resource_metadata, 'r') as file:
+            with open(resource_metadata, "r") as file:
                 data = json.load(file)
 
-            s3_path = data[META_DATA].get(PROJECT_S3_PATH, '')
+            s3_path = data[META_DATA].get(PROJECT_S3_PATH, "")
             metadata = {
                 # user provided bucket
-                'S3Bucket': re.search(r"s3://([^/]+)/", s3_path).group(1),
+                "S3Bucket": re.search(r"s3://([^/]+)/", s3_path).group(1),
                 # ${datazoneEnvironmentDomainId}/${datazoneEnvironmentProjectId}/${datazoneScopeName}/
-                'S3ObjectKeyPrefix': s3_path.split("//")[1].split("/", 1)[1],
+                "S3ObjectKeyPrefix": s3_path.split("//")[1].split("/", 1)[1],
                 # TODO: Is this a billing concern if set default
                 # 'InstanceType': 'ml.m5.xlarge',
-                'SecurityGroupIds': data[META_DATA].get(SECURITY_GROUP, '').split(','),
-                'Subnets': data[META_DATA].get(PRIVATE_SUBNETS, '').split(','),
-                'UserRoleArn': data[EXECUTION_ROLE_ARN]
+                "SecurityGroupIds": data[META_DATA].get(SECURITY_GROUP, "").split(","),
+                "Subnets": data[META_DATA].get(PRIVATE_SUBNETS, "").split(","),
+                "UserRoleArn": data[EXECUTION_ROLE_ARN],
             }
-            
+
             # Not create config file when invalid value exists in metadata
-            empty_values = [key for key, value in metadata.items() if value == "" or value == ['']]
+            empty_values = [key for key, value in metadata.items() if value == "" or value == [""]]
             if empty_values:
                 raise AttributeError(f"There are empty values in the metadata: {empty_values}")
 
             config = generate_intelligent_default_config(metadata)
         else:
-            raise FileNotFoundError('No resource-metadata.json exists on host!')
-            
+            raise FileNotFoundError("No resource-metadata.json exists on host!")
+
         # Write the config YAML file to default location of the admin config file
-        with open(os.path.join(CONFIG_DIR, CONFIG_FILE_NAME), 'w') as f:
+        with open(os.path.join(CONFIG_DIR, CONFIG_FILE_NAME), "w") as f:
             yaml.dump(config, f, default_flow_style=False, sort_keys=False)
-    
+
     except Exception as e:
-        print(f"Error: {e}, SageMaker PySDK intelligent config file is not valid!")
+        print(f"Error: {e}, SageMaker PySDK intelligent config file is not valid!")
diff --git a/test/test_dockerfile_based_harness.py b/test/test_dockerfile_based_harness.py
@@ -73,7 +73,10 @@
         ("sagemaker_studio_cli.test.Dockerfile", ["sagemaker_studio_cli"]),
         ("sm_spark_cli.test.Dockerfile", []),
         ("sagemaker_studio_dataengineering_sessions.test.Dockerfile", ["sagemaker-studio-dataengineering-sessions"]),
-        ("sagemaker_studio_dataengineering_extensions.test.Dockerfile", ["sagemaker-studio-dataengineering-extensions"]),
+        (
+            "sagemaker_studio_dataengineering_extensions.test.Dockerfile",
+            ["sagemaker-studio-dataengineering-extensions"],
+        ),
         ("sagemaker_studio.integ.Dockerfile", ["sagemaker_studio"]),
     ],
 )
@@ -149,7 +152,10 @@ def test_dockerfiles_for_cpu(
         ("sagemaker_studio_cli.test.Dockerfile", ["sagemaker_studio_cli"]),
         ("sm_spark_cli.test.Dockerfile", []),
         ("sagemaker_studio_dataengineering_sessions.test.Dockerfile", ["sagemaker-studio-dataengineering-sessions"]),
-        ("sagemaker_studio_dataengineering_extensions.test.Dockerfile", ["sagemaker-studio-dataengineering-extensions"]),
+        (
+            "sagemaker_studio_dataengineering_extensions.test.Dockerfile",
+            ["sagemaker-studio-dataengineering-extensions"],
+        ),
         ("sagemaker_studio.integ.Dockerfile", ["sagemaker_studio"]),
     ],
 )