@@ -433,6 +433,14 @@ Parameters:
433433 Type : Number
434434 Description : ' The desired number of tasks running for ML Engine ECS service'
435435 Default : 2
436+ MLEngineFargateTaskCPUValue :
437+ Type : Number
438+ Default : 2048
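439+ Description : ' CPU units for AWS Fargate per ML Engine ECS task (1024 units = 1 vCPU). Must be a Fargate-supported CPU value that is compatible with the task memory value'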
440+ MLEngineFargateTaskMemoryValue :
441+ Type : Number
442+ Default : 4096
443+ Description : ' Memory in MiB for AWS Fargate per ML Engine ECS task. Must be within the memory range Fargate supports for the task CPU value'
436444Metadata :
437445 AWS::CloudFormation::Interface :
438446 ParameterGroups :
@@ -540,13 +548,39 @@ Metadata:
540548 - GenaiEngineHallucinationCheckMaxTokenLimit
541549 - GenaiEngineToxicityCheckMaxTokenLimit
542550 - GenaiEngineUsePIIModelV2
551+ - Label :
552+ default : ' Advanced ML Engine'
553+ Parameters :
554+ - MLEngineVersion
555+ - MLEngineContainerImageLocation
556+ - MLEngineBYOAppSecurityGroupIDs
557+ - MLEngineFargateTaskCPUValue
558+ - MLEngineFargateTaskMemoryValue
559+ - Label :
560+ default : ' Advanced ML Engine (IAM)'
561+ Parameters :
562+ - MLEngineBYOTaskRoleIAMArn
563+ - MLEngineBYOTaskExecutionRoleIAMArn
564+ - Label :
565+ default : ' Advanced ML Engine (Scalability)'
566+ Parameters :
567+ - MLEngineECSServiceTaskDesiredCount
568+ - MLEngineECSAutoscalingMinCapacity
569+ - MLEngineECSAutoscalingMaxCapacity
570+ - MLEngineECSScaleCPUTargetValue
571+ - MLEngineECSScaleMemoryTargetValue
572+ - MLEngineECSScaleInCooldownInSecs
573+ - MLEngineECSScaleOutCooldownInSecs
574+ - Label :
575+ default : ' Advanced ML Engine (Platform Monitoring)'
576+ Parameters :
577+ - MLEngineECSCPUAlarmThreshold
578+ - MLEngineECSMemoryAlarmThreshold
543579 ParameterLabels :
544580 ArthurResourceNamespace :
545581 default : ' Arthur Platform Resource Namespace'
546582 ArthurResourceNameSuffix :
547583 default : ' Arthur Platform Resource Name Suffix'
548- MLEngineContainerImageLocation :
549- default : ' ML Engine Container Image Location'
550584 ContainerRepositoryUsername :
551585 default : ' Container Repository Username'
552586 ContainerRepositoryPassword :
@@ -723,6 +757,10 @@ Metadata:
723757 default : ' ML Engine ECS Autoscaling Minimum Capacity'
724758 MLEngineECSServiceTaskDesiredCount :
725759 default : ' ML Engine ECS Service Task Desired Count'
760+ MLEngineFargateTaskCPUValue :
761+ default : ' ML Engine ECS CPU Value. Must be compatible with ECS Memory Value'
762+ MLEngineFargateTaskMemoryValue :
763+ default : ' ML Engine ECS Memory Value. Must be compatible with ECS CPU Value'
726764Conditions :
727765 ContainerRepositoryCredentialRequired :
728766 !Not [ !Equals [ !Ref ContainerRepositoryUsername, '' ] ]
@@ -900,6 +938,8 @@ Resources:
900938 MLEngineClientCredentialsSecretARN : !GetAtt [ MLEngineSecretsStack, Outputs.MLEngineClientCredentialsSecretOutput ]
901939 GenaiEngineInternalAPIKeySecretARN : !GetAtt [ GenaiEngineSecretsStack, Outputs.GenaiEngineAPIKeySecretOutput ]
902940 GenaiEngineInternalIngressHost : !Ref GenaiEngineIngressURL
941+ MLEngineFargateTaskCPUValue : !Ref MLEngineFargateTaskCPUValue
942+ MLEngineFargateTaskMemoryValue : !Ref MLEngineFargateTaskMemoryValue
903943 TemplateURL : " https://arthur-cft.s3.us-east-2.amazonaws.com/arthur-engine/templates/REPLACE_ME_GENAI_ENGINE_VERSION/ml-engine/arthur-ml-engine-ecs-task-definition.yml"
904944 GenaiEngineLBStack :
905945 Type : AWS::CloudFormation::Stack
0 commit comments