forked from ai-dynamo/dynamo
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathtask_definition_frontend.json
More file actions
78 lines (78 loc) · 2.49 KB
/
task_definition_frontend.json
File metadata and controls
78 lines (78 loc) · 2.49 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
{
  "family": "Dynamo-frontend",
  "containerDefinitions": [
    {
      "name": "dynamo-vllm-frontend",
      "image": "nvcr.io/nvidia/ai-dynamo/vllm-runtime:my-tag",
      "repositoryCredentials": {
        "credentialsParameter": "arn:aws:secretsmanager:AWS_REGION:AWS_ID:secret:ngc_nvcr_access"
      },
      "cpu": 0,
      "portMappings": [
        {
          "name": "8000",
          "containerPort": 8000,
          "hostPort": 8000,
          "protocol": "tcp",
          "appProtocol": "http"
        }
      ],
      "essential": true,
      "entryPoint": ["sh", "-c"],
      "command": [
        "cd examples/backends/vllm && python -m dynamo.frontend --router-mode kv & python3 -m dynamo.vllm --model Qwen/Qwen3-0.6B --enforce-eager"
      ],
      "environment": [
        {
          "name": "ETCD_ENDPOINTS",
          "value": "http://IP_ADDRESS:2379"
        },
        {
          "name": "NATS_SERVER",
          "value": "nats://IP_ADDRESS:4222"
        }
      ],
      "environmentFiles": [],
      "mountPoints": [],
      "volumesFrom": [],
      "ulimits": [],
      "logConfiguration": {
        "logDriver": "awslogs",
        "options": {
          "awslogs-group": "/ecs/Dynamo-frontend",
          "mode": "non-blocking",
          "awslogs-create-group": "true",
          "max-buffer-size": "25m",
          "awslogs-region": "AWS_REGION",
          "awslogs-stream-prefix": "ecs"
        },
        "secretOptions": []
      },
      "systemControls": [],
      "resourceRequirements": [
        {
          "value": "1",
          "type": "GPU"
        }
      ]
    }
  ],
  "taskRoleArn": "arn:aws:iam::AWS_ID:role/ecsTaskExecutionRole",
  "executionRoleArn": "arn:aws:iam::AWS_ID:role/ecsTaskExecutionRole",
  "networkMode": "host",
  "volumes": [],
  "placementConstraints": [],
  "requiresCompatibilities": ["EC2"],
  "cpu": "2048",
  "memory": "40960",
  "runtimePlatform": {
    "cpuArchitecture": "X86_64",
    "operatingSystemFamily": "LINUX"
  },
  "enableFaultInjection": false
}