"vscode:/vscode.git/clone" did not exist on "f83d9a532f490e4cff27b78887e880ab67dfc8fd"
task_definition_frontend.json 2.49 KB
Newer Older
1
2
3
4
5
{
    "family": "Dynamo-frontend",
    "containerDefinitions": [
        {
            "name": "dynamo-vllm-frontend",
            "image": "nvcr.io/nvidia/ai-dynamo/vllm-runtime:my-tag",
            "repositoryCredentials": {
                "credentialsParameter": "arn:aws:secretsmanager:AWS_REGION:AWS_ID:secret:ngc_nvcr_access"
            },
            "cpu": 0,
            "portMappings": [
                {
                    "name": "8000",
                    "containerPort": 8000,
                    "hostPort": 8000,
                    "protocol": "tcp",
                    "appProtocol": "http"
                }
            ],
            "essential": true,
            "entryPoint": [
                "sh",
                "-c"
            ],
            "command": [
                "cd components/backends/vllm && python -m dynamo.frontend --router-mode kv & python3 -m dynamo.vllm --model Qwen/Qwen3-0.6B --enforce-eager"
            ],
            "environment": [
                {
                    "name": "ETCD_ENDPOINTS",
                    "value": "http://IP_ADDRESS:2379"
                },
                {
                    "name": "NATS_SERVER",
                    "value": "nats://IP_ADDRESS:4222"
                }
            ],
            "environmentFiles": [],
            "mountPoints": [],
            "volumesFrom": [],
            "ulimits": [],
            "logConfiguration": {
                "logDriver": "awslogs",
                "options": {
                    "awslogs-group": "/ecs/Dynamo-frontend",
                    "mode": "non-blocking",
                    "awslogs-create-group": "true",
                    "max-buffer-size": "25m",
                    "awslogs-region": "AWS_REGION",
                    "awslogs-stream-prefix": "ecs"
                },
                "secretOptions": []
            },
            "systemControls": [],
            "resourceRequirements": [
                {
                    "value": "1",
                    "type": "GPU"
                }
            ]
        }
    ],
    "taskRoleArn": "arn:aws:iam::AWS_ID:role/ecsTaskExecutionRole",
    "executionRoleArn": "arn:aws:iam::AWS_ID:role/ecsTaskExecutionRole",
    "networkMode": "host",
    "volumes": [],
    "placementConstraints": [],
    "requiresCompatibilities": [
        "EC2"
    ],
    "cpu": "2048",
    "memory": "40960",
    "runtimePlatform": {
        "cpuArchitecture": "X86_64",
        "operatingSystemFamily": "LINUX"
    },
    "enableFaultInjection": false
}