Unverified commit 35229c74, authored by julienmancuso, committed by GitHub
Browse files

fix: set gpus as strings in config files (#1123)

parent b3da9427
...@@ -34,7 +34,7 @@ VllmWorker: ...@@ -34,7 +34,7 @@ VllmWorker:
ServiceArgs: ServiceArgs:
workers: 1 workers: 1
resources: resources:
gpu: 1 gpu: '1'
common-configs: [model, block-size, max-model-len] common-configs: [model, block-size, max-model-len]
Planner: Planner:
......
...@@ -39,7 +39,7 @@ VllmWorker: ...@@ -39,7 +39,7 @@ VllmWorker:
ServiceArgs: ServiceArgs:
workers: 1 workers: 1
resources: resources:
gpu: 1 gpu: '1'
common-configs: [model, block-size, max-model-len, router, kv-transfer-config] common-configs: [model, block-size, max-model-len, router, kv-transfer-config]
Planner: Planner:
......
...@@ -42,7 +42,7 @@ VllmWorker: ...@@ -42,7 +42,7 @@ VllmWorker:
ServiceArgs: ServiceArgs:
workers: 1 workers: 1
resources: resources:
gpu: 1 gpu: '1'
common-configs: [model, block-size, max-model-len, router, kv-transfer-config] common-configs: [model, block-size, max-model-len, router, kv-transfer-config]
PrefillWorker: PrefillWorker:
...@@ -50,7 +50,7 @@ PrefillWorker: ...@@ -50,7 +50,7 @@ PrefillWorker:
ServiceArgs: ServiceArgs:
workers: 1 workers: 1
resources: resources:
gpu: 1 gpu: '1'
common-configs: [model, block-size, max-model-len, kv-transfer-config] common-configs: [model, block-size, max-model-len, kv-transfer-config]
Planner: Planner:
......
...@@ -49,7 +49,7 @@ VllmWorker: ...@@ -49,7 +49,7 @@ VllmWorker:
ServiceArgs: ServiceArgs:
workers: 1 workers: 1
resources: resources:
gpu: 8 gpu: '8'
PrefillWorker: PrefillWorker:
model: nvidia/Llama-3.1-405B-Instruct-FP8 model: nvidia/Llama-3.1-405B-Instruct-FP8
...@@ -63,4 +63,4 @@ PrefillWorker: ...@@ -63,4 +63,4 @@ PrefillWorker:
ServiceArgs: ServiceArgs:
workers: 1 workers: 1
resources: resources:
gpu: 8 gpu: '8'
\ No newline at end of file \ No newline at end of file
...@@ -35,5 +35,5 @@ VllmWorker: ...@@ -35,5 +35,5 @@ VllmWorker:
ServiceArgs: ServiceArgs:
workers: 1 workers: 1
resources: resources:
gpu: 1 gpu: '1'
common-configs: [model, block-size, max-model-len] common-configs: [model, block-size, max-model-len]
...@@ -34,7 +34,7 @@ VllmWorker: ...@@ -34,7 +34,7 @@ VllmWorker:
ServiceArgs: ServiceArgs:
workers: 1 workers: 1
resources: resources:
gpu: 16 gpu: '16'
common-configs: [model, block-size, max-model-len, kv-transfer-config, tensor-parallel-size] common-configs: [model, block-size, max-model-len, kv-transfer-config, tensor-parallel-size]
PrefillWorker: PrefillWorker:
...@@ -42,5 +42,5 @@ PrefillWorker: ...@@ -42,5 +42,5 @@ PrefillWorker:
ServiceArgs: ServiceArgs:
workers: 1 workers: 1
resources: resources:
gpu: 16 gpu: '16'
common-configs: [model, block-size, max-model-len, kv-transfer-config, tensor-parallel-size] common-configs: [model, block-size, max-model-len, kv-transfer-config, tensor-parallel-size]
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment