Commit 35229c74 (unverified), authored by julienmancuso, committed by GitHub
Browse files

fix: set gpus as strings in config files (#1123)

parent b3da9427
......@@ -34,7 +34,7 @@ VllmWorker:
ServiceArgs:
workers: 1
resources:
- gpu: 1
+ gpu: '1'
common-configs: [model, block-size, max-model-len]
Planner:
......
......@@ -39,7 +39,7 @@ VllmWorker:
ServiceArgs:
workers: 1
resources:
- gpu: 1
+ gpu: '1'
common-configs: [model, block-size, max-model-len, router, kv-transfer-config]
Planner:
......
......@@ -42,7 +42,7 @@ VllmWorker:
ServiceArgs:
workers: 1
resources:
- gpu: 1
+ gpu: '1'
common-configs: [model, block-size, max-model-len, router, kv-transfer-config]
PrefillWorker:
......@@ -50,7 +50,7 @@ PrefillWorker:
ServiceArgs:
workers: 1
resources:
- gpu: 1
+ gpu: '1'
common-configs: [model, block-size, max-model-len, kv-transfer-config]
Planner:
......
......@@ -49,7 +49,7 @@ VllmWorker:
ServiceArgs:
workers: 1
resources:
- gpu: 8
+ gpu: '8'
PrefillWorker:
model: nvidia/Llama-3.1-405B-Instruct-FP8
......@@ -63,4 +63,4 @@ PrefillWorker:
ServiceArgs:
workers: 1
resources:
- gpu: 8
\ No newline at end of file
+ gpu: '8'
\ No newline at end of file
......@@ -35,5 +35,5 @@ VllmWorker:
ServiceArgs:
workers: 1
resources:
- gpu: 1
+ gpu: '1'
common-configs: [model, block-size, max-model-len]
......@@ -34,7 +34,7 @@ VllmWorker:
ServiceArgs:
workers: 1
resources:
- gpu: 16
+ gpu: '16'
common-configs: [model, block-size, max-model-len, kv-transfer-config, tensor-parallel-size]
PrefillWorker:
......@@ -42,5 +42,5 @@ PrefillWorker:
ServiceArgs:
workers: 1
resources:
- gpu: 16
+ gpu: '16'
common-configs: [model, block-size, max-model-len, kv-transfer-config, tensor-parallel-size]
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment