Unverified commit a6d970e9, authored by Schwinn Saereesitthipitak, committed by GitHub
Browse files

feat: refactor GMS client memory manager with tiered API (#6549)

parent 651ef5b5
......
@@ -44,7 +44,7 @@ class SGLangWithGMSProcess(ManagedProcess):
 "gms",
 "--enable-memory-saver",
 "--mem-fraction-static",
-"0.8",
+"0.9",
 "--port",
 str(sglang_port),
 ],
......
......
@@ -54,7 +54,7 @@ class VLLMWithGMSProcess(ManagedProcess):
 "gms",
 "--enable-sleep-mode",
 "--gpu-memory-utilization",
-"0.8",
+"0.9",
 "--kv-events-config",
 kv_events_cfg,
 ],
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment