Unverified commit c1c0d00b, authored by Roy and committed by GitHub
Browse files

Don't use cupy when `enforce_eager=True` (#3037)

parent d9f726c4
......@@ -284,7 +284,10 @@ class LLMEngine:
is_driver_worker=True,
)
self._run_workers("init_model", cupy_port=get_open_port())
# don't use cupy for eager mode
self._run_workers("init_model",
cupy_port=get_open_port()
if not model_config.enforce_eager else None)
self._run_workers(
"load_model",
max_concurrent_workers=self.parallel_config.
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment