Commit 14201006 authored by zhuwenwen
Browse files

Merge branch 'v0.9.2-dev-wm-1' into 'v0.9.2-dev'

暂时去掉 profiling 标志位,避免影响其他模型

See merge request dcutoolkit/deeplearing/vllm!196
parents 7a97637e 8d971060
......@@ -2224,8 +2224,8 @@ class GPUModelRunner(LoRAModelRunnerMixin):
def profile_run(self) -> None:
# set profiling flag to avoid torch compile
set_profilling(True)
self._sync_device()
#set_profilling(True)
#self._sync_device()
# Profile with multimodal encoder & encoder cache.
# TODO: handle encoder-decoder models once we support them.
......@@ -2310,7 +2310,7 @@ class GPUModelRunner(LoRAModelRunnerMixin):
del hidden_states, output
self.encoder_cache.clear()
gc.collect()
set_profilling(False)
#set_profilling(False)
def capture_model(self) -> None:
if not self.use_cuda_graph:
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment