Commit d969c150 authored by zhuwenwen
Browse files

add cudagraph

parent fbfb40ad
...@@ -324,8 +324,7 @@ class ModelConfig: ...@@ -324,8 +324,7 @@ class ModelConfig:
# Set enforce_eager to False if the value is unset. # Set enforce_eager to False if the value is unset.
if self.enforce_eager is None: if self.enforce_eager is None:
# self.enforce_eager = False self.enforce_eager = False
self.enforce_eager = True
sliding_window = getattr(self.hf_text_config, "sliding_window", None) sliding_window = getattr(self.hf_text_config, "sliding_window", None)
has_interleaved_attention = (sliding_window is not None) and ( has_interleaved_attention = (sliding_window is not None) and (
......
...@@ -598,7 +598,6 @@ class EngineArgs: ...@@ -598,7 +598,6 @@ class EngineArgs:
'parsed into a dictionary.') 'parsed into a dictionary.')
parser.add_argument('--enforce-eager', parser.add_argument('--enforce-eager',
action='store_true', action='store_true',
default=True,
help='Always use eager-mode PyTorch. If False, ' help='Always use eager-mode PyTorch. If False, '
'will use eager mode and CUDA graph in hybrid ' 'will use eager mode and CUDA graph in hybrid '
'for maximal performance and flexibility.') 'for maximal performance and flexibility.')
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment