Unverified commit 0678beaa, authored by Liangsheng Yin, committed by GitHub
Browse files

[spec-v2] Fix incompatibility with constrained decoding (#12615)

parent c2d4716d
...@@ -311,6 +311,7 @@ class TpModelWorker(BaseTpWorker): ...@@ -311,6 +311,7 @@ class TpModelWorker(BaseTpWorker):
set_random_seed(self.random_seed) set_random_seed(self.random_seed)
self.enable_overlap = not server_args.disable_overlap_schedule self.enable_overlap = not server_args.disable_overlap_schedule
self.enable_spec = server_args.speculative_algorithm is not None
self.hicache_layer_transfer_counter = None self.hicache_layer_transfer_counter = None
@property @property
...@@ -383,6 +384,7 @@ class TpModelWorker(BaseTpWorker): ...@@ -383,6 +384,7 @@ class TpModelWorker(BaseTpWorker):
if ( if (
self.enable_overlap self.enable_overlap
and not self.enable_spec
and model_worker_batch.sampling_info.grammars is not None and model_worker_batch.sampling_info.grammars is not None
): ):
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment