Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
change
sglang
Commits
47f20da2
"tutorials/vscode:/vscode.git/clone" did not exist on "53b9a4bdbc36e5253adfbb780dacccffa66c4fb7"
Unverified
Commit
47f20da2
authored
Sep 01, 2024
by
Liangsheng Yin
Committed by
GitHub
Sep 01, 2024
Browse files
Fix regex mask (#1296)
parent
4a9f8ea4
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing 2 changed files with 6 additions and 6 deletions
+6
-6
python/sglang/srt/layers/sampler.py
python/sglang/srt/layers/sampler.py
+1
-1
python/sglang/srt/sampling/sampling_batch_info.py
python/sglang/srt/sampling/sampling_batch_info.py
+5
-5
No files found.
python/sglang/srt/layers/sampler.py
View file @
47f20da2
...
@@ -63,7 +63,7 @@ class Sampler(CustomOp):
         logits.add_(sampling_info.logit_bias)
     if sampling_info.vocab_mask is not None:
-        logits = logits.masked_fill(~sampling_info.vocab_mask, float("-inf"))
+        logits = logits.masked_fill(sampling_info.vocab_mask, float("-inf"))
     logits = self._apply_penalties(logits, sampling_info)
...
...
python/sglang/srt/sampling/sampling_batch_info.py
View file @
47f20da2
...
@@ -154,15 +154,15 @@ class SamplingBatchInfo:
         self.vocab_mask = None
         if has_regex:
+            self.vocab_mask = torch.zeros(
+                bs, self.vocab_size, dtype=torch.bool, device=device
+            )
             for i, req in enumerate(reqs):
                 if req.regex_fsm is not None:
-                    if self.vocab_mask is None:
-                        self.vocab_mask = torch.zeros(
-                            bs, self.vocab_size, dtype=torch.bool, device=device
-                        )
+                    self.vocab_mask[i].fill_(1)
                     self.vocab_mask[i][
                         req.regex_fsm.get_next_instruction(req.regex_fsm_state).tokens
-                    ] = 1
+                    ] = 0

     def filter(self, unfinished_indices: List[int], new_indices: torch.Tensor):
         self.penalizer_orchestrator.filter(unfinished_indices, new_indices)
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment