[Misc][Bugfix] Disable guided decoding for mistral tokenizer (#8521)

ee2bceaa · Roger Wang · GitHub · 1c1bb388 · ee2bceaa
Unverified Commit ee2bceaa authored Sep 16, 2024 by Roger Wang Committed by GitHub Sep 16, 2024
Hide whitespace changes
Inline Side-by-side

Showing 1 changed file with 23 additions and 0 deletions

vllm/model_executor/guided_decoding/__init__.py +23 -0

No files found.
--- a/vllm/model_executor/guided_decoding/__init__.py
+++ b/vllm/model_executor/guided_decoding/__init__.py
@@ -6,6 +6,7 @@ from vllm.entrypoints.openai.protocol import (
 from vllm.model_executor.guided_decoding.guided_fields import (
    GuidedDecodingRequest)
 from vllm.sampling_params import LogitsProcessor
+from vllm.transformers_utils.tokenizer import MistralTokenizer
 async def get_guided_decoding_logits_processor(
@@ -15,12 +16,23 @@ async def get_guided_decoding_logits_processor(
    request = _adapt_request_for_tool_use(request)
    if guided_decoding_backend == 'outlines':
+        if isinstance(tokenizer, MistralTokenizer):
+            raise NotImplementedError(
+                "Guided decoding with 'outlines' is currently not supported "
+                "for Mistral tokenizer. Please consider contributing to the "
+                "'outlines' project if you are interested in this feature.")
        # NOTE: lazy import outlines to avoid https://github.com/vllm-project/vllm/issues/4193
        from vllm.model_executor.guided_decoding.outlines_decoding import (  # noqa
            get_outlines_guided_decoding_logits_processor)
        return await get_outlines_guided_decoding_logits_processor(
            request, tokenizer)
    if guided_decoding_backend == 'lm-format-enforcer':
+        if isinstance(tokenizer, MistralTokenizer):
+            raise NotImplementedError(
+                "Guided decoding with 'lm-format-enforcer' is currently not "
+                "supported for Mistral tokenizer. Please consider contributing "
+                "to the 'lm-format-enforcer' project if you are interested "
+                "in this feature.")
        from vllm.model_executor.guided_decoding.lm_format_enforcer_decoding import (  # noqa
            get_lm_format_enforcer_guided_decoding_logits_processor)
        return await get_lm_format_enforcer_guided_decoding_logits_processor(
@@ -37,12 +49,23 @@ def get_local_guided_decoding_logits_processor(
    # request = _adapt_request_for_tool_use(request)
    if guided_decoding_backend == 'outlines':
+        if isinstance(tokenizer, MistralTokenizer):
+            raise NotImplementedError(
+                "Guided decoding with 'outlines' is currently not supported "
+                "for Mistral tokenizer. Please consider contributing to the "
+                "'outlines' project if you are interested in this feature.")
        # NOTE: lazy import outlines to avoid https://github.com/vllm-project/vllm/issues/4193
        from vllm.model_executor.guided_decoding.outlines_decoding import (  # noqa
            get_local_outlines_guided_decoding_logits_processor)
        return get_local_outlines_guided_decoding_logits_processor(
            guided_options, tokenizer)
    if guided_decoding_backend == 'lm-format-enforcer':
+        if isinstance(tokenizer, MistralTokenizer):
+            raise NotImplementedError(
+                "Guided decoding with 'lm-format-enforcer' is currently not "
+                "supported for Mistral tokenizer. Please consider contributing "
+                "to the 'lm-format-enforcer' project if you are interested "
+                "in this feature.")
        from vllm.model_executor.guided_decoding.lm_format_enforcer_decoding import (  # noqa
            get_local_lm_format_enforcer_guided_decoding_logits_processor)
        return get_local_lm_format_enforcer_guided_decoding_logits_processor(