Commit 66b809cc authored by zhuwenwen's avatar zhuwenwen
Browse files

Merge tag 'v0.7.2' into v0.7.2-dev

parents 37b63c24 0408efc6
# SPDX-License-Identifier: Apache-2.0
from typing import List
from vllm.config import SchedulerConfig
......
# SPDX-License-Identifier: Apache-2.0
from typing import Callable, List, Optional, Tuple
from vllm.lora.request import LoRARequest
......
# SPDX-License-Identifier: Apache-2.0
from typing import List
from typing import Sequence as GenericSequence
from typing import cast
......
# SPDX-License-Identifier: Apache-2.0
import asyncio
from abc import ABC, abstractmethod
from typing import AsyncGenerator, List, Mapping, Optional
......
# SPDX-License-Identifier: Apache-2.0
"""
NOTE: This API server is used only for demonstrating usage of AsyncEngine
and simple performance benchmarks. It is not intended for production use.
......
# SPDX-License-Identifier: Apache-2.0
import asyncio
import codecs
import json
......@@ -408,7 +410,7 @@ class BaseMultiModalItemTracker(ABC, Generic[_T]):
return "<image>"
if model_type == "mllama":
return "<|image|>"
if model_type == "qwen2_vl":
if model_type in ("qwen2_vl", "qwen2_5_vl"):
return "<|vision_start|><|image_pad|><|vision_end|>"
if model_type == "molmo":
return ""
......@@ -428,7 +430,7 @@ class BaseMultiModalItemTracker(ABC, Generic[_T]):
return "(<audio>./</audio>)"
raise TypeError(f"Unknown model type: {model_type}")
elif modality == "video":
if model_type == "qwen2_vl":
if model_type in ("qwen2_vl", "qwen2_5_vl"):
return "<|vision_start|><|video_pad|><|vision_end|>"
if model_type in ("minicpmo", "minicpmv"):
return "(<video>./</video>)"
......
# SPDX-License-Identifier: Apache-2.0
import asyncio
import signal
from http import HTTPStatus
......
# SPDX-License-Identifier: Apache-2.0
import itertools
import warnings
from contextlib import contextmanager
......
# SPDX-License-Identifier: Apache-2.0
from typing import List, Optional, Union
from vllm.logger import init_logger
......
# SPDX-License-Identifier: Apache-2.0
import asyncio
import atexit
import gc
......
# SPDX-License-Identifier: Apache-2.0
"""
This file contains the command line arguments for the vLLM's
OpenAI-compatible server. It is kept in a separate file for documentation
......
# SPDX-License-Identifier: Apache-2.0
from functools import lru_cache, partial
from typing import Dict, FrozenSet, Iterable, List, Optional, Union
......
# SPDX-License-Identifier: Apache-2.0
# Adapted from
# https://github.com/lm-sys/FastChat/blob/168ccc29d3f7edc50823016105c024fe2282732a/fastchat/protocol/openai_api_protocol.py
import re
......
# SPDX-License-Identifier: Apache-2.0
from .abs_reasoning_parsers import ReasoningParser, ReasoningParserManager
from .deepseek_r1_reasoning_parser import DeepSeekR1ReasoningParser
......
# SPDX-License-Identifier: Apache-2.0
import os
from functools import cached_property
from typing import Callable, Dict, List, Optional, Sequence, Tuple, Type, Union
......
# SPDX-License-Identifier: Apache-2.0
import re
from typing import Optional, Sequence, Tuple, Union
......
# SPDX-License-Identifier: Apache-2.0
import asyncio
from http import HTTPStatus
from io import StringIO
......
# SPDX-License-Identifier: Apache-2.0
import asyncio
import json
import time
......
# SPDX-License-Identifier: Apache-2.0
import asyncio
import time
from typing import AsyncGenerator, AsyncIterator, Dict, List, Optional
......
# SPDX-License-Identifier: Apache-2.0
import asyncio
import base64
import time
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment