Commit 66b809cc authored by zhuwenwen's avatar zhuwenwen
Browse files

Merge tag 'v0.7.2' into v0.7.2-dev

parents 37b63c24 0408efc6
# SPDX-License-Identifier: Apache-2.0
import sys
import os
from contextlib import nullcontext
......
# SPDX-License-Identifier: Apache-2.0
import pytest
import os
......
# SPDX-License-Identifier: Apache-2.0
"""Tests for HF_HUB_OFFLINE mode"""
import importlib
import sys
......
# SPDX-License-Identifier: Apache-2.0
from typing import List
import pytest
......
# SPDX-License-Identifier: Apache-2.0
from typing import List, Optional, Tuple, Union
from vllm.entrypoints.openai.protocol import (ChatCompletionRequest,
......
# SPDX-License-Identifier: Apache-2.0
"""
This file test accuracy of the vLLM server via LMEval.
It uses local-completions, which interacts with vLLM
......
# SPDX-License-Identifier: Apache-2.0
import asyncio
import contextlib
import random
......
# SPDX-License-Identifier: Apache-2.0
from typing import Dict, List
import openai
......
# SPDX-License-Identifier: Apache-2.0
import asyncio
from http import HTTPStatus
from typing import List
......
# SPDX-License-Identifier: Apache-2.0
# imports for guided decoding tests
import json
import re
......
# SPDX-License-Identifier: Apache-2.0
from typing import NamedTuple
import os
......
# SPDX-License-Identifier: Apache-2.0
import pytest
import os
......
# SPDX-License-Identifier: Apache-2.0
import os
import openai # use the official client for correctness check
import pytest
......
# SPDX-License-Identifier: Apache-2.0
import json
import pytest
......
# SPDX-License-Identifier: Apache-2.0
# imports for guided decoding tests
import json
import re
......
# SPDX-License-Identifier: Apache-2.0
import base64
import numpy as np
......
# SPDX-License-Identifier: Apache-2.0
import openai
import pytest
import os
......
# SPDX-License-Identifier: Apache-2.0
import asyncio
import json
import shutil
......
# SPDX-License-Identifier: Apache-2.0
import subprocess
import sys
import tempfile
......@@ -204,6 +206,7 @@ EXPECTED_METRICS_V1 = [
"vllm:gpu_cache_usage_perc",
"vllm:prompt_tokens_total",
"vllm:generation_tokens_total",
"vllm:request_success_total",
"vllm:request_prompt_tokens_sum",
"vllm:request_prompt_tokens_bucket",
"vllm:request_prompt_tokens_count",
......
# SPDX-License-Identifier: Apache-2.0
import openai # use the official client for correctness check
import pytest
import os
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment