"lib/vscode:/vscode.git/clone" did not exist on "122777c8aaef748d6756095fc8ea35e31cc1094b"
Commit 66b809cc authored by zhuwenwen's avatar zhuwenwen
Browse files

Merge tag 'v0.7.2' into v0.7.2-dev

parents 37b63c24 0408efc6
# SPDX-License-Identifier: Apache-2.0
import sys import sys
import os import os
from contextlib import nullcontext from contextlib import nullcontext
......
# SPDX-License-Identifier: Apache-2.0
import pytest import pytest
import os import os
......
# SPDX-License-Identifier: Apache-2.0
"""Tests for HF_HUB_OFFLINE mode""" """Tests for HF_HUB_OFFLINE mode"""
import importlib import importlib
import sys import sys
......
# SPDX-License-Identifier: Apache-2.0
from typing import List from typing import List
import pytest import pytest
......
# SPDX-License-Identifier: Apache-2.0
from typing import List, Optional, Tuple, Union from typing import List, Optional, Tuple, Union
from vllm.entrypoints.openai.protocol import (ChatCompletionRequest, from vllm.entrypoints.openai.protocol import (ChatCompletionRequest,
......
# SPDX-License-Identifier: Apache-2.0
""" """
This file test accuracy of the vLLM server via LMEval. This file test accuracy of the vLLM server via LMEval.
It uses local-completions, which interacts with vLLM It uses local-completions, which interacts with vLLM
......
# SPDX-License-Identifier: Apache-2.0
import asyncio import asyncio
import contextlib import contextlib
import random import random
......
# SPDX-License-Identifier: Apache-2.0
from typing import Dict, List from typing import Dict, List
import openai import openai
......
# SPDX-License-Identifier: Apache-2.0
import asyncio import asyncio
from http import HTTPStatus from http import HTTPStatus
from typing import List from typing import List
......
# SPDX-License-Identifier: Apache-2.0
# imports for guided decoding tests # imports for guided decoding tests
import json import json
import re import re
......
# SPDX-License-Identifier: Apache-2.0
from typing import NamedTuple from typing import NamedTuple
import os import os
......
# SPDX-License-Identifier: Apache-2.0
import pytest import pytest
import os import os
......
# SPDX-License-Identifier: Apache-2.0
import os import os
import openai # use the official client for correctness check import openai # use the official client for correctness check
import pytest import pytest
......
# SPDX-License-Identifier: Apache-2.0
import json import json
import pytest import pytest
......
# SPDX-License-Identifier: Apache-2.0
# imports for guided decoding tests # imports for guided decoding tests
import json import json
import re import re
......
# SPDX-License-Identifier: Apache-2.0
import base64 import base64
import numpy as np import numpy as np
......
# SPDX-License-Identifier: Apache-2.0
import openai import openai
import pytest import pytest
import os import os
......
# SPDX-License-Identifier: Apache-2.0
import asyncio import asyncio
import json import json
import shutil import shutil
......
# SPDX-License-Identifier: Apache-2.0
import subprocess import subprocess
import sys import sys
import tempfile import tempfile
...@@ -204,6 +206,7 @@ EXPECTED_METRICS_V1 = [ ...@@ -204,6 +206,7 @@ EXPECTED_METRICS_V1 = [
"vllm:gpu_cache_usage_perc", "vllm:gpu_cache_usage_perc",
"vllm:prompt_tokens_total", "vllm:prompt_tokens_total",
"vllm:generation_tokens_total", "vllm:generation_tokens_total",
"vllm:request_success_total",
"vllm:request_prompt_tokens_sum", "vllm:request_prompt_tokens_sum",
"vllm:request_prompt_tokens_bucket", "vllm:request_prompt_tokens_bucket",
"vllm:request_prompt_tokens_count", "vllm:request_prompt_tokens_count",
......
# SPDX-License-Identifier: Apache-2.0
import openai # use the official client for correctness check import openai # use the official client for correctness check
import pytest import pytest
import os import os
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment