"...git@developer.sourcefind.cn:OpenDAS/ktransformers.git" did not exist on "3d62579a6a237223b4b8158b4b03c9ae10b6abf8"
Unverified commit 21a8fa16, authored by Yi Zhang and committed by GitHub
Browse files

tiny optimize for bench serving (#12553)

parent 7a21d8b2
...@@ -25,6 +25,7 @@ import warnings ...@@ -25,6 +25,7 @@ import warnings
from argparse import ArgumentParser from argparse import ArgumentParser
from dataclasses import dataclass, field from dataclasses import dataclass, field
from datetime import datetime from datetime import datetime
from functools import lru_cache
from json import JSONDecodeError from json import JSONDecodeError
from pathlib import Path from pathlib import Path
from typing import Any, AsyncGenerator, Dict, List, Optional, Tuple, Union from typing import Any, AsyncGenerator, Dict, List, Optional, Tuple, Union
...@@ -1484,9 +1485,15 @@ def sample_image_requests( ...@@ -1484,9 +1485,15 @@ def sample_image_requests(
return dataset return dataset
@lru_cache(maxsize=1)
def get_available_tokens(tokenizer):
    """Return every token id in the tokenizer's vocabulary as a list.

    The result is memoized with ``lru_cache(maxsize=1)``, so repeated calls
    with the same tokenizer reuse one list instead of rebuilding it from
    ``tokenizer.get_vocab()`` on every call.

    Args:
        tokenizer: Object exposing ``get_vocab()``, which returns a mapping
            whose values are token ids. It must be hashable, because
            ``lru_cache`` uses the call arguments as the cache key.

    Returns:
        A list built from the values of ``tokenizer.get_vocab()``. The same
        list object is handed back on every cache hit, so callers should
        treat it as read-only.
    """
    # maxsize=1 keeps only the most recently used tokenizer's vocabulary;
    # calling with a different tokenizer evicts the previous entry.
    return list(tokenizer.get_vocab().values())
def gen_prompt(tokenizer, token_num):
    """Generate a random prompt by decoding randomly chosen vocabulary token ids.

    Args:
        tokenizer: Object providing ``get_vocab()`` (used through
            ``get_available_tokens``) and ``decode()``.
        token_num: Number of token ids to sample.

    Returns:
        The result of ``tokenizer.decode`` applied to the sampled token ids.

    NOTE(review): the sampled id list has ``token_num`` entries, but whether
    re-encoding the decoded text yields exactly that many tokens depends on
    the tokenizer -- confirm if callers rely on an exact length.
    """
    # Reuse the cached vocabulary id list rather than rebuilding it per call.
    all_available_tokens = get_available_tokens(tokenizer)
    # random.choices samples with replacement, so ids may repeat.
    selected_tokens = random.choices(all_available_tokens, k=token_num)
    return tokenizer.decode(selected_tokens)
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment