"docs/source/en/using-diffusers/custom_pipeline_overview.mdx" did not exist on "d9c449ea30a4a3e8ed73883b45ae07a7177f60a5"
Unverified Commit 59f8e674 authored by AllentDan's avatar AllentDan Committed by GitHub
Browse files

Import turbomind in gradio server only when it is needed (#303)

parent 4279d8ca
......@@ -6,7 +6,6 @@ import random
from contextlib import contextmanager
from typing import Literal, Optional
from lmdeploy import turbomind as tm
from lmdeploy.model import MODELS, BaseModel
......@@ -30,6 +29,7 @@ class AsyncEngine:
"""
def __init__(self, model_path, instance_num=32, tp=1) -> None:
from lmdeploy import turbomind as tm
from lmdeploy.turbomind.tokenizer import Tokenizer
tokenizer_model_path = osp.join(model_path, 'triton_models',
'tokenizer')
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment