Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
change
sglang
Commits
150d7020
Unverified
Commit
150d7020
authored
Apr 23, 2024
by
Liangsheng Yin
Committed by
GitHub
Apr 23, 2024
Browse files
Revert removing the unused imports (#385)
parent
9acc6e35
Changes
33
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
44 additions
and
19 deletions
+44
-19
python/sglang/api.py
python/sglang/api.py
+4
-0
python/sglang/backend/anthropic.py
python/sglang/backend/anthropic.py
+4
-0
python/sglang/backend/base_backend.py
python/sglang/backend/base_backend.py
+1
-1
python/sglang/backend/openai.py
python/sglang/backend/openai.py
+1
-1
python/sglang/backend/runtime_endpoint.py
python/sglang/backend/runtime_endpoint.py
+4
-3
python/sglang/backend/vertexai.py
python/sglang/backend/vertexai.py
+3
-0
python/sglang/lang/chat_template.py
python/sglang/lang/chat_template.py
+2
-2
python/sglang/lang/compiler.py
python/sglang/lang/compiler.py
+7
-1
python/sglang/lang/interpreter.py
python/sglang/lang/interpreter.py
+2
-1
python/sglang/lang/ir.py
python/sglang/lang/ir.py
+1
-1
python/sglang/lang/tracer.py
python/sglang/lang/tracer.py
+5
-1
python/sglang/srt/hf_transformers_utils.py
python/sglang/srt/hf_transformers_utils.py
+1
-1
python/sglang/srt/managers/detokenizer_manager.py
python/sglang/srt/managers/detokenizer_manager.py
+1
-1
python/sglang/srt/managers/router/radix_cache.py
python/sglang/srt/managers/router/radix_cache.py
+2
-0
python/sglang/srt/models/commandr.py
python/sglang/srt/models/commandr.py
+1
-1
python/sglang/srt/models/llama2.py
python/sglang/srt/models/llama2.py
+1
-1
python/sglang/srt/models/llava.py
python/sglang/srt/models/llava.py
+1
-1
python/sglang/srt/models/mixtral.py
python/sglang/srt/models/mixtral.py
+1
-1
python/sglang/srt/models/qwen.py
python/sglang/srt/models/qwen.py
+1
-1
python/sglang/srt/models/qwen2.py
python/sglang/srt/models/qwen2.py
+1
-1
No files found.
python/sglang/api.py
View file @
150d7020
...
...
@@ -3,7 +3,11 @@
import
re
from
typing
import
Callable
,
List
,
Optional
,
Union
from
sglang.backend.anthropic
import
Anthropic
from
sglang.backend.base_backend
import
BaseBackend
from
sglang.backend.openai
import
OpenAI
from
sglang.backend.runtime_endpoint
import
RuntimeEndpoint
from
sglang.backend.vertexai
import
VertexAI
from
sglang.global_config
import
global_config
from
sglang.lang.ir
import
(
SglExpr
,
...
...
python/sglang/backend/anthropic.py
View file @
150d7020
from
typing
import
List
,
Optional
,
Union
import
numpy
as
np
from
sglang.backend.base_backend
import
BaseBackend
from
sglang.lang.chat_template
import
get_chat_template
from
sglang.lang.interpreter
import
StreamExecutor
...
...
python/sglang/backend/base_backend.py
View file @
150d7020
from
typing
import
List
,
Optional
,
Union
from
typing
import
Callable
,
List
,
Optional
,
Union
from
sglang.lang.chat_template
import
get_chat_template
from
sglang.lang.interpreter
import
StreamExecutor
...
...
python/sglang/backend/openai.py
View file @
150d7020
import
logging
import
time
from
typing
import
List
,
Optional
from
typing
import
Callable
,
List
,
Optional
,
Union
import
numpy
as
np
...
...
python/sglang/backend/runtime_endpoint.py
View file @
150d7020
import
json
from
typing
import
List
,
Optional
from
typing
import
Callable
,
List
,
Optional
,
Union
import
numpy
as
np
import
requests
from
sglang.backend.base_backend
import
BaseBackend
from
sglang.global_config
import
global_config
from
sglang.lang.chat_template
import
get_chat_template_by_model_path
from
sglang.lang.interpreter
import
StreamExecutor
from
sglang.lang.ir
import
SglSamplingParams
from
sglang.utils
import
find_printable_text
,
http_request
from
sglang.lang.ir
import
SglArgument
,
SglSamplingParams
from
sglang.utils
import
encode_image_base64
,
find_printable_text
,
http_request
class
RuntimeEndpoint
(
BaseBackend
):
...
...
python/sglang/backend/vertexai.py
View file @
150d7020
import
os
import
warnings
from
typing
import
List
,
Optional
,
Union
import
numpy
as
np
from
sglang.backend.base_backend
import
BaseBackend
from
sglang.lang.chat_template
import
get_chat_template
...
...
python/sglang/lang/chat_template.py
View file @
150d7020
from
dataclasses
import
dataclass
from
dataclasses
import
dataclass
,
field
from
enum
import
Enum
,
auto
from
typing
import
Callable
,
Dict
,
List
,
Tuple
from
typing
import
Callable
,
Dict
,
List
,
Optional
,
Tuple
class
ChatTemplateStyle
(
Enum
):
...
...
python/sglang/lang/compiler.py
View file @
150d7020
...
...
@@ -5,7 +5,13 @@ from typing import List, Union
from
sglang.global_config
import
global_config
from
sglang.lang.interpreter
import
ProgramState
,
StreamExecutor
,
pin_program
from
sglang.lang.ir
import
SglArgument
,
SglExpr
,
SglSamplingParams
,
SglVariable
from
sglang.lang.ir
import
(
SglArgument
,
SglConstantText
,
SglExpr
,
SglSamplingParams
,
SglVariable
,
)
def
compile_func
(
function
,
backend
):
...
...
python/sglang/lang/interpreter.py
View file @
150d7020
...
...
@@ -7,7 +7,7 @@ import threading
import
uuid
from
concurrent.futures
import
ThreadPoolExecutor
from
contextlib
import
contextmanager
from
typing
import
Any
,
Callable
,
Dict
,
List
,
Optional
from
typing
import
Any
,
Callable
,
Dict
,
List
,
Optional
,
Union
import
tqdm
...
...
@@ -18,6 +18,7 @@ from sglang.lang.ir import (
SglConstantText
,
SglExpr
,
SglExprList
,
SglFunction
,
SglGen
,
SglImage
,
SglRoleBegin
,
...
...
python/sglang/lang/ir.py
View file @
150d7020
...
...
@@ -472,4 +472,4 @@ class SglCommitLazy(SglExpr):
super
().
__init__
()
def
__repr__
(
self
):
return
"CommitLazy()"
return
f
"CommitLazy()"
python/sglang/lang/tracer.py
View file @
150d7020
"""Tracing a program."""
import
uuid
from
typing
import
Any
,
Dict
,
List
,
Optional
from
typing
import
Any
,
Callable
,
Dict
,
List
,
Optional
,
Union
from
sglang.backend.base_backend
import
BaseBackend
from
sglang.global_config
import
global_config
from
sglang.lang.interpreter
import
ProgramState
,
ProgramStateGroup
from
sglang.lang.ir
import
(
SglArgument
,
SglCommitLazy
,
SglConcateAndAppend
,
SglConstantText
,
SglExpr
,
SglExprList
,
SglFork
,
SglFunction
,
SglGen
,
SglGetForkItem
,
SglRoleBegin
,
...
...
python/sglang/srt/hf_transformers_utils.py
View file @
150d7020
...
...
@@ -3,7 +3,7 @@
import
json
import
os
import
warnings
from
typing
import
Optional
,
Union
from
typing
import
List
,
Optional
,
Tuple
,
Union
from
huggingface_hub
import
snapshot_download
from
transformers
import
(
...
...
python/sglang/srt/managers/detokenizer_manager.py
View file @
150d7020
...
...
@@ -84,7 +84,7 @@ def start_detokenizer_process(
):
try
:
manager
=
DetokenizerManager
(
server_args
,
port_args
)
except
Exception
:
except
Exception
as
e
:
pipe_writer
.
send
(
get_exception_traceback
())
raise
pipe_writer
.
send
(
"init ok"
)
...
...
python/sglang/srt/managers/router/radix_cache.py
View file @
150d7020
import
heapq
import
time
from
collections
import
defaultdict
from
dataclasses
import
dataclass
from
typing
import
Tuple
import
torch
...
...
python/sglang/srt/models/commandr.py
View file @
150d7020
...
...
@@ -20,7 +20,7 @@
# This file is based on the LLama model definition file in transformers
"""PyTorch Cohere model."""
from
typing
import
Optional
,
Tuple
from
typing
import
List
,
Optional
,
Tuple
import
torch
import
torch.utils.checkpoint
...
...
python/sglang/srt/models/llama2.py
View file @
150d7020
# Adapted from
# https://github.com/vllm-project/vllm/blob/671af2b1c0b3ed6d856d37c21a561cc429a10701/vllm/model_executor/models/llama.py#L1
"""Inference-only LLaMA model compatible with HuggingFace weights."""
from
typing
import
Any
,
Dict
,
Optional
,
Tuple
from
typing
import
Any
,
Dict
,
List
,
Optional
,
Tuple
import
torch
from
torch
import
nn
...
...
python/sglang/srt/models/llava.py
View file @
150d7020
...
...
@@ -5,7 +5,7 @@ from typing import List, Optional
import
numpy
as
np
import
torch
from
torch
import
nn
from
transformers
import
CLIPVisionModel
,
LlavaConfig
from
transformers
import
CLIPVisionModel
,
LlamaConfig
,
LlavaConfig
from
transformers.models.llava.modeling_llava
import
LlavaMultiModalProjector
from
vllm.model_executor.layers.linear
import
LinearMethodBase
from
vllm.model_executor.weight_utils
import
(
...
...
python/sglang/srt/models/mixtral.py
View file @
150d7020
# Adapted from
# https://github.com/vllm-project/vllm/blob/d0215a58e78572d91dadafe9d832a2db89b09a13/vllm/model_executor/models/mixtral.py#L1
"""Inference-only Mixtral model."""
from
typing
import
Optional
from
typing
import
List
,
Optional
,
Tuple
import
numpy
as
np
import
torch
...
...
python/sglang/srt/models/qwen.py
View file @
150d7020
from
typing
import
Any
,
Dict
,
Optional
from
typing
import
Any
,
Dict
,
List
,
Optional
,
Tuple
import
torch
from
torch
import
nn
...
...
python/sglang/srt/models/qwen2.py
View file @
150d7020
# Adapted from llama2.py
# Modify details for the adaptation of Qwen2 model.
"""Inference-only Qwen2 model compatible with HuggingFace weights."""
from
typing
import
Any
,
Dict
,
Optional
,
Tuple
from
typing
import
Any
,
Dict
,
List
,
Optional
,
Tuple
import
torch
from
torch
import
nn
...
...
Prev
1
2
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment