Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
zhaoyu6
sglang
Commits
150d7020
"vscode:/vscode.git/clone" did not exist on "78b7465cad01f97653a1384960e908c1bc9cfe0b"
Unverified
Commit
150d7020
authored
Apr 23, 2024
by
Liangsheng Yin
Committed by
GitHub
Apr 23, 2024
Browse files
Revert removing the unused imports (#385)
parent
9acc6e35
Changes
33
Show whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
44 additions
and
19 deletions
+44
-19
python/sglang/api.py
python/sglang/api.py
+4
-0
python/sglang/backend/anthropic.py
python/sglang/backend/anthropic.py
+4
-0
python/sglang/backend/base_backend.py
python/sglang/backend/base_backend.py
+1
-1
python/sglang/backend/openai.py
python/sglang/backend/openai.py
+1
-1
python/sglang/backend/runtime_endpoint.py
python/sglang/backend/runtime_endpoint.py
+4
-3
python/sglang/backend/vertexai.py
python/sglang/backend/vertexai.py
+3
-0
python/sglang/lang/chat_template.py
python/sglang/lang/chat_template.py
+2
-2
python/sglang/lang/compiler.py
python/sglang/lang/compiler.py
+7
-1
python/sglang/lang/interpreter.py
python/sglang/lang/interpreter.py
+2
-1
python/sglang/lang/ir.py
python/sglang/lang/ir.py
+1
-1
python/sglang/lang/tracer.py
python/sglang/lang/tracer.py
+5
-1
python/sglang/srt/hf_transformers_utils.py
python/sglang/srt/hf_transformers_utils.py
+1
-1
python/sglang/srt/managers/detokenizer_manager.py
python/sglang/srt/managers/detokenizer_manager.py
+1
-1
python/sglang/srt/managers/router/radix_cache.py
python/sglang/srt/managers/router/radix_cache.py
+2
-0
python/sglang/srt/models/commandr.py
python/sglang/srt/models/commandr.py
+1
-1
python/sglang/srt/models/llama2.py
python/sglang/srt/models/llama2.py
+1
-1
python/sglang/srt/models/llava.py
python/sglang/srt/models/llava.py
+1
-1
python/sglang/srt/models/mixtral.py
python/sglang/srt/models/mixtral.py
+1
-1
python/sglang/srt/models/qwen.py
python/sglang/srt/models/qwen.py
+1
-1
python/sglang/srt/models/qwen2.py
python/sglang/srt/models/qwen2.py
+1
-1
No files found.
python/sglang/api.py
View file @
150d7020
...
...
@@ -3,7 +3,11 @@
import
re
from
typing
import
Callable
,
List
,
Optional
,
Union
from
sglang.backend.anthropic
import
Anthropic
from
sglang.backend.base_backend
import
BaseBackend
from
sglang.backend.openai
import
OpenAI
from
sglang.backend.runtime_endpoint
import
RuntimeEndpoint
from
sglang.backend.vertexai
import
VertexAI
from
sglang.global_config
import
global_config
from
sglang.lang.ir
import
(
SglExpr
,
...
...
python/sglang/backend/anthropic.py
View file @
150d7020
from
typing
import
List
,
Optional
,
Union
import
numpy
as
np
from
sglang.backend.base_backend
import
BaseBackend
from
sglang.lang.chat_template
import
get_chat_template
from
sglang.lang.interpreter
import
StreamExecutor
...
...
python/sglang/backend/base_backend.py
View file @
150d7020
from
typing
import
List
,
Optional
,
Union
from
typing
import
Callable
,
List
,
Optional
,
Union
from
sglang.lang.chat_template
import
get_chat_template
from
sglang.lang.interpreter
import
StreamExecutor
...
...
python/sglang/backend/openai.py
View file @
150d7020
import
logging
import
time
from
typing
import
List
,
Optional
from
typing
import
Callable
,
List
,
Optional
,
Union
import
numpy
as
np
...
...
python/sglang/backend/runtime_endpoint.py
View file @
150d7020
import
json
from
typing
import
List
,
Optional
from
typing
import
Callable
,
List
,
Optional
,
Union
import
numpy
as
np
import
requests
from
sglang.backend.base_backend
import
BaseBackend
from
sglang.global_config
import
global_config
from
sglang.lang.chat_template
import
get_chat_template_by_model_path
from
sglang.lang.interpreter
import
StreamExecutor
from
sglang.lang.ir
import
SglSamplingParams
from
sglang.utils
import
find_printable_text
,
http_request
from
sglang.lang.ir
import
SglArgument
,
SglSamplingParams
from
sglang.utils
import
encode_image_base64
,
find_printable_text
,
http_request
class
RuntimeEndpoint
(
BaseBackend
):
...
...
python/sglang/backend/vertexai.py
View file @
150d7020
import
os
import
warnings
from
typing
import
List
,
Optional
,
Union
import
numpy
as
np
from
sglang.backend.base_backend
import
BaseBackend
from
sglang.lang.chat_template
import
get_chat_template
...
...
python/sglang/lang/chat_template.py
View file @
150d7020
from
dataclasses
import
dataclass
from
dataclasses
import
dataclass
,
field
from
enum
import
Enum
,
auto
from
typing
import
Callable
,
Dict
,
List
,
Tuple
from
typing
import
Callable
,
Dict
,
List
,
Optional
,
Tuple
class
ChatTemplateStyle
(
Enum
):
...
...
python/sglang/lang/compiler.py
View file @
150d7020
...
...
@@ -5,7 +5,13 @@ from typing import List, Union
from
sglang.global_config
import
global_config
from
sglang.lang.interpreter
import
ProgramState
,
StreamExecutor
,
pin_program
from
sglang.lang.ir
import
SglArgument
,
SglExpr
,
SglSamplingParams
,
SglVariable
from
sglang.lang.ir
import
(
SglArgument
,
SglConstantText
,
SglExpr
,
SglSamplingParams
,
SglVariable
,
)
def
compile_func
(
function
,
backend
):
...
...
python/sglang/lang/interpreter.py
View file @
150d7020
...
...
@@ -7,7 +7,7 @@ import threading
import
uuid
from
concurrent.futures
import
ThreadPoolExecutor
from
contextlib
import
contextmanager
from
typing
import
Any
,
Callable
,
Dict
,
List
,
Optional
from
typing
import
Any
,
Callable
,
Dict
,
List
,
Optional
,
Union
import
tqdm
...
...
@@ -18,6 +18,7 @@ from sglang.lang.ir import (
SglConstantText
,
SglExpr
,
SglExprList
,
SglFunction
,
SglGen
,
SglImage
,
SglRoleBegin
,
...
...
python/sglang/lang/ir.py
View file @
150d7020
...
...
@@ -472,4 +472,4 @@ class SglCommitLazy(SglExpr):
super
().
__init__
()
def
__repr__
(
self
):
return
"CommitLazy()"
return
f
"CommitLazy()"
python/sglang/lang/tracer.py
View file @
150d7020
"""Tracing a program."""
import
uuid
from
typing
import
Any
,
Dict
,
List
,
Optional
from
typing
import
Any
,
Callable
,
Dict
,
List
,
Optional
,
Union
from
sglang.backend.base_backend
import
BaseBackend
from
sglang.global_config
import
global_config
from
sglang.lang.interpreter
import
ProgramState
,
ProgramStateGroup
from
sglang.lang.ir
import
(
SglArgument
,
SglCommitLazy
,
SglConcateAndAppend
,
SglConstantText
,
SglExpr
,
SglExprList
,
SglFork
,
SglFunction
,
SglGen
,
SglGetForkItem
,
SglRoleBegin
,
...
...
python/sglang/srt/hf_transformers_utils.py
View file @
150d7020
...
...
@@ -3,7 +3,7 @@
import
json
import
os
import
warnings
from
typing
import
Optional
,
Union
from
typing
import
List
,
Optional
,
Tuple
,
Union
from
huggingface_hub
import
snapshot_download
from
transformers
import
(
...
...
python/sglang/srt/managers/detokenizer_manager.py
View file @
150d7020
...
...
@@ -84,7 +84,7 @@ def start_detokenizer_process(
):
try
:
manager
=
DetokenizerManager
(
server_args
,
port_args
)
except
Exception
:
except
Exception
as
e
:
pipe_writer
.
send
(
get_exception_traceback
())
raise
pipe_writer
.
send
(
"init ok"
)
...
...
python/sglang/srt/managers/router/radix_cache.py
View file @
150d7020
import
heapq
import
time
from
collections
import
defaultdict
from
dataclasses
import
dataclass
from
typing
import
Tuple
import
torch
...
...
python/sglang/srt/models/commandr.py
View file @
150d7020
...
...
@@ -20,7 +20,7 @@
# This file is based on the LLama model definition file in transformers
"""PyTorch Cohere model."""
from
typing
import
Optional
,
Tuple
from
typing
import
List
,
Optional
,
Tuple
import
torch
import
torch.utils.checkpoint
...
...
python/sglang/srt/models/llama2.py
View file @
150d7020
# Adapted from
# https://github.com/vllm-project/vllm/blob/671af2b1c0b3ed6d856d37c21a561cc429a10701/vllm/model_executor/models/llama.py#L1
"""Inference-only LLaMA model compatible with HuggingFace weights."""
from
typing
import
Any
,
Dict
,
Optional
,
Tuple
from
typing
import
Any
,
Dict
,
List
,
Optional
,
Tuple
import
torch
from
torch
import
nn
...
...
python/sglang/srt/models/llava.py
View file @
150d7020
...
...
@@ -5,7 +5,7 @@ from typing import List, Optional
import
numpy
as
np
import
torch
from
torch
import
nn
from
transformers
import
CLIPVisionModel
,
LlavaConfig
from
transformers
import
CLIPVisionModel
,
LlamaConfig
,
LlavaConfig
from
transformers.models.llava.modeling_llava
import
LlavaMultiModalProjector
from
vllm.model_executor.layers.linear
import
LinearMethodBase
from
vllm.model_executor.weight_utils
import
(
...
...
python/sglang/srt/models/mixtral.py
View file @
150d7020
# Adapted from
# https://github.com/vllm-project/vllm/blob/d0215a58e78572d91dadafe9d832a2db89b09a13/vllm/model_executor/models/mixtral.py#L1
"""Inference-only Mixtral model."""
from
typing
import
Optional
from
typing
import
List
,
Optional
,
Tuple
import
numpy
as
np
import
torch
...
...
python/sglang/srt/models/qwen.py
View file @
150d7020
from
typing
import
Any
,
Dict
,
Optional
from
typing
import
Any
,
Dict
,
List
,
Optional
,
Tuple
import
torch
from
torch
import
nn
...
...
python/sglang/srt/models/qwen2.py
View file @
150d7020
# Adapted from llama2.py
# Modify details for the adaptation of Qwen2 model.
"""Inference-only Qwen2 model compatible with HuggingFace weights."""
from
typing
import
Any
,
Dict
,
Optional
,
Tuple
from
typing
import
Any
,
Dict
,
List
,
Optional
,
Tuple
import
torch
from
torch
import
nn
...
...
Prev
1
2
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment