Unverified commit 4ea92f83, authored by Lianmin Zheng and committed by GitHub
Browse files

Format code (#118)

parent 6b0af285
......@@ -324,7 +324,7 @@ python -m sglang.launch_server --model-path meta-llama/Llama-2-7b-chat-hf --port
- Mixtral
- LLaVA
- `python3 -m sglang.launch_server --model-path liuhaotian/llava-v1.5-7b --tokenizer-path llava-hf/llava-1.5-7b-hf --port 30000`
- Qwen
- Qwen / Qwen 2
- AWQ quantization
## Benchmark And Performance
......
......@@ -319,4 +319,5 @@ class LlamaForCausalLM(nn.Module):
weight_loader = getattr(param, "weight_loader", default_weight_loader)
weight_loader(param, loaded_weight)
EntryClass = LlamaForCausalLM
......@@ -331,4 +331,5 @@ def monkey_path_clip_vision_embed_forward():
clip_vision_embed_forward,
)
EntryClass = LlavaLlamaForCausalLM
......@@ -377,4 +377,5 @@ class MixtralForCausalLM(nn.Module):
weight_loader = getattr(param, "weight_loader", default_weight_loader)
weight_loader(param, loaded_weight)
EntryClass = MixtralForCausalLM
......@@ -259,4 +259,5 @@ class QWenLMHeadModel(nn.Module):
weight_loader = getattr(param, "weight_loader", default_weight_loader)
weight_loader(param, loaded_weight)
EntryClass = QWenLMHeadModel
......@@ -315,4 +315,5 @@ class Qwen2ForCausalLM(nn.Module):
weight_loader = getattr(param, "weight_loader", default_weight_loader)
weight_loader(param, loaded_weight)
EntryClass = Qwen2ForCausalLM
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment