Commit 904b87ba authored by zhuwenwen
Browse files

Add VLLM_USE_LIGHTOP_FILL_MOE_ALIN: default it to '1' when it is not already set

parent cff5c2d2
...@@ -266,6 +266,8 @@ def get_model_architecture( ...@@ -266,6 +266,8 @@ def get_model_architecture(
os.environ['VLLM_USE_LIGHTOP_MOE_SUM_MUL_ADD'] = '1' os.environ['VLLM_USE_LIGHTOP_MOE_SUM_MUL_ADD'] = '1'
if not envs.is_set("VLLM_USE_OPT_CAT"): if not envs.is_set("VLLM_USE_OPT_CAT"):
os.environ['VLLM_USE_OPT_CAT'] = '1' os.environ['VLLM_USE_OPT_CAT'] = '1'
if not envs.is_set("VLLM_USE_LIGHTOP_FILL_MOE_ALIN"):
os.environ['VLLM_USE_LIGHTOP_FILL_MOE_ALIN'] = '1'
# awq相关配置 # awq相关配置
try: try:
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment