Commit 77fccdf4 authored by zhuwenwen
Browse files

Rename the `is_fuse_fill` keyword argument to `Is_fuse_fill` in the lightop `moe_align_block_size` calls

parent 5785324e
...@@ -241,7 +241,7 @@ def moe_align_block_size( ...@@ -241,7 +241,7 @@ def moe_align_block_size(
expert_map = expert_map, expert_map = expert_map,
expert_mask = expert_mask, expert_mask = expert_mask,
num_local_tokens = None, num_local_tokens = None,
is_fuse_fill = False if not envs.VLLM_USE_LIGHTOP_FILL_MOE_ALIGN else True) Is_fuse_fill = False if not envs.VLLM_USE_LIGHTOP_FILL_MOE_ALIGN else True)
else: else:
if envs.VLLM_USE_LIGHTOP_MOE_ALIGN: if envs.VLLM_USE_LIGHTOP_MOE_ALIGN:
from lightop import op as op from lightop import op as op
...@@ -250,7 +250,7 @@ def moe_align_block_size( ...@@ -250,7 +250,7 @@ def moe_align_block_size(
expert_map = None, expert_map = None,
expert_mask = None, expert_mask = None,
num_local_tokens = None, num_local_tokens = None,
is_fuse_fill = False if not envs.VLLM_USE_LIGHTOP_FILL_MOE_ALIGN else True) Is_fuse_fill = False if not envs.VLLM_USE_LIGHTOP_FILL_MOE_ALIGN else True)
else: else:
ops.moe_align_block_size(topk_ids, num_experts, block_size, sorted_ids, ops.moe_align_block_size(topk_ids, num_experts, block_size, sorted_ids,
expert_ids, num_tokens_post_pad) expert_ids, num_tokens_post_pad)
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment