Commit 1db5839e authored by zhuwenwen
Browse files

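Update moe_align_block_size interface: pass the additional `Is_fuse_fill = False` keyword argument (after `num_local_tokens = None`) in the two calls changed by this commit.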

parent ba7bcccd
...@@ -101,7 +101,8 @@ def moe_align_block_size( ...@@ -101,7 +101,8 @@ def moe_align_block_size(
expert_ids, num_tokens_post_pad, expert_ids, num_tokens_post_pad,
expert_map = expert_map, expert_map = expert_map,
expert_mask = expert_mask, expert_mask = expert_mask,
num_local_tokens = None) num_local_tokens = None,
Is_fuse_fill = False)
else: else:
if envs.VLLM_USE_LIGHTOP_MOE_ALIGN: if envs.VLLM_USE_LIGHTOP_MOE_ALIGN:
from lightop import op as op from lightop import op as op
...@@ -109,7 +110,8 @@ def moe_align_block_size( ...@@ -109,7 +110,8 @@ def moe_align_block_size(
expert_ids, num_tokens_post_pad, expert_ids, num_tokens_post_pad,
expert_map = None, expert_map = None,
expert_mask = None, expert_mask = None,
num_local_tokens = None) num_local_tokens = None,
Is_fuse_fill = False)
else: else:
ops.moe_align_block_size(topk_ids, num_experts, block_size, sorted_ids, ops.moe_align_block_size(topk_ids, num_experts, block_size, sorted_ids,
expert_ids, num_tokens_post_pad) expert_ids, num_tokens_post_pad)
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment