Commit 780ed50e authored by 王敏
Browse files

[fix]解决编译错误

parent c2ed66f0
......@@ -307,7 +307,7 @@ __global__ void ep_moe_align_block_size_kernel(scalar_t* __restrict__ topk_ids,
* assigned to expert expert_index.
*/
for (int i = start_idx; i < numel && i < start_idx + tokens_per_thread; ++i) {
- expert_id = topk_ids[i];
+ int32_t expert_id = topk_ids[i];
if (expert_id >= start_expert && expert_id < end_expert) {
++tokens_cnts[index(num_experts, threadIdx.x + 1, expert_id - start_expert)];
}
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment