Commit fbcf4300 (unverified), authored by fzyzcjy, committed by GitHub
Browse files

Update internode_ll.cu (#246)

parent c95997f8
......@@ -498,7 +498,7 @@ combine(void* combined_x,
}
cg::this_grid().sync();
-// Reduce tokens with FP8 cast
+// Reduce tokens
EP_DEVICE_ASSERT(num_topk <= 32 and hidden_bf16_int4 <= num_threads);
EP_STATIC_ASSERT(kHidden % (32 * kNumElemsPerInt4) == 0, "Invalid vectorization");
if (thread_id < hidden_bf16_int4) {
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment