Commit 58c47942 authored by Shangyan Zhou
Browse files

Minor fix.

parent 7ce8da4e
......@@ -560,7 +560,6 @@ dispatch(int4* recv_x, float* recv_x_scales, int64_t* recv_topk_idx, float* recv
if (is_token_in_rank_uint64 != 0) {
// Acquire lock first
acquire_lock(rdma_send_channel_lock + lane_id);
auto window = rdma_send_channel_window[lane_id];
auto latest_tail = rdma_send_channel_tail[lane_id];
auto offset = rdma_tail_idx - latest_tail;
while (offset >= 32) {
......@@ -572,7 +571,7 @@ dispatch(int4* recv_x, float* recv_x_scales, int64_t* recv_topk_idx, float* recv
// Release the transaction slot
// Add the bit and move the ones if possible
window |= 1u << offset;
auto window = rdma_send_channel_window[lane_id] | (1u << offset);
if (offset == 0) {
auto num_empty_slots = (~window) == 0 ? 32 : __ffs(~window) - 1;
st_release_cta(rdma_send_channel_tail + lane_id, latest_tail + num_empty_slots);
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment