Commit 4d7b32c5 authored by rusty1s
Browse files

assertions

parent 9b68396b
......@@ -151,8 +151,9 @@ __global__ void segment_add_coo_kernel(const scalar_t *src_data,
#pragma unroll
for (int offset = 1; offset < TB; offset *= 2) {
tmp = __shfl_up_sync(FULL_MASK, val, offset);
if (lane_idx >= offset &&
idx == __ldg(index_data + thread_idx - offset)) {
int idx_next = __ldg(index_data + thread_idx - offset);
// AT_ASSERTM(lane_idx < offset || idx <= idx_next);
if (lane_idx >= offset && idx == idx_next) {
val += tmp;
}
}
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment