Commit abd9c245 authored by Jing Zhang
Browse files

fixed sweep logic

parent a5aa963c
...@@ -166,7 +166,7 @@ struct ThreadwiseTensorSliceTransfer_v1r3 ...@@ -166,7 +166,7 @@ struct ThreadwiseTensorSliceTransfer_v1r3
index_t tmp = ordered_access_idx[I0]; index_t tmp = ordered_access_idx[I0];
static_for<1, i, 1>{}([&](auto j) { static_for<1, i, 1>{}([&](auto j) {
tmp = tmp * ordered_access_lengths[j - 1] + ordered_access_idx[j]; tmp = tmp * ordered_access_lengths[j] + ordered_access_idx[j];
}); });
forward_sweep_(i) = tmp % 2 == 0; forward_sweep_(i) = tmp % 2 == 0;
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment