"INSTALL/git@developer.sourcefind.cn:dadigang/Ventoy.git" did not exist on "ebaa4d954aa0b3d70f14b2fd6fec63df1599b8ce"
Unverified commit 77b9d08e, authored by Lei Wang, committed by GitHub
Browse files

[Bugfix] Use `access_ptr("r")` instead of `access_ptr("w")` for correct pipeline analysis (#983)

* remove debug print

* pipeline fix

* use the correct buffer access scope
parent 117f2b81
......@@ -245,9 +245,9 @@ class TensorCoreIntrinEmitter(MMAIntrinEmitter):
# TODO(lei): inject warpgroup_fence_operand for C_local_buf
desc_a = T.alloc_descriptor()
desc_b = T.alloc_descriptor()
T.initialize_descriptor(desc_a, A_buf.access_ptr("w"), a_swizzle_mode,
T.initialize_descriptor(desc_a, A_buf.access_ptr("r"), a_swizzle_mode,
int(a_leading_byte_offset >> 4), int(a_stride_byte_offset >> 4))
T.initialize_descriptor(desc_b, B_buf.access_ptr("w"), b_swizzle_mode,
T.initialize_descriptor(desc_b, B_buf.access_ptr("r"), b_swizzle_mode,
int(b_leading_byte_offset >> 4), int(b_stride_byte_offset >> 4))
T.warpgroup_arrive()
for ki in T.serial(0, (k_dim // micro_size_k)):
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment