threadwise_4d_tensor_op.hip.hpp 11.1 KB