#ifndef CK_THREADWISE_GENERIC_TENSOR_OP_HPP
#define CK_THREADWISE_GENERIC_TENSOR_OP_HPP

#include "ConstantTensorDescriptor.hpp"
#include "ConstantMergedTensorDescriptor.hpp"

namespace ck {

// Writes a zero of type Float to every element of `p` addressed by the
// tensor descriptor type TDesc.
//
// Template parameters:
//   Float - element type of the buffer; the stored value is static_cast<Float>(0).
//   TDesc - descriptor type; must provide a static GetOffsetFromMultiIndex()
//           that is usable in a constant expression (the offset below is
//           declared constexpr).
//
// Parameters:
//   (unnamed TDesc) - tag argument; only its type is used, which lets callers
//                     pass a descriptor object and have TDesc deduced.
//   p               - destination buffer, indexed by the offsets the
//                     descriptor produces. Declared __restrict__, so it must
//                     not be aliased by another pointer used in this scope.
//
// NOTE(review): the template parameter list was missing from the text this
// was restored from. The order <Float, TDesc> is a reconstruction; confirm it
// against any call site that spells the template arguments explicitly.
template <class Float, class TDesc>
__device__ void threadwise_generic_tensor_set_zero(TDesc, Float* __restrict__ p)
{
    // NOTE(review): static_ford's template argument was also missing; it is
    // restored here as the type returned by TDesc::GetLengths(), presumably
    // the per-dimension lengths static_ford iterates over. Confirm against the
    // static_ford declaration.
    static_ford<decltype(TDesc::GetLengths())>{}([&](auto multi_id) {
        // Offset is computed at compile time from the multi-index passed in
        // by static_ford.
        constexpr index_t offset = TDesc::GetOffsetFromMultiIndex(multi_id);

        p[offset] = static_cast<Float>(0);
    });
}

} // namespace ck

#endif // CK_THREADWISE_GENERIC_TENSOR_OP_HPP