"vscode:/vscode.git/clone" did not exist on "86ceded98b2c1f2be48edb61bedbcc38d2c5c290"
Commit d6dff178 authored by rocking's avatar rocking
Browse files

Sync verification flow with GPU kernel

parent ea6b9481
...@@ -100,7 +100,9 @@ static void host_verify(const Tensor<AType>& a_m_k, ...@@ -100,7 +100,9 @@ static void host_verify(const Tensor<AType>& a_m_k,
static_cast<AccDataType>(b_element_op(b_k_n(k, n))); static_cast<AccDataType>(b_element_op(b_k_n(k, n)));
} }
c_element_op(c_m_n(m, n), v, c0_k_n(m, n)); CType y = static_cast<CType>(v);
c_element_op(c_m_n(m, n), y, c0_k_n(m, n));
}; };
make_ParallelTensorFunctor(f_mk_kn_mn, make_ParallelTensorFunctor(f_mk_kn_mn,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment