"git@developer.sourcefind.cn:gaoqiong/composable_kernel.git" did not exist on "d3929cb051573dba83f549c1ecd4a8f9e47894d5"
Commit b0b67669 authored by Jing Zhang
Browse files

fixed host tensor size

parent 66873f3a
...@@ -105,7 +105,7 @@ bool profile_gemm_universal_impl(int do_verification, ...@@ -105,7 +105,7 @@ bool profile_gemm_universal_impl(int do_verification,
const auto c_element_op = CElementOp{}; const auto c_element_op = CElementOp{};
DeviceMem a_device_buf(sizeof(ADataType) * a_m_k.mDesc.GetElementSpaceSize()); DeviceMem a_device_buf(sizeof(ADataType) * a_m_k.mDesc.GetElementSpaceSize());
DeviceMem b_device_buf(sizeof(BDataType) * b_k_n_permute.mDesc.GetElementSpaceSize()); DeviceMem b_device_buf(sizeof(BDataType) * b_k_n_permute.mDesc.GetElementSpaceSize() / (is_same_v<BDataType, ck::pk_i4_t> ? 2 : 1));
DeviceMem c_device_buf(sizeof(CDataType) * c_m_n_device_result.mDesc.GetElementSpaceSize()); DeviceMem c_device_buf(sizeof(CDataType) * c_m_n_device_result.mDesc.GetElementSpaceSize());
a_device_buf.ToDevice(a_m_k.mData.data()); a_device_buf.ToDevice(a_m_k.mData.data());
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment