"vscode:/vscode.git/clone" did not exist on "9bc4ce27e6d9f0a5e9b5e9eb59f7e5224f13b8e5"
Commit dea0555f authored by turneram
Browse files

Make shared_block char

parent b10116e5
......@@ -58,8 +58,8 @@ __global__ void ck_gemm_kernel(void* a_p, void* b_p, void* c_p)
{
make_tensors()(a_p, b_p, c_p)([](auto a_t, auto b_t, auto c_t) {
constexpr ck::index_t shared_block_size =
-hGridwiseGemm::GetSharedMemoryNumberOfByte() /* / sizeof(float) */;
-__shared__ void* p_shared_block[shared_block_size];
+hGridwiseGemm::GetSharedMemoryNumberOfByte();
+__shared__ char p_shared_block[shared_block_size];
make_tensors()(p_shared_block)([&](auto p_t) {
ck_gemm(a_t, b_t, c_t, p_t);
});
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment