"vscode:/vscode.git/clone" did not exist on "d50fbf59d7b74402857ef88fe25f7811801e125d"
Commit 2593dd60 authored by turneram's avatar turneram
Browse files

Formatting

parent d1e27426
...@@ -53,18 +53,18 @@ namespace gpu { ...@@ -53,18 +53,18 @@ namespace gpu {
// extern "C" { // extern "C" {
// __global__ void ck_gemm_kernel(void* a_p, void* b_p, void* c_p) // __global__ void ck_gemm_kernel(void* a_p, void* b_p, void* c_p)
// { // {
// // hipDeviceProp_t hdp{}; // // hipDeviceProp_t hdp{};
// // printf("Shared mem: %i\n", int(hdp.sharedMemPerBlock)); // // printf("Shared mem: %i\n", int(hdp.sharedMemPerBlock));
// // make_tensors()(a_p, b_p, c_p)([](auto&&... xs) { // // make_tensors()(a_p, b_p, c_p)([](auto&&... xs) {
// // ck_gemm(xs...); // // ck_gemm(xs...);
// // }); // // });
// make_tensors()(a_p, b_p, c_p)([](auto a_t, auto b_t, auto c_t) { // make_tensors()(a_p, b_p, c_p)([](auto a_t, auto b_t, auto c_t) {
// __shared__ float p_shared_block[512]; //[(a_t.get_shape().elements() + b_t.get_shape().elements()) * 2]; // __shared__ float p_shared_block[512]; //[(a_t.get_shape().elements() +
// ck_gemm(a_t, b_t, c_t, p_shared_block); // b_t.get_shape().elements()) * 2]; ck_gemm(a_t, b_t, c_t, p_shared_block);
// // make_tensors()(p_shared_block)([&](auto p_t) { // // make_tensors()(p_shared_block)([&](auto p_t) {
// // ck_gemm(a_t, b_t, c_t, p_t); // // ck_gemm(a_t, b_t, c_t, p_t);
// // }); // // });
// }); // });
// } // }
......
...@@ -283,7 +283,7 @@ __device__ void ck_gemm(const T& a_t, const U& b_t, const V& c_t, float* p_t) ...@@ -283,7 +283,7 @@ __device__ void ck_gemm(const T& a_t, const U& b_t, const V& c_t, float* p_t)
constexpr bool HasMainKBlockLoop = true; constexpr bool HasMainKBlockLoop = true;
constexpr bool HasDoubleTailKBlockLoop = true; constexpr bool HasDoubleTailKBlockLoop = true;
auto num_bytes = GridwiseGemm::GetSharedMemoryNumberOfByte(); auto num_bytes = GridwiseGemm::GetSharedMemoryNumberOfByte();
printf("Bytes: %i\n", int(num_bytes)); printf("Bytes: %i\n", int(num_bytes));
GridwiseGemm::Run(a_t.data(), GridwiseGemm::Run(a_t.data(),
b_t.data(), b_t.data(),
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment