"llama/git@developer.sourcefind.cn:OpenDAS/ollama.git" did not exist on "220e133fca8fe128dbf8fecef96c8484f991e39c"
Commit 0285bf05 authored by rtmadduri's avatar rtmadduri
Browse files

building locally

parent f0d626c3
...@@ -430,17 +430,12 @@ struct DeviceGroupedGemmXdlSplitKCShuffle : public DeviceGroupedGemmSplitK<ALayo ...@@ -430,17 +430,12 @@ struct DeviceGroupedGemmXdlSplitKCShuffle : public DeviceGroupedGemmSplitK<ALayo
} }
} }
ave_time = ave_time = launch_and_time_kernel(stream_config,
launch_and_time_kernel(stream_config, kernel,
kernel, dim3(arg.grid_size_),
dim3(arg.grid_size_), dim3(BlockSize),
dim3(BlockSize), 0,
0, arg.gemm_kernel_args_[0].karg_);
cast_pointer_to_constant_address_space(arg.p_workspace_),
arg.gemm_kernel_args_.size(),
PassThrough{},
PassThrough{},
PassThrough{});
}; };
constexpr index_t minimum_occupancy = constexpr index_t minimum_occupancy =
......
...@@ -203,7 +203,6 @@ struct DeviceGroupedGemmSplitkInstanceWrapper ...@@ -203,7 +203,6 @@ struct DeviceGroupedGemmSplitkInstanceWrapper
PassThrough, PassThrough,
PassThrough, PassThrough,
GemmSpec, GemmSpec,
1,
128, 128,
128, 128,
128, 128,
...@@ -230,7 +229,7 @@ struct DeviceGroupedGemmSplitkInstanceWrapper ...@@ -230,7 +229,7 @@ struct DeviceGroupedGemmSplitkInstanceWrapper
BBlockLdsAddExtraM::value, BBlockLdsAddExtraM::value,
1, 1,
1, 1,
S<16, 1, 8>, S<1, 16, 1, 8>,
CDEBlockTransferScalarPerVector_NPerBlock>; CDEBlockTransferScalarPerVector_NPerBlock>;
bool IsSupported(const std::vector<int>& Ms, bool IsSupported(const std::vector<int>& Ms,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment