Commit 414f3ac9 authored by Jing Zhang
Browse files

merge develop

parents a60cd1d9 9d58c421
...@@ -74,6 +74,7 @@ struct AddScale ...@@ -74,6 +74,7 @@ struct AddScale
a = scale * (a0 + a1); a = scale * (a0 + a1);
} }
// this attribute will force copy_function applying element_wise with vector_type
static constexpr ck::index_t vec_len = 4; static constexpr ck::index_t vec_len = 4;
float scale = 1.0; float scale = 1.0;
......
...@@ -427,6 +427,7 @@ struct GridwiseGemmMultipleABD_xdl_cshuffle ...@@ -427,6 +427,7 @@ struct GridwiseGemmMultipleABD_xdl_cshuffle
return generate_tuple( return generate_tuple(
[&](auto i) { [&](auto i) {
using ALayout = remove_cvref_t<tuple_element_t<i.value, AsLayout>>; using ALayout = remove_cvref_t<tuple_element_t<i.value, AsLayout>>;
return MakeAGridDescriptor_M_K<ALayout, GemmSpec>(MRaws[i], KRaws[i], AsStride[i]); return MakeAGridDescriptor_M_K<ALayout, GemmSpec>(MRaws[i], KRaws[i], AsStride[i]);
}, },
Number<NumATensor>{}); Number<NumATensor>{});
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment