Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
MIGraphX
Commits
7108c3a8
Commit
7108c3a8
authored
Oct 29, 2022
by
Paul
Browse files
Update instances
parent
dd004bc4
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
8 additions
and
2628 deletions
+8
-2628
src/targets/gpu/jit/ck_gemm_instances.cpp
src/targets/gpu/jit/ck_gemm_instances.cpp
+8
-2628
No files found.
src/targets/gpu/jit/ck_gemm_instances.cpp
View file @
7108c3a8
...
...
@@ -5,2634 +5,14 @@
#include <string>
#include <functional>
const
std
::
vector
<
std
::
string
>&
get_instance
(
std
::
size_t
i
,
const
std
::
function
<
bool
(
const
std
::
vector
<
std
::
string
>&
)
>&
pred
)
const
std
::
vector
<
std
::
string
>&
get_instance
(
std
::
size_t
i
,
const
std
::
function
<
bool
(
const
std
::
vector
<
std
::
string
>&
)
>&
pred
)
{
static
std
::
vector
<
std
::
vector
<
std
::
vector
<
std
::
string
>>>
instances
=
{
{{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"256"
,
"128"
,
"32"
,
"8"
,
"2"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<8,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"256"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"256"
,
"32"
,
"8"
,
"2"
,
"32"
,
"32"
,
"2"
,
"4"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"256"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"4"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"128"
,
"32"
,
"8"
,
"2"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"128"
,
"32"
,
"8"
,
"2"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<8,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"64"
,
"32"
,
"8"
,
"2"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<8,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,4>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,4>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"64"
,
"128"
,
"32"
,
"8"
,
"2"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"64"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"64"
,
"32"
,
"8"
,
"2"
,
"32"
,
"32"
,
"2"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<16,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"1"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"64"
,
"128"
,
"32"
,
"8"
,
"2"
,
"32"
,
"32"
,
"1"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<8,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"64"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"1"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
}},
{{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"256"
,
"128"
,
"32"
,
"2"
,
"8"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"256"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"256"
,
"32"
,
"2"
,
"8"
,
"32"
,
"32"
,
"2"
,
"4"
,
"ck::Sequence<8,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"256"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"4"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"128"
,
"32"
,
"2"
,
"8"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"128"
,
"32"
,
"2"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<8,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"64"
,
"32"
,
"2"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,4>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,4>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"64"
,
"128"
,
"32"
,
"2"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<8,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"64"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"64"
,
"32"
,
"2"
,
"8"
,
"32"
,
"32"
,
"2"
,
"1"
,
"ck::Sequence<8,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"64"
,
"128"
,
"32"
,
"2"
,
"8"
,
"32"
,
"32"
,
"1"
,
"2"
,
"ck::Sequence<16,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"64"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"1"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"1"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
}},
{{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"256"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"256"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"4"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,4>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"64"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"64"
,
"64"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,4>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"64"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"1"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"32"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,4>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"32"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"1"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"64"
,
"64"
,
"32"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"1"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,4>"
,
"8"
},
{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"64"
,
"32"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"1"
,
"2"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,4>"
,
"8"
}},
{{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"256"
,
"128"
,
"32"
,
"2"
,
"2"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<8,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"256"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"256"
,
"32"
,
"2"
,
"2"
,
"32"
,
"32"
,
"2"
,
"4"
,
"ck::Sequence<8,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"256"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"4"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"128"
,
"32"
,
"2"
,
"2"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"128"
,
"32"
,
"2"
,
"2"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<8,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<8,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"64"
,
"32"
,
"2"
,
"2"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,4>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,4>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"64"
,
"128"
,
"32"
,
"2"
,
"2"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<8,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"64"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"64"
,
"32"
,
"2"
,
"2"
,
"32"
,
"32"
,
"2"
,
"1"
,
"ck::Sequence<8,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<16,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"1"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"64"
,
"128"
,
"32"
,
"2"
,
"2"
,
"32"
,
"32"
,
"1"
,
"2"
,
"ck::Sequence<16,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<8,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},
{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"64"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"1"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"1"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
}}};
auto
it
=
std
::
find_if
(
instances
.
begin
(),
instances
.
end
(),
[
&
](
const
auto
&
v
)
{
return
pred
(
v
[
0
]);
});
static
std
::
vector
<
std
::
vector
<
std
::
vector
<
std
::
string
>>>
instances
=
{{{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"256"
,
"128"
,
"32"
,
"8"
,
"2"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<8,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"256"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"256"
,
"32"
,
"8"
,
"2"
,
"32"
,
"32"
,
"2"
,
"4"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"256"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"4"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"128"
,
"32"
,
"8"
,
"2"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"128"
,
"32"
,
"8"
,
"2"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<8,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"64"
,
"32"
,
"8"
,
"2"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<8,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,4>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,4>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"64"
,
"128"
,
"32"
,
"8"
,
"2"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"64"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"64"
,
"32"
,
"8"
,
"2"
,
"32"
,
"32"
,
"2"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<16,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"1"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"64"
,
"128"
,
"32"
,
"8"
,
"2"
,
"32"
,
"32"
,
"1"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<8,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"64"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"1"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"64"
,
"64"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,4>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"64"
,
"64"
,
"32"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"1"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,4>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"64"
,
"32"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"1"
,
"2"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,4>"
,
"8"
}},{{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"256"
,
"128"
,
"32"
,
"2"
,
"8"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"256"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"256"
,
"32"
,
"2"
,
"8"
,
"32"
,
"32"
,
"2"
,
"4"
,
"ck::Sequence<8,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"256"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"4"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"128"
,
"32"
,
"2"
,
"8"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"128"
,
"32"
,
"2"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<8,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"64"
,
"32"
,
"2"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,4>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,4>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"64"
,
"128"
,
"32"
,
"2"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<8,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"64"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"64"
,
"32"
,
"2"
,
"8"
,
"32"
,
"32"
,
"2"
,
"1"
,
"ck::Sequence<8,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"64"
,
"128"
,
"32"
,
"2"
,
"8"
,
"32"
,
"32"
,
"1"
,
"2"
,
"ck::Sequence<16,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"64"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"1"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"1"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"64"
,
"64"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,4>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"64"
,
"64"
,
"32"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"1"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,4>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"64"
,
"32"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"1"
,
"2"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,4>"
,
"8"
}},{{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"256"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"256"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"4"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,4>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"64"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"64"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"1"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"32"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,4>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"32"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"1"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"64"
,
"64"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,4>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"64"
,
"64"
,
"32"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"1"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,4>"
,
"8"
},{
"ck::tensor_layout::gemm::RowMajor"
,
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"64"
,
"32"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"1"
,
"2"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<1,0,2>"
,
"ck::Sequence<1,0,2>"
,
"2"
,
"8"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,4>"
,
"8"
}},{{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"256"
,
"128"
,
"32"
,
"2"
,
"2"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<8,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"256"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"256"
,
"32"
,
"2"
,
"2"
,
"32"
,
"32"
,
"2"
,
"4"
,
"ck::Sequence<8,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"256"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"4"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"128"
,
"32"
,
"2"
,
"2"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"4"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"128"
,
"32"
,
"2"
,
"2"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<8,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<8,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"64"
,
"32"
,
"2"
,
"2"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,4>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"128"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,4>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"64"
,
"128"
,
"32"
,
"2"
,
"2"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<8,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"128"
,
"64"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"ck::Sequence<4,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"64"
,
"32"
,
"2"
,
"2"
,
"32"
,
"32"
,
"2"
,
"1"
,
"ck::Sequence<8,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<16,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"128"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"1"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"64"
,
"128"
,
"32"
,
"2"
,
"2"
,
"32"
,
"32"
,
"1"
,
"2"
,
"ck::Sequence<16,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"ck::Sequence<8,32,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"2"
,
"0"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"256"
,
"64"
,
"128"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"1"
,
"2"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"1"
,
"8"
,
"1"
,
"ck::Sequence<4,64,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,32,1,8>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"64"
,
"64"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"2"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,4>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"64"
,
"64"
,
"32"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"2"
,
"1"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,4>"
,
"8"
},{
"ck::tensor_layout::gemm::ColumnMajor"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::Tuple<>"
,
"ck::tensor_layout::gemm::RowMajor"
,
"ck::half_t"
,
"ck::half_t"
,
"float"
,
"float"
,
"ck::Tuple<>"
,
"ck::half_t"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck_passthrough"
,
"ck::tensor_operation::device::GemmSpecialization::Default"
,
"1"
,
"64"
,
"32"
,
"64"
,
"32"
,
"8"
,
"8"
,
"32"
,
"32"
,
"1"
,
"2"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"2"
,
"8"
,
"1"
,
"ck::Sequence<4,16,1>"
,
"ck::Sequence<0,2,1>"
,
"ck::Sequence<0,2,1>"
,
"1"
,
"4"
,
"8"
,
"1"
,
"1"
,
"1"
,
"ck::Sequence<1,16,1,4>"
,
"8"
}}};
auto
it
=
std
::
find_if
(
instances
.
begin
(),
instances
.
end
(),
[
&
](
const
auto
&
v
)
{
return
pred
(
v
[
0
]);
});
return
it
->
at
(
i
);
}
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment