Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel
Commits
a006aa63
Commit
a006aa63
authored
Nov 17, 2021
by
Chao Liu
Browse files
reworking vector_type
parent
0a66c54e
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
89 additions
and
45 deletions
+89
-45
composable_kernel/include/utility/data_type.hpp
composable_kernel/include/utility/data_type.hpp
+45
-45
composable_kernel/include/utility/statically_indexed_array.hpp
...sable_kernel/include/utility/statically_indexed_array.hpp
+44
-0
No files found.
composable_kernel/include/utility/data_type.hpp
View file @
a006aa63
...
...
@@ -137,7 +137,7 @@ struct vector_type<T, 1>
union
{
T
d1_
;
StaticallyIndexedArray
<
T
,
1
>
d1x1_
;
StaticallyIndexedArray
_v2
<
T
,
1
>
d1x1_
;
}
data_
;
__host__
__device__
constexpr
vector_type
()
:
data_
{
type
{
0
}}
{}
...
...
@@ -172,8 +172,8 @@ struct vector_type<T, 2>
union
{
d2_t
d2_
;
StaticallyIndexedArray
<
d1_t
,
2
>
d1x2_
;
StaticallyIndexedArray
<
d2_t
,
1
>
d2x1_
;
StaticallyIndexedArray
_v2
<
d1_t
,
2
>
d1x2_
;
StaticallyIndexedArray
_v2
<
d2_t
,
1
>
d2x1_
;
}
data_
;
__host__
__device__
constexpr
vector_type
()
:
data_
{
type
{
0
}}
{}
...
...
@@ -223,9 +223,9 @@ struct vector_type<T, 4>
union
{
d4_t
d4_
;
StaticallyIndexedArray
<
d1_t
,
4
>
d1x4_
;
StaticallyIndexedArray
<
d2_t
,
2
>
d2x2_
;
StaticallyIndexedArray
<
d4_t
,
1
>
d4x1_
;
StaticallyIndexedArray
_v2
<
d1_t
,
4
>
d1x4_
;
StaticallyIndexedArray
_v2
<
d2_t
,
2
>
d2x2_
;
StaticallyIndexedArray
_v2
<
d4_t
,
1
>
d4x1_
;
}
data_
;
__host__
__device__
constexpr
vector_type
()
:
data_
{
type
{
0
}}
{}
...
...
@@ -286,10 +286,10 @@ struct vector_type<T, 8>
union
{
d8_t
d8_
;
StaticallyIndexedArray
<
d1_t
,
8
>
d1x8_
;
StaticallyIndexedArray
<
d2_t
,
4
>
d2x4_
;
StaticallyIndexedArray
<
d4_t
,
2
>
d4x2_
;
StaticallyIndexedArray
<
d8_t
,
1
>
d8x1_
;
StaticallyIndexedArray
_v2
<
d1_t
,
8
>
d1x8_
;
StaticallyIndexedArray
_v2
<
d2_t
,
4
>
d2x4_
;
StaticallyIndexedArray
_v2
<
d4_t
,
2
>
d4x2_
;
StaticallyIndexedArray
_v2
<
d8_t
,
1
>
d8x1_
;
}
data_
;
__host__
__device__
constexpr
vector_type
()
:
data_
{
type
{
0
}}
{}
...
...
@@ -361,11 +361,11 @@ struct vector_type<T, 16>
union
{
d16_t
d16_
;
StaticallyIndexedArray
<
d1_t
,
16
>
d1x16_
;
StaticallyIndexedArray
<
d2_t
,
8
>
d2x8_
;
StaticallyIndexedArray
<
d4_t
,
4
>
d4x4_
;
StaticallyIndexedArray
<
d8_t
,
2
>
d8x2_
;
StaticallyIndexedArray
<
d16_t
,
1
>
d16x1_
;
StaticallyIndexedArray
_v2
<
d1_t
,
16
>
d1x16_
;
StaticallyIndexedArray
_v2
<
d2_t
,
8
>
d2x8_
;
StaticallyIndexedArray
_v2
<
d4_t
,
4
>
d4x4_
;
StaticallyIndexedArray
_v2
<
d8_t
,
2
>
d8x2_
;
StaticallyIndexedArray
_v2
<
d16_t
,
1
>
d16x1_
;
}
data_
;
__host__
__device__
constexpr
vector_type
()
:
data_
{
type
{
0
}}
{}
...
...
@@ -448,12 +448,12 @@ struct vector_type<T, 32>
union
{
d32_t
d32_
;
StaticallyIndexedArray
<
d1_t
,
32
>
d1x32_
;
StaticallyIndexedArray
<
d2_t
,
16
>
d2x16_
;
StaticallyIndexedArray
<
d4_t
,
8
>
d4x8_
;
StaticallyIndexedArray
<
d8_t
,
4
>
d8x4_
;
StaticallyIndexedArray
<
d16_t
,
2
>
d16x2_
;
StaticallyIndexedArray
<
d32_t
,
1
>
d32x1_
;
StaticallyIndexedArray
_v2
<
d1_t
,
32
>
d1x32_
;
StaticallyIndexedArray
_v2
<
d2_t
,
16
>
d2x16_
;
StaticallyIndexedArray
_v2
<
d4_t
,
8
>
d4x8_
;
StaticallyIndexedArray
_v2
<
d8_t
,
4
>
d8x4_
;
StaticallyIndexedArray
_v2
<
d16_t
,
2
>
d16x2_
;
StaticallyIndexedArray
_v2
<
d32_t
,
1
>
d32x1_
;
}
data_
;
__host__
__device__
constexpr
vector_type
()
:
data_
{
type
{
0
}}
{}
...
...
@@ -545,13 +545,13 @@ struct vector_type<T, 64>
union
{
d64_t
d64_
;
StaticallyIndexedArray
<
d1_t
,
64
>
d1x64_
;
StaticallyIndexedArray
<
d2_t
,
32
>
d2x32_
;
StaticallyIndexedArray
<
d4_t
,
16
>
d4x16_
;
StaticallyIndexedArray
<
d8_t
,
8
>
d8x8_
;
StaticallyIndexedArray
<
d16_t
,
4
>
d16x4_
;
StaticallyIndexedArray
<
d32_t
,
2
>
d32x2_
;
StaticallyIndexedArray
<
d64_t
,
1
>
d64x1_
;
StaticallyIndexedArray
_v2
<
d1_t
,
64
>
d1x64_
;
StaticallyIndexedArray
_v2
<
d2_t
,
32
>
d2x32_
;
StaticallyIndexedArray
_v2
<
d4_t
,
16
>
d4x16_
;
StaticallyIndexedArray
_v2
<
d8_t
,
8
>
d8x8_
;
StaticallyIndexedArray
_v2
<
d16_t
,
4
>
d16x4_
;
StaticallyIndexedArray
_v2
<
d32_t
,
2
>
d32x2_
;
StaticallyIndexedArray
_v2
<
d64_t
,
1
>
d64x1_
;
}
data_
;
__host__
__device__
constexpr
vector_type
()
:
data_
{
type
{
0
}}
{}
...
...
@@ -654,14 +654,14 @@ struct vector_type<T, 128>
union
{
d128_t
d128_
;
StaticallyIndexedArray
<
d1_t
,
128
>
d1x128_
;
StaticallyIndexedArray
<
d2_t
,
64
>
d2x64_
;
StaticallyIndexedArray
<
d4_t
,
32
>
d4x32_
;
StaticallyIndexedArray
<
d8_t
,
16
>
d8x16_
;
StaticallyIndexedArray
<
d16_t
,
8
>
d16x8_
;
StaticallyIndexedArray
<
d32_t
,
4
>
d32x4_
;
StaticallyIndexedArray
<
d64_t
,
2
>
d64x2_
;
StaticallyIndexedArray
<
d128_t
,
1
>
d128x1_
;
StaticallyIndexedArray
_v2
<
d1_t
,
128
>
d1x128_
;
StaticallyIndexedArray
_v2
<
d2_t
,
64
>
d2x64_
;
StaticallyIndexedArray
_v2
<
d4_t
,
32
>
d4x32_
;
StaticallyIndexedArray
_v2
<
d8_t
,
16
>
d8x16_
;
StaticallyIndexedArray
_v2
<
d16_t
,
8
>
d16x8_
;
StaticallyIndexedArray
_v2
<
d32_t
,
4
>
d32x4_
;
StaticallyIndexedArray
_v2
<
d64_t
,
2
>
d64x2_
;
StaticallyIndexedArray
_v2
<
d128_t
,
1
>
d128x1_
;
}
data_
;
__host__
__device__
constexpr
vector_type
()
:
data_
{
type
{
0
}}
{}
...
...
@@ -773,15 +773,15 @@ struct vector_type<T, 256>
union
{
d256_t
d256_
;
StaticallyIndexedArray
<
d1_t
,
256
>
d1x256_
;
StaticallyIndexedArray
<
d2_t
,
128
>
d2x128_
;
StaticallyIndexedArray
<
d4_t
,
64
>
d4x64_
;
StaticallyIndexedArray
<
d8_t
,
32
>
d8x32_
;
StaticallyIndexedArray
<
d16_t
,
16
>
d16x16_
;
StaticallyIndexedArray
<
d32_t
,
8
>
d32x8_
;
StaticallyIndexedArray
<
d64_t
,
4
>
d64x4_
;
StaticallyIndexedArray
<
d128_t
,
2
>
d128x2_
;
StaticallyIndexedArray
<
d256_t
,
1
>
d256x1_
;
StaticallyIndexedArray
_v2
<
d1_t
,
256
>
d1x256_
;
StaticallyIndexedArray
_v2
<
d2_t
,
128
>
d2x128_
;
StaticallyIndexedArray
_v2
<
d4_t
,
64
>
d4x64_
;
StaticallyIndexedArray
_v2
<
d8_t
,
32
>
d8x32_
;
StaticallyIndexedArray
_v2
<
d16_t
,
16
>
d16x16_
;
StaticallyIndexedArray
_v2
<
d32_t
,
8
>
d32x8_
;
StaticallyIndexedArray
_v2
<
d64_t
,
4
>
d64x4_
;
StaticallyIndexedArray
_v2
<
d128_t
,
2
>
d128x2_
;
StaticallyIndexedArray
_v2
<
d256_t
,
1
>
d256x1_
;
}
data_
;
__host__
__device__
constexpr
vector_type
()
:
data_
{
type
{
0
}}
{}
...
...
composable_kernel/include/utility/statically_indexed_array.hpp
View file @
a006aa63
...
...
@@ -54,5 +54,49 @@ __host__ __device__ constexpr auto make_statically_indexed_array()
return
StaticallyIndexedArray
<
X
,
0
>
();
}
template
<
typename
T
,
index_t
N
>
struct
StaticallyIndexedArray_v2
{
__host__
__device__
constexpr
StaticallyIndexedArray_v2
()
=
default
;
__host__
__device__
static
constexpr
index_t
Size
()
{
return
N
;
}
// read access
template
<
index_t
I
>
__host__
__device__
constexpr
const
auto
&
At
(
Number
<
I
>
)
const
{
static_assert
(
I
<
N
,
"wrong! out of range"
);
return
data_
[
I
];
}
// write access
template
<
index_t
I
>
__host__
__device__
constexpr
auto
&
At
(
Number
<
I
>
)
{
static_assert
(
I
<
N
,
"wrong! out of range"
);
return
data_
[
I
];
}
// read access
template
<
index_t
I
>
__host__
__device__
constexpr
const
auto
&
operator
[](
Number
<
I
>
i
)
const
{
return
At
(
i
);
}
// write access
template
<
index_t
I
>
__host__
__device__
constexpr
auto
&
operator
()(
Number
<
I
>
i
)
{
return
At
(
i
);
}
__host__
__device__
static
constexpr
bool
IsStaticBuffer
()
{
return
true
;
}
T
data_
[
N
];
};
}
// namespace ck
#endif
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment