Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel
Commits
7bbae9af
Unverified
Commit
7bbae9af
authored
Oct 30, 2023
by
Bartłomiej Kocot
Committed by
GitHub
Oct 30, 2023
Browse files
Merge branch 'develop' into barkocot/image-to-column-with-groups
parents
36f54418
f46a6ffa
Changes
6
Show whitespace changes
Inline
Side-by-side
Showing
6 changed files
with
12 additions
and
10 deletions
+12
-10
docs/sphinx/requirements.in
docs/sphinx/requirements.in
+1
-1
docs/sphinx/requirements.txt
docs/sphinx/requirements.txt
+1
-1
example/27_layernorm/run_layernorm_example.inc
example/27_layernorm/run_layernorm_example.inc
+4
-4
example/42_groupnorm/run_groupnorm_example.inc
example/42_groupnorm/run_groupnorm_example.inc
+2
-2
include/ck/utility/type_convert.hpp
include/ck/utility/type_convert.hpp
+2
-0
profiler/include/profiler/profile_gemm_impl.hpp
profiler/include/profiler/profile_gemm_impl.hpp
+2
-2
No files found.
docs/sphinx/requirements.in
View file @
7bbae9af
rocm-docs-core>=0.20.0
rocm-docs-core>=0.20.0
sphinxcontrib-bibtex==2.
5.0
sphinxcontrib-bibtex==2.
6.1
docs/sphinx/requirements.txt
View file @
7bbae9af
...
@@ -139,7 +139,7 @@ sphinx-notfound-page==0.8.3
...
@@ -139,7 +139,7 @@ sphinx-notfound-page==0.8.3
# via rocm-docs-core
# via rocm-docs-core
sphinxcontrib-applehelp==1.0.4
sphinxcontrib-applehelp==1.0.4
# via sphinx
# via sphinx
sphinxcontrib-bibtex==2.
5.0
sphinxcontrib-bibtex==2.
6.1
# via -r requirements.in
# via -r requirements.in
sphinxcontrib-devhelp==1.0.2
sphinxcontrib-devhelp==1.0.2
# via sphinx
# via sphinx
...
...
example/27_layernorm/run_layernorm_example.inc
View file @
7bbae9af
example/42_groupnorm/run_groupnorm_example.inc
View file @
7bbae9af
include/ck/utility/type_convert.hpp
View file @
7bbae9af
...
@@ -100,6 +100,8 @@ template <>
...
@@ -100,6 +100,8 @@ template <>
inline
__host__
__device__
f8_t
type_convert
<
f8_t
,
float
>
(
float
x
)
inline
__host__
__device__
f8_t
type_convert
<
f8_t
,
float
>
(
float
x
)
{
{
#if defined(__gfx940__) || defined(__gfx941__) || defined(__gfx942__)
#if defined(__gfx940__) || defined(__gfx941__) || defined(__gfx942__)
float
max_fp8
=
240.0
f
;
x
=
x
>
max_fp8
?
max_fp8
:
(
x
<
-
max_fp8
?
-
max_fp8
:
x
);
union
union
{
{
float
fval
;
float
fval
;
...
...
profiler/include/profiler/profile_gemm_impl.hpp
View file @
7bbae9af
...
@@ -75,8 +75,8 @@ int profile_gemm_impl(int do_verification,
...
@@ -75,8 +75,8 @@ int profile_gemm_impl(int do_verification,
b_k_n
.
GenerateTensorValue
(
GeneratorTensor_2
<
BDataType
>
{
-
5
,
5
});
b_k_n
.
GenerateTensorValue
(
GeneratorTensor_2
<
BDataType
>
{
-
5
,
5
});
break
;
break
;
default:
default:
a_m_k
.
GenerateTensorValue
(
GeneratorTensor_3
<
ADataType
>
{
0.0
,
1.0
});
a_m_k
.
GenerateTensorValue
(
GeneratorTensor_3
<
ADataType
>
{
0.0
,
0.1
});
b_k_n
.
GenerateTensorValue
(
GeneratorTensor_3
<
BDataType
>
{
-
0.5
,
0.5
});
b_k_n
.
GenerateTensorValue
(
GeneratorTensor_3
<
BDataType
>
{
-
0.
0
5
,
0.
0
5
});
}
}
using
AElementOp
=
ck
::
tensor_operation
::
element_wise
::
PassThrough
;
using
AElementOp
=
ck
::
tensor_operation
::
element_wise
::
PassThrough
;
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment