Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel_ROCM
Commits
3e4d0ff3
"vscode:/vscode.git/clone" did not exist on "9da92cdb0f657d23ccf5594387398e4033a76f58"
Commit
3e4d0ff3
authored
Mar 19, 2024
by
Jakub Piasecki
Browse files
Merge remote-tracking branch 'origin/develop' into ggemm_multid_two_stage
parents
1ad29336
9e011bcd
Changes
256
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
67 additions
and
18 deletions
+67
-18
client_example/11_grouped_conv_bwd_weight/grouped_conv3d_bwd_weight_fp16_comp_bf8_fp8.cpp
...wd_weight/grouped_conv3d_bwd_weight_fp16_comp_bf8_fp8.cpp
+1
-1
client_example/11_grouped_conv_bwd_weight/grouped_conv3d_bwd_weight_fp32.cpp
...rouped_conv_bwd_weight/grouped_conv3d_bwd_weight_fp32.cpp
+1
-1
client_example/12_elementwise_normalization/elementwise_layernorm2d.cpp
.../12_elementwise_normalization/elementwise_layernorm2d.cpp
+1
-1
client_example/13_batchnorm/batchnorm_bwd_nhwc.cpp
client_example/13_batchnorm/batchnorm_bwd_nhwc.cpp
+1
-1
client_example/13_batchnorm/batchnorm_fwd_nhwc.cpp
client_example/13_batchnorm/batchnorm_fwd_nhwc.cpp
+1
-1
client_example/13_batchnorm/batchnorm_infer_nhwc.cpp
client_example/13_batchnorm/batchnorm_infer_nhwc.cpp
+1
-1
client_example/14_instance_id/batchnorm_fwd_instance_id.cpp
client_example/14_instance_id/batchnorm_fwd_instance_id.cpp
+1
-1
client_example/15_convnd_bwd_data/conv3d_bwd_data_fp16.cpp
client_example/15_convnd_bwd_data/conv3d_bwd_data_fp16.cpp
+1
-1
client_example/15_convnd_bwd_data/conv3d_bwd_data_fp32.cpp
client_example/15_convnd_bwd_data/conv3d_bwd_data_fp32.cpp
+1
-1
client_example/15_gemm_add_multiply/gemm_add_multiply.cpp
client_example/15_gemm_add_multiply/gemm_add_multiply.cpp
+1
-1
client_example/15_reduce/reduce_nhwc_c.cpp
client_example/15_reduce/reduce_nhwc_c.cpp
+1
-1
client_example/16_convnd_fwd/CMakeLists.txt
client_example/16_convnd_fwd/CMakeLists.txt
+3
-0
client_example/16_convnd_fwd/conv3d_fwd_fp16.cpp
client_example/16_convnd_fwd/conv3d_fwd_fp16.cpp
+1
-1
client_example/16_convnd_fwd/conv3d_fwd_fp16_comp_fp8.cpp
client_example/16_convnd_fwd/conv3d_fwd_fp16_comp_fp8.cpp
+1
-1
client_example/16_convnd_fwd/conv3d_fwd_fp32.cpp
client_example/16_convnd_fwd/conv3d_fwd_fp32.cpp
+1
-1
client_example/16_convnd_fwd/conv3d_fwd_fp8.cpp
client_example/16_convnd_fwd/conv3d_fwd_fp8.cpp
+46
-0
client_example/17_grouped_gemm_fastgelu/grouped_gemm_fastgelu.cpp
...xample/17_grouped_gemm_fastgelu/grouped_gemm_fastgelu.cpp
+1
-1
client_example/18_groupnorm/groupnorm_bwd_data.cpp
client_example/18_groupnorm/groupnorm_bwd_data.cpp
+1
-1
client_example/18_groupnorm/groupnorm_bwd_gamma_beta.cpp
client_example/18_groupnorm/groupnorm_bwd_gamma_beta.cpp
+1
-1
client_example/18_groupnorm/groupnorm_swish_fwd.cpp
client_example/18_groupnorm/groupnorm_swish_fwd.cpp
+1
-1
No files found.
client_example/11_grouped_conv_bwd_weight/grouped_conv3d_bwd_weight_fp16_comp_bf8_fp8.cpp
View file @
3e4d0ff3
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
3
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
#include "common.hpp"
...
...
client_example/11_grouped_conv_bwd_weight/grouped_conv3d_bwd_weight_fp32.cpp
View file @
3e4d0ff3
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
3
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
#include "common.hpp"
...
...
client_example/12_elementwise_normalization/elementwise_layernorm2d.cpp
View file @
3e4d0ff3
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
3
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
#include <iomanip>
#include <vector>
...
...
client_example/13_batchnorm/batchnorm_bwd_nhwc.cpp
View file @
3e4d0ff3
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
3
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
#include <functional>
#include <numeric>
...
...
client_example/13_batchnorm/batchnorm_fwd_nhwc.cpp
View file @
3e4d0ff3
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
3
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
#include <functional>
#include <numeric>
...
...
client_example/13_batchnorm/batchnorm_infer_nhwc.cpp
View file @
3e4d0ff3
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
3
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
#include <functional>
#include <numeric>
...
...
client_example/14_instance_id/batchnorm_fwd_instance_id.cpp
View file @
3e4d0ff3
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
3
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
#include <functional>
#include <numeric>
...
...
client_example/15_convnd_bwd_data/conv3d_bwd_data_fp16.cpp
View file @
3e4d0ff3
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
3
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
#include "common.hpp"
...
...
client_example/15_convnd_bwd_data/conv3d_bwd_data_fp32.cpp
View file @
3e4d0ff3
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
3
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
#include "common.hpp"
...
...
client_example/15_gemm_add_multiply/gemm_add_multiply.cpp
View file @
3e4d0ff3
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
3
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
#include <iomanip>
#include <vector>
...
...
client_example/15_reduce/reduce_nhwc_c.cpp
View file @
3e4d0ff3
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
3
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
#include <functional>
#include <numeric>
...
...
client_example/16_convnd_fwd/CMakeLists.txt
View file @
3e4d0ff3
...
...
@@ -7,6 +7,9 @@ endif()
# Guarded fp8 client examples: this block is entered when DTYPES matches "fp8"
# or when DTYPES is not defined at all. It declares two executables
# (client_conv3d_fwd_fp16_comp_fp8 and client_conv3d_fwd_fp8) and links each of
# them privately against composable_kernel::device_conv_operations.
if
((
DTYPES MATCHES
"fp8"
)
OR NOT DEFINED DTYPES
)
add_executable
(
client_conv3d_fwd_fp16_comp_fp8 conv3d_fwd_fp16_comp_fp8.cpp
)
target_link_libraries
(
client_conv3d_fwd_fp16_comp_fp8 PRIVATE composable_kernel::device_conv_operations
)
add_executable
(
client_conv3d_fwd_fp8 conv3d_fwd_fp8.cpp
)
target_link_libraries
(
client_conv3d_fwd_fp8 PRIVATE composable_kernel::device_conv_operations
)
endif
()
if
((
DTYPES MATCHES
"fp32"
)
OR NOT DEFINED DTYPES
)
...
...
client_example/16_convnd_fwd/conv3d_fwd_fp16.cpp
View file @
3e4d0ff3
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
3
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
#include "common.hpp"
...
...
client_example/16_convnd_fwd/conv3d_fwd_fp16_comp_fp8.cpp
View file @
3e4d0ff3
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
3
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
#include "common.hpp"
...
...
client_example/16_convnd_fwd/conv3d_fwd_fp32.cpp
View file @
3e4d0ff3
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
3
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
#include "common.hpp"
...
...
client_example/16_convnd_fwd/conv3d_fwd_fp8.cpp
0 → 100644
View file @
3e4d0ff3
// SPDX-License-Identifier: MIT
// Copyright (c) 2024, Advanced Micro Devices, Inc. All rights reserved.
#include "common.hpp"
#include "ck/ck.hpp"
#include "ck/tensor_operation/gpu/device/tensor_layout.hpp"
// Element types for the input, weight and output tensors (all ck::f8_t here).
using InDataType  = ck::f8_t;
using WeiDataType = ck::f8_t;
using OutDataType = ck::f8_t;

// Tensor layout tags for the input, weight and output tensors.
using InLayout  = ck::tensor_layout::convolution::NDHWGC;
using WeiLayout = ck::tensor_layout::convolution::GKZYXC;
using OutLayout = ck::tensor_layout::convolution::NDHWGK;

// Number of spatial dimensions handed to run_grouped_conv_fwd.
constexpr ck::index_t NumDimSpatial{3};

// Problem sizes. main() forwards them as the length lists
// {N, Di, Hi, Wi, G, C}, {G, K, Z, Y, X, C} and {N, Do, Ho, Wo, G, K},
// i.e. in the same order as the letters of the layout tags above.
constexpr ck::index_t G{1};
constexpr ck::index_t N{64};
constexpr ck::index_t K{128};
constexpr ck::index_t C{64};

// Extents used in the weight length list.
constexpr ck::index_t Z{3};
constexpr ck::index_t Y{3};
constexpr ck::index_t X{3};

// Extents used in the input length list.
constexpr ck::index_t Di{28};
constexpr ck::index_t Hi{28};
constexpr ck::index_t Wi{3};

// Extents used in the output length list.
constexpr ck::index_t Do{28};
constexpr ck::index_t Ho{28};
constexpr ck::index_t Wo{3};
int
main
()
{
return
run_grouped_conv_fwd
<
NumDimSpatial
,
InDataType
,
WeiDataType
,
OutDataType
,
InLayout
,
WeiLayout
,
OutLayout
,
3
,
ck
::
f8_t
>
(
{
N
,
Di
,
Hi
,
Wi
,
G
,
C
},
{
G
,
K
,
Z
,
Y
,
X
,
C
},
{
N
,
Do
,
Ho
,
Wo
,
G
,
K
})
?
EXIT_SUCCESS
:
EXIT_FAILURE
;
}
client_example/17_grouped_gemm_fastgelu/grouped_gemm_fastgelu.cpp
View file @
3e4d0ff3
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
3
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
#include <iomanip>
#include <iostream>
...
...
client_example/18_groupnorm/groupnorm_bwd_data.cpp
View file @
3e4d0ff3
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
3
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
#include <iomanip>
#include <vector>
...
...
client_example/18_groupnorm/groupnorm_bwd_gamma_beta.cpp
View file @
3e4d0ff3
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
3
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
#include <iomanip>
#include <vector>
...
...
client_example/18_groupnorm/groupnorm_swish_fwd.cpp
View file @
3e4d0ff3
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
3
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
#include <iomanip>
#include <vector>
...
...
Prev
1
2
3
4
5
6
7
…
13
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment