Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel_ROCM
Commits
ec1b65e7
Commit
ec1b65e7
authored
Jan 19, 2025
by
Aleksander Dudek
Browse files
[CK_TILE] Update the file structure
parent
aa30ef56
Changes
262
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
53 additions
and
53 deletions
+53
-53
example/ck_tile/01_fmha/bias.hpp
example/ck_tile/01_fmha/bias.hpp
+2
-2
example/ck_tile/01_fmha/fmha_bwd.hpp
example/ck_tile/01_fmha/fmha_bwd.hpp
+4
-4
example/ck_tile/01_fmha/fmha_fwd.hpp
example/ck_tile/01_fmha/fmha_fwd.hpp
+4
-4
example/ck_tile/01_fmha/mask.hpp
example/ck_tile/01_fmha/mask.hpp
+2
-2
example/ck_tile/01_fmha/rotary.hpp
example/ck_tile/01_fmha/rotary.hpp
+2
-2
example/ck_tile/02_layernorm2d/layernorm2d_fwd.hpp
example/ck_tile/02_layernorm2d/layernorm2d_fwd.hpp
+3
-3
example/ck_tile/03_gemm/gemm_basic.hpp
example/ck_tile/03_gemm/gemm_basic.hpp
+3
-3
example/ck_tile/04_img2col/image_to_column.hpp
example/ck_tile/04_img2col/image_to_column.hpp
+3
-3
example/ck_tile/05_reduce/reduce.hpp
example/ck_tile/05_reduce/reduce.hpp
+4
-4
example/ck_tile/06_permute/alternative_impl/matrix_core_swizzle_kernel.hpp
...6_permute/alternative_impl/matrix_core_swizzle_kernel.hpp
+2
-2
example/ck_tile/06_permute/permute.hpp
example/ck_tile/06_permute/permute.hpp
+3
-3
example/ck_tile/09_topk_softmax/topk_softmax.cpp
example/ck_tile/09_topk_softmax/topk_softmax.cpp
+2
-2
example/ck_tile/09_topk_softmax/topk_softmax_api.hpp
example/ck_tile/09_topk_softmax/topk_softmax_api.hpp
+2
-2
example/ck_tile/10_rmsnorm2d/example_rmsnorm2d_fwd.cpp
example/ck_tile/10_rmsnorm2d/example_rmsnorm2d_fwd.cpp
+2
-2
example/ck_tile/10_rmsnorm2d/rmsnorm2d_fwd.hpp
example/ck_tile/10_rmsnorm2d/rmsnorm2d_fwd.hpp
+3
-3
example/ck_tile/11_add_rmsnorm2d_rdquant/add_rmsnorm2d_rdquant_fwd.hpp
...le/11_add_rmsnorm2d_rdquant/add_rmsnorm2d_rdquant_fwd.hpp
+3
-3
example/ck_tile/11_add_rmsnorm2d_rdquant/example_add_rmsnorm2d_rdquant_fwd.cpp
...d_rmsnorm2d_rdquant/example_add_rmsnorm2d_rdquant_fwd.cpp
+2
-2
example/ck_tile/12_smoothquant/example_smoothquant.cpp
example/ck_tile/12_smoothquant/example_smoothquant.cpp
+2
-2
example/ck_tile/12_smoothquant/smoothquant.hpp
example/ck_tile/12_smoothquant/smoothquant.hpp
+3
-3
example/ck_tile/13_moe_sorting/moe_sorting.cpp
example/ck_tile/13_moe_sorting/moe_sorting.cpp
+2
-2
No files found.
example/ck_tile/01_fmha/bias.hpp
View file @
ec1b65e7
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
5
, Advanced Micro Devices, Inc. All rights reserved.
#pragma once
#include <ostream>
#include <string>
#include "ck_tile/core.hpp"
#include "ck_tile/ops/fmha.hpp"
#include "ck_tile/
device/
ops/fmha.hpp"
// keep sync with BlockAttentionBiasEnum
enum
class
bias_enum
...
...
example/ck_tile/01_fmha/fmha_bwd.hpp
View file @
ec1b65e7
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
5
, Advanced Micro Devices, Inc. All rights reserved.
#pragma once
#include "ck_tile/core.hpp"
#include "ck_tile/host/kernel_launch.hpp"
#include "ck_tile/ops/fmha.hpp"
#include "ck_tile/ops/epilogue.hpp"
#include "ck_tile/host/
util/
kernel_launch.hpp"
#include "ck_tile/
device/
ops/fmha.hpp"
#include "ck_tile/
device/
ops/epilogue.hpp"
#include "mask.hpp"
#include "bias.hpp"
...
...
example/ck_tile/01_fmha/fmha_fwd.hpp
View file @
ec1b65e7
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
5
, Advanced Micro Devices, Inc. All rights reserved.
#pragma once
#include "ck_tile/core.hpp"
#include "ck_tile/host/kernel_launch.hpp"
#include "ck_tile/ops/epilogue.hpp"
#include "ck_tile/ops/fmha.hpp"
#include "ck_tile/host/
util/
kernel_launch.hpp"
#include "ck_tile/
device/
ops/epilogue.hpp"
#include "ck_tile/
device/
ops/fmha.hpp"
#include "bias.hpp"
#include "mask.hpp"
...
...
example/ck_tile/01_fmha/mask.hpp
View file @
ec1b65e7
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
5
, Advanced Micro Devices, Inc. All rights reserved.
#pragma once
...
...
@@ -7,7 +7,7 @@
#include <string>
#include "ck_tile/core.hpp"
#include "ck_tile/ops/fmha.hpp"
#include "ck_tile/
device/
ops/fmha.hpp"
// keep this in sync with ck_tile::GenericAttentionMaskEnum
enum
class
mask_enum
...
...
example/ck_tile/01_fmha/rotary.hpp
View file @
ec1b65e7
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
5
, Advanced Micro Devices, Inc. All rights reserved.
#pragma once
#include "ck_tile/core.hpp"
#include "ck_tile/host/host_tensor.hpp"
#include "ck_tile/host/
util/
host_tensor.hpp"
#include <cassert>
#include <cmath>
...
...
example/ck_tile/02_layernorm2d/layernorm2d_fwd.hpp
View file @
ec1b65e7
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
5
, Advanced Micro Devices, Inc. All rights reserved.
#pragma once
#include "ck_tile/core.hpp"
#include "ck_tile/host/kernel_launch.hpp"
#include "ck_tile/ops/layernorm2d.hpp"
#include "ck_tile/host/
util/
kernel_launch.hpp"
#include "ck_tile/
device/
ops/layernorm2d.hpp"
#include <string>
template
<
typename
InType
,
typename
OutType
,
typename
XScaleDataType_
,
typename
YScaleDataType_
>
...
...
example/ck_tile/03_gemm/gemm_basic.hpp
View file @
ec1b65e7
...
...
@@ -6,9 +6,9 @@
#include <string>
#include "ck_tile/host.hpp"
#include "ck_tile/host/kernel_launch.hpp"
#include "ck_tile/ops/gemm.hpp"
#include "ck_tile/ops/epilogue.hpp"
#include "ck_tile/host/
util/
kernel_launch.hpp"
#include "ck_tile/
device/
ops/gemm.hpp"
#include "ck_tile/
device/
ops/epilogue.hpp"
template
<
typename
DataType
>
struct
GemmBasicTypeConfig
;
...
...
example/ck_tile/04_img2col/image_to_column.hpp
View file @
ec1b65e7
// SPDX-License-Identifier: MIT
// Copyright (c) 202
4
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 202
5
, Advanced Micro Devices, Inc. All rights reserved.
#pragma once
#include "ck_tile/core.hpp"
#include "ck_tile/host/kernel_launch.hpp"
#include "ck_tile/ops/image_to_column.hpp"
#include "ck_tile/host/
util/
kernel_launch.hpp"
#include "ck_tile/
device/
ops/image_to_column.hpp"
#include <string>
#define DefaultConvParams \
...
...
example/ck_tile/05_reduce/reduce.hpp
View file @
ec1b65e7
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
5
, Advanced Micro Devices, Inc. All rights reserved.
#pragma once
#include "ck_tile/core.hpp"
#include "ck_tile/ops/common.hpp"
#include "ck_tile/ops/reduce/block/block_reduce.hpp"
#include "ck_tile/ops/reduce/block/block_reduce2d_default_policy.hpp"
#include "ck_tile/
device/
ops/common.hpp"
#include "ck_tile/
device/
ops/reduce/block/block_reduce.hpp"
#include "ck_tile/
device/
ops/reduce/block/block_reduce2d_default_policy.hpp"
namespace
ck_tile
{
...
...
example/ck_tile/06_permute/alternative_impl/matrix_core_swizzle_kernel.hpp
View file @
ec1b65e7
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
5
, Advanced Micro Devices, Inc. All rights reserved.
#pragma once
#include "ck_tile/core.hpp"
#include "ck_tile/host.hpp"
#include "ck_tile/ops/gemm.hpp"
#include "ck_tile/
device/
ops/gemm.hpp"
// if set to 1, slightly more instructions generated to calculate address
#ifndef MERGE_2D_013425
...
...
example/ck_tile/06_permute/permute.hpp
View file @
ec1b65e7
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
5
, Advanced Micro Devices, Inc. All rights reserved.
#pragma once
#include "ck_tile/core.hpp"
#include "ck_tile/host/kernel_launch.hpp"
#include "ck_tile/ops/permute.hpp"
#include "ck_tile/host/
util/
kernel_launch.hpp"
#include "ck_tile/
device/
ops/permute.hpp"
#include <string>
struct
permute_traits
...
...
example/ck_tile/09_topk_softmax/topk_softmax.cpp
View file @
ec1b65e7
// SPDX-License-Identifier: MIT
// Copyright (c) 202
4
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 202
5
, Advanced Micro Devices, Inc. All rights reserved.
#include <vector>
#include <iostream>
...
...
@@ -11,7 +11,7 @@
#include <unordered_set>
#include "ck_tile/core.hpp"
#include "ck_tile/ops/reduce.hpp"
#include "ck_tile/
device/
ops/reduce.hpp"
#include "topk_softmax_api.hpp"
#if 0
...
...
example/ck_tile/09_topk_softmax/topk_softmax_api.hpp
View file @
ec1b65e7
// SPDX-License-Identifier: MIT
// Copyright (c) 202
4
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 202
5
, Advanced Micro Devices, Inc. All rights reserved.
#pragma once
#include "ck_tile/core.hpp"
#include "ck_tile/host.hpp"
#include "ck_tile/ops/topk_softmax.hpp"
#include "ck_tile/
device/
ops/topk_softmax.hpp"
#include <string>
struct
topk_softmax_trait
...
...
example/ck_tile/10_rmsnorm2d/example_rmsnorm2d_fwd.cpp
View file @
ec1b65e7
#include "ck_tile/host.hpp"
#include "ck_tile/core.hpp"
#include "ck_tile/host/kernel_launch.hpp"
#include "ck_tile/ops/rmsnorm2d.hpp"
#include "ck_tile/host/
util/
kernel_launch.hpp"
#include "ck_tile/
device/
ops/rmsnorm2d.hpp"
#include <cstring>
auto
create_args
(
int
argc
,
char
*
argv
[])
...
...
example/ck_tile/10_rmsnorm2d/rmsnorm2d_fwd.hpp
View file @
ec1b65e7
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
5
, Advanced Micro Devices, Inc. All rights reserved.
#pragma once
#include "ck_tile/core.hpp"
#include "ck_tile/host/kernel_launch.hpp"
#include "ck_tile/ops/rmsnorm2d.hpp"
#include "ck_tile/host/
util/
kernel_launch.hpp"
#include "ck_tile/
device/
ops/rmsnorm2d.hpp"
#include <string>
template
<
typename
DataType
>
...
...
example/ck_tile/11_add_rmsnorm2d_rdquant/add_rmsnorm2d_rdquant_fwd.hpp
View file @
ec1b65e7
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
5
, Advanced Micro Devices, Inc. All rights reserved.
#pragma once
#include "ck_tile/core.hpp"
#include "ck_tile/host/kernel_launch.hpp"
#include "ck_tile/ops/add_rmsnorm2d_rdquant.hpp"
#include "ck_tile/host/
util/
kernel_launch.hpp"
#include "ck_tile/
device/
ops/add_rmsnorm2d_rdquant.hpp"
#include <string>
template
<
typename
DataType
>
...
...
example/ck_tile/11_add_rmsnorm2d_rdquant/example_add_rmsnorm2d_rdquant_fwd.cpp
View file @
ec1b65e7
#include "ck_tile/host.hpp"
#include "ck_tile/core.hpp"
#include "ck_tile/host/kernel_launch.hpp"
#include "ck_tile/ops/add_rmsnorm2d_rdquant.hpp"
#include "ck_tile/host/
util/
kernel_launch.hpp"
#include "ck_tile/
device/
ops/add_rmsnorm2d_rdquant.hpp"
#include <cstring>
// different threshold for different dtype
...
...
example/ck_tile/12_smoothquant/example_smoothquant.cpp
View file @
ec1b65e7
#include "ck_tile/host.hpp"
#include "ck_tile/core.hpp"
#include "ck_tile/host/kernel_launch.hpp"
#include "ck_tile/ops/smoothquant.hpp"
#include "ck_tile/host/
util/
kernel_launch.hpp"
#include "ck_tile/
device/
ops/smoothquant.hpp"
#include <cstring>
// different threshold for different dtype
...
...
example/ck_tile/12_smoothquant/smoothquant.hpp
View file @
ec1b65e7
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
4
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
5
, Advanced Micro Devices, Inc. All rights reserved.
#pragma once
#include "ck_tile/core.hpp"
#include "ck_tile/host/kernel_launch.hpp"
#include "ck_tile/ops/smoothquant.hpp"
#include "ck_tile/host/
util/
kernel_launch.hpp"
#include "ck_tile/
device/
ops/smoothquant.hpp"
#include <string>
template
<
typename
DataType
>
...
...
example/ck_tile/13_moe_sorting/moe_sorting.cpp
View file @
ec1b65e7
// SPDX-License-Identifier: MIT
// Copyright (c) 202
4
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 202
5
, Advanced Micro Devices, Inc. All rights reserved.
#include <set>
#include <vector>
...
...
@@ -12,7 +12,7 @@
#include <unordered_set>
#include "ck_tile/core.hpp"
#include "ck_tile/ops/reduce.hpp"
#include "ck_tile/
device/
ops/reduce.hpp"
#include "moe_sorting_api.hpp"
auto
create_args
(
int
argc
,
char
*
argv
[])
...
...
Prev
1
2
3
4
5
…
14
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment