// device.hpp
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-2025, Advanced Micro Devices, Inc. All rights reserved.

#pragma once

#include "ck_tile/device/ops/common/generic_2d_block_shape.hpp"
#include "ck_tile/device/ops/common/tensor_layout.hpp"
#include "ck_tile/device/ops/common.hpp"
#include "ck_tile/device/ops/epilogue/cshuffle_epilogue.hpp"
#include "ck_tile/device/ops/epilogue/default_2d_epilogue.hpp"
#include "ck_tile/device/ops/epilogue/dynamic_quant_epilogue.hpp"
#include "ck_tile/device/ops/epilogue.hpp"
#include "ck_tile/device/ops/fmha/block/block_attention_bias_enum.hpp"
#include "ck_tile/device/ops/fmha/block/block_dropout.hpp"
#include "ck_tile/device/ops/fmha/block/block_masking.hpp"
#include "ck_tile/device/ops/fmha/block/block_position_encoding.hpp"
#include "ck_tile/device/ops/fmha/block/block_rotary_embedding.hpp"
#include "ck_tile/device/ops/fmha/block/page_block_navigator.hpp"
#include "ck_tile/device/ops/fmha/kernel/fmha_bwd_kernel.hpp"
#include "ck_tile/device/ops/fmha/kernel/fmha_fwd_appendkv_kernel.hpp"
#include "ck_tile/device/ops/fmha/kernel/fmha_fwd_appendkv_tile_partitioner.hpp"
#include "ck_tile/device/ops/fmha/kernel/fmha_fwd_kernel.hpp"
#include "ck_tile/device/ops/fmha/kernel/fmha_fwd_splitkv_combine_kernel.hpp"
#include "ck_tile/device/ops/fmha/kernel/fmha_fwd_splitkv_kernel.hpp"
#include "ck_tile/device/ops/fmha/pipeline/block_fmha_bwd_convert_dq.hpp"
#include "ck_tile/device/ops/fmha/pipeline/block_fmha_bwd_dot_do_o.hpp"
#include "ck_tile/device/ops/fmha/pipeline/block_fmha_bwd_dq_dk_dv_pipeline_kr_ktr_vr.hpp"
#include "ck_tile/device/ops/fmha/pipeline/block_fmha_bwd_dq_dk_dv_pipeline_kr_ktr_vr_iglp.hpp"
#include "ck_tile/device/ops/fmha/pipeline/block_fmha_bwd_pipeline_default_policy.hpp"
#include "ck_tile/device/ops/fmha/pipeline/block_fmha_bwd_pipeline_enum.hpp"
#include "ck_tile/device/ops/fmha/pipeline/block_fmha_bwd_pipeline_problem.hpp"
#include "ck_tile/device/ops/fmha/pipeline/block_fmha_fwd_appendkv_pipeline.hpp"
#include "ck_tile/device/ops/fmha/pipeline/block_fmha_fwd_appendkv_pipeline_default_policy.hpp"
#include "ck_tile/device/ops/fmha/pipeline/block_fmha_fwd_splitkv_combine_pipeline.hpp"
#include "ck_tile/device/ops/fmha/pipeline/block_fmha_fwd_splitkv_combine_pipeline_default_policy.hpp"
#include "ck_tile/device/ops/fmha/pipeline/block_fmha_fwd_splitkv_pipeline_nwarp_sshuffle_qr_ks_vs.hpp"
#include "ck_tile/device/ops/fmha/pipeline/block_fmha_fwd_splitkv_pipeline_nwarp_sshuffle_qr_ks_vs_default_policy.hpp"
#include "ck_tile/device/ops/fmha/pipeline/block_fmha_fwd_splitkv_pipeline_qr_ks_vs.hpp"
#include "ck_tile/device/ops/fmha/pipeline/block_fmha_fwd_splitkv_pipeline_qr_ks_vs_default_policy.hpp"
#include "ck_tile/device/ops/fmha/pipeline/block_fmha_pipeline_enum.hpp"
#include "ck_tile/device/ops/fmha/pipeline/block_fmha_pipeline_problem.hpp"
#include "ck_tile/device/ops/fmha/pipeline/block_fmha_pipeline_qr_ks_vs.hpp"
#include "ck_tile/device/ops/fmha/pipeline/block_fmha_pipeline_qr_ks_vs_async.hpp"
#include "ck_tile/device/ops/fmha/pipeline/block_fmha_pipeline_qr_ks_vs_async_default_policy.hpp"
#include "ck_tile/device/ops/fmha/pipeline/block_fmha_pipeline_qr_ks_vs_default_policy.hpp"
#include "ck_tile/device/ops/fmha/pipeline/block_fmha_pipeline_qr_ks_vs_fp8.hpp"
#include "ck_tile/device/ops/fmha/pipeline/block_fmha_pipeline_qs_ks_vs.hpp"
#include "ck_tile/device/ops/fmha/pipeline/block_fmha_pipeline_qs_ks_vs_default_policy.hpp"
#include "ck_tile/device/ops/fmha/pipeline/block_fmha_pipeline_qx_ks_vs_custom_policy.hpp"
#include "ck_tile/device/ops/fmha/pipeline/tile_fmha_shape.hpp"
#include "ck_tile/device/ops/fmha/pipeline/tile_fmha_traits.hpp"
#include "ck_tile/device/ops/fmha.hpp"
#include "ck_tile/device/ops/gemm/block/block_gemm_areg_bgmem_creg_v1.hpp"
#include "ck_tile/device/ops/gemm/block/block_gemm_areg_bgmem_creg_v1_default_policy.hpp"
#include "ck_tile/device/ops/gemm/block/block_gemm_areg_breg_creg_v1.hpp"
#include "ck_tile/device/ops/gemm/block/block_gemm_areg_breg_creg_v1_custom_policy.hpp"
#include "ck_tile/device/ops/gemm/block/block_gemm_areg_breg_creg_v1_default_policy.hpp"
#include "ck_tile/device/ops/gemm/block/block_gemm_areg_bsmem_creg_one_warp_v1.hpp"
#include "ck_tile/device/ops/gemm/block/block_gemm_areg_bsmem_creg_v1.hpp"
#include "ck_tile/device/ops/gemm/block/block_gemm_areg_bsmem_creg_v1_custom_policy.hpp"
#include "ck_tile/device/ops/gemm/block/block_gemm_areg_bsmem_creg_v1_default_policy.hpp"
#include "ck_tile/device/ops/gemm/block/block_gemm_areg_bsmem_creg_v2.hpp"
#include "ck_tile/device/ops/gemm/block/block_gemm_areg_bsmem_creg_v2_custom_policy.hpp"
#include "ck_tile/device/ops/gemm/block/block_gemm_areg_bsmem_creg_v2_default_policy.hpp"
#include "ck_tile/device/ops/gemm/block/block_gemm_asmem_breg_creg_v1.hpp"
#include "ck_tile/device/ops/gemm/block/block_gemm_asmem_breg_creg_v1_custom_policy.hpp"
#include "ck_tile/device/ops/gemm/block/block_gemm_asmem_breg_creg_v1_default_policy.hpp"
#include "ck_tile/device/ops/gemm/block/block_gemm_asmem_bsmem_creg_v1.hpp"
#include "ck_tile/device/ops/gemm/block/block_gemm_asmem_bsmem_creg_v1_custom_policy.hpp"
#include "ck_tile/device/ops/gemm/block/block_gemm_asmem_bsmem_creg_v1_default_policy.hpp"
#include "ck_tile/device/ops/gemm/block/block_gemm_problem.hpp"
#include "ck_tile/device/ops/gemm/block/block_universal_gemm_as_bs_cr.hpp"
#include "ck_tile/device/ops/gemm/kernel/batched_gemm_kernel.hpp"
#include "ck_tile/device/ops/gemm/kernel/gemm_kernel.hpp"
#include "ck_tile/device/ops/gemm/kernel/gemm_tile_partitioner.hpp"
#include "ck_tile/device/ops/gemm/kernel/grouped_gemm_kernel.hpp"
#include "ck_tile/device/ops/gemm/pipeline/gemm_pipeline_ag_bg_cr_base.hpp"
#include "ck_tile/device/ops/gemm/pipeline/gemm_pipeline_ag_bg_cr_comp_v3.hpp"
#include "ck_tile/device/ops/gemm/pipeline/gemm_pipeline_ag_bg_cr_mem.hpp"
#include "ck_tile/device/ops/gemm/pipeline/gemm_pipeline_ag_bg_cr_scheduler.hpp"
#include "ck_tile/device/ops/gemm/pipeline/gemm_pipeline_agmem_bgmem_creg_v1.hpp"
#include "ck_tile/device/ops/gemm/pipeline/gemm_pipeline_agmem_bgmem_creg_v1_default_policy.hpp"
#include "ck_tile/device/ops/gemm/pipeline/gemm_pipeline_agmem_bgmem_creg_v2.hpp"
#include "ck_tile/device/ops/gemm/pipeline/gemm_pipeline_agmem_bgmem_creg_v2_default_policy.hpp"
#include "ck_tile/device/ops/gemm/pipeline/gemm_pipeline_problem.hpp"
#include "ck_tile/device/ops/gemm/pipeline/gemm_universal_pipeline_ag_bg_cr_policy.hpp"
#include "ck_tile/device/ops/gemm/pipeline/tile_gemm_shape.hpp"
#include "ck_tile/device/ops/gemm/pipeline/tile_gemm_traits.hpp"
#include "ck_tile/device/ops/gemm/warp/warp_gemm.hpp"
#include "ck_tile/device/ops/gemm/warp/warp_gemm_attribute_mfma.hpp"
#include "ck_tile/device/ops/gemm/warp/warp_gemm_attribute_mfma_impl.hpp"
#include "ck_tile/device/ops/gemm/warp/warp_gemm_dispatcher.hpp"
#include "ck_tile/device/ops/gemm/warp/warp_gemm_impl.hpp"
#include "ck_tile/device/ops/gemm.hpp"
#include "ck_tile/device/ops/layernorm2d/kernel/layernorm2d_fwd_kernel.hpp"
#include "ck_tile/device/ops/layernorm2d/pipeline/layernorm2d_fwd_pipeline_default_policy.hpp"
#include "ck_tile/device/ops/layernorm2d/pipeline/layernorm2d_fwd_pipeline_one_pass.hpp"
#include "ck_tile/device/ops/layernorm2d/pipeline/layernorm2d_fwd_pipeline_problem.hpp"
#include "ck_tile/device/ops/layernorm2d/pipeline/layernorm2d_fwd_pipeline_two_pass.hpp"
#include "ck_tile/device/ops/layernorm2d/pipeline/layernorm2d_fwd_traits.hpp"
#include "ck_tile/device/ops/layernorm2d.hpp"
#include "ck_tile/device/ops/reduce/block/block_reduce.hpp"
#include "ck_tile/device/ops/reduce/block/block_reduce2d.hpp"
#include "ck_tile/device/ops/reduce/block/block_reduce2d_default_policy.hpp"
#include "ck_tile/device/ops/reduce/block/block_reduce2d_problem.hpp"
#include "ck_tile/device/ops/reduce.hpp"