common_header.hpp 1.96 KB
Newer Older
1
#pragma once
Chao Liu's avatar
Chao Liu committed
2
#include "config.hpp"
Chao Liu's avatar
Chao Liu committed
3
#include "array.hpp"
Chao Liu's avatar
Chao Liu committed
4
5
6
#include "container_helper.hpp"
#include "statically_indexed_array.hpp"
#include "container_element_picker.hpp"
7
#include "multi_index.hpp"
Chao Liu's avatar
Chao Liu committed
8
#include "data_type.hpp"
Chao Liu's avatar
Chao Liu committed
9
10
#include "data_type_enum.hpp"
#include "data_type_enum_helper.hpp"
Chao Liu's avatar
Chao Liu committed
11
12
13
#include "functional.hpp"
#include "functional2.hpp"
#include "functional3.hpp"
Chao Liu's avatar
Chao Liu committed
14
#include "functional4.hpp"
Chao Liu's avatar
Chao Liu committed
15
#include "enable_if.hpp"
16
#include "ignore.hpp"
Chao Liu's avatar
Chao Liu committed
17
18
19
20
21
22
23
24
#include "integral_constant.hpp"
#include "math.hpp"
#include "number.hpp"
#include "sequence.hpp"
#include "sequence_helper.hpp"
#include "tuple.hpp"
#include "tuple_helper.hpp"
#include "type.hpp"
25
#include "magic_division.hpp"
Chao Liu's avatar
Chao Liu committed
26
#include "c_style_pointer_cast.hpp"
27
28
#include "is_known_at_compile_time.hpp"
#include "transpose_vectors.hpp"
29
#include "inner_product.hpp"
Chao Liu's avatar
Chao Liu committed
30
#include "element_wise_operation.hpp"
Chao Liu's avatar
Chao Liu committed
31
#include "thread_group.hpp"
32
#include "debug.hpp"
33

34
#include "amd_buffer_addressing.hpp"
rocking5566's avatar
rocking5566 committed
35
#include "generic_memory_space_atomic.hpp"
36
37
38
39
40
41
#include "get_id.hpp"
#include "synchronization.hpp"
#include "amd_address_space.hpp"
#include "static_buffer.hpp"
#include "dynamic_buffer.hpp"

Chao Liu's avatar
Chao Liu committed
42
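// TODO: remove this (presumably the CK_USE_AMD_INLINE_ASM-guarded include of
// "amd_inline_asm.hpp" that follows -- confirm before acting)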
Chao Liu's avatar
Chao Liu committed
43
44
45
46
// Pull in "amd_inline_asm.hpp" only when CK_USE_AMD_INLINE_ASM evaluates to a
// non-zero value. Inside #if an undefined macro is treated as 0, so leaving
// the macro undefined also skips the include.
#if CK_USE_AMD_INLINE_ASM
#include "amd_inline_asm.hpp"
#endif // CK_USE_AMD_INLINE_ASM

47
// Pull in "amd_xdlops.hpp" only when CK_USE_AMD_MFMA is defined.
// Note: #ifdef tests whether the macro is defined, not its value, so a
// definition of 0 still enables the include (unlike the #if-based guard used
// for CK_USE_AMD_INLINE_ASM).
#ifdef CK_USE_AMD_MFMA
#include "amd_xdlops.hpp"
#endif // CK_USE_AMD_MFMA
Wenkai's avatar
Wenkai committed
50

wangshaojie6's avatar
wangshaojie6 committed
51
// Switch defined as 1 for every translation unit that includes this header.
// NOTE(review): the name is spelled "USEING" (sic). Code elsewhere presumably
// tests this exact spelling, so it is left unchanged -- confirm all users
// before renaming.
#define USEING_STATIC_KERNEL 1
Wenkai's avatar
Wenkai committed
52

Wenkai's avatar
Wenkai committed
53
54
55
56
// ---------------------------------------------------------------------------
// Compile-time matrix-size preset selection.
//
// Set one of the MNKB_* selectors below to 1 and the rest to 0. The chosen
// preset defines four object-like macros that are visible to every file
// including this header:
//
//   M_matrix, N_matrix, K_matrix, K_batch
//
// Notes:
//   * The selectors are tested in the order listed; if more than one is set
//     to 1, the first one in that order wins.
//   * Every preset currently carries the same values (16 / 4096 / 12800 / 5).
//     The branches are kept separate so each preset can be tuned on its own.
//   * If no selector is enabled the build stops with an explicit diagnostic
//     instead of silently leaving the size macros undefined.
// ---------------------------------------------------------------------------
#define MNKB_0_8 1
#define MNKB_1_4 0
#define MNKB_2_8 0
#define MNKB_3_5 0
#define MNKB_4_5 0
#define MNKB_5_5 0

#if MNKB_0_8
#define M_matrix 16
#define N_matrix 4096
#define K_matrix 12800
#define K_batch 5
#elif MNKB_1_4
#define M_matrix 16
#define N_matrix 4096
#define K_matrix 12800
#define K_batch 5
#elif MNKB_2_8
#define M_matrix 16
#define N_matrix 4096
#define K_matrix 12800
#define K_batch 5
#elif MNKB_3_5
#define M_matrix 16
#define N_matrix 4096
#define K_matrix 12800
#define K_batch 5
#elif MNKB_4_5
#define M_matrix 16
#define N_matrix 4096
#define K_matrix 12800
#define K_batch 5
#elif MNKB_5_5
#define M_matrix 16
#define N_matrix 4096
#define K_matrix 12800
#define K_batch 5
#else
#error "No MNKB_* preset selected: set exactly one MNKB_* selector to 1."
#endif