profiler.cpp 5.4 KB
Newer Older
Chao Liu's avatar
Chao Liu committed
1
2
3
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-2022, Advanced Micro Devices, Inc. All rights reserved.

4
#include <cstring>
5

Chao Liu's avatar
Chao Liu committed
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
int profile_gemm(int, char*[]);
int profile_gemm_splitk(int, char*[]);
int profile_gemm_bilinear(int, char*[]);
int profile_gemm_add_add_fastgelu(int, char*[]);
int profile_gemm_reduce(int, char*[]);
int profile_gemm_bias_add_reduce(int, char*[]);
int profile_batched_gemm(int, char*[]);
int profile_batched_gemm_gemm(int, char*[]);
int profile_batched_gemm_add_relu_gemm_add(int, char*[]);
int profile_batched_gemm_reduce(int, char*[]);
int profile_grouped_gemm(int, char*[]);
int profile_conv_fwd(int, char*[]);
int profile_conv_fwd_bias_relu(int, char*[]);
int profile_conv_fwd_bias_relu_add(int, char*[]);
int profile_conv_bwd_data(int, char*[]);
int profile_grouped_conv_fwd(int, char*[]);
22
int profile_grouped_conv_bwd_weight(int, char*[]);
23
int profile_softmax(int, char*[]);
rocking5566's avatar
rocking5566 committed
24
int profile_layernorm(int, char*[]);
rocking5566's avatar
rocking5566 committed
25
int profile_groupnorm(int, char*[]);
Chao Liu's avatar
Chao Liu committed
26
int profile_reduce(int, char*[]);
27
int profile_batchnorm_forward(int, char*[]);
28
int profile_batchnorm_backward(int, char*[]);
29
30
31
32

static void print_helper_message()
{
    // clang-format off
Chao Liu's avatar
Chao Liu committed
33
34
    printf("arg1: tensor operation (gemm: GEMM\n"
           "                        gemm_splitk: Split-K GEMM\n"
Chao Liu's avatar
Chao Liu committed
35
           "                        gemm_bilinear: GEMM+Bilinear\n"
Chao Liu's avatar
Chao Liu committed
36
37
           "                        gemm_add_add_fastgelu: GEMM+Add+Add+FastGeLU\n"
           "                        gemm_reduce: GEMM+Reduce\n"
Chao Liu's avatar
Chao Liu committed
38
           "                        gemm_bias_add_reduce: GEMM+Bias+Add+Reduce\n"
Chao Liu's avatar
Chao Liu committed
39
           "                        batched_gemm: Batched GEMM\n"
40
41
           "                        batched_gemm_gemm: Batched+GEMM+GEMM\n"
           "                        batched_gemm_add_relu_gemm_add: Batched+GEMM+bias+gelu+GEMM+bias\n"
Chao Liu's avatar
Chao Liu committed
42
           "                        batched_gemm_reduce: Batched GEMM+Reduce\n"
Chao Liu's avatar
Chao Liu committed
43
           "                        grouped_gemm: Grouped GEMM\n"
44
           "                        conv_fwd: Convolution Forward\n"
Chao Liu's avatar
Chao Liu committed
45
46
           "                        conv_fwd_bias_relu: ForwardConvolution+Bias+ReLU\n"
           "                        conv_fwd_bias_relu_add: ForwardConvolution+Bias+ReLU+Add\n"
47
48
           "                        conv_bwd_data: Convolution Backward Data\n"
           "                        grouped_conv_fwd: Grouped Convolution Forward\n"
49
           "                        grouped_conv_bwd_weight: Grouped Convolution Backward Weight\n"
50
           "                        softmax: Softmax\n"
51
52
           "                        reduce: Reduce\n"
	   "                        bnorm_fwd: Batchnorm forward\n");
53
54
    // clang-format on
}
55
56
57

int main(int argc, char* argv[])
{
58
59
60
61
62
63
    if(argc == 1)
    {
        print_helper_message();

        return 0;
    }
64
    else if(strcmp(argv[1], "gemm") == 0)
65
    {
Chao Liu's avatar
Chao Liu committed
66
        return profile_gemm(argc, argv);
67
    }
Chao Liu's avatar
Chao Liu committed
68
69
70
71
    else if(strcmp(argv[1], "gemm_splitk") == 0)
    {
        return profile_gemm_splitk(argc, argv);
    }
Chao Liu's avatar
Chao Liu committed
72
    else if(strcmp(argv[1], "gemm_bilinear") == 0)
Chao Liu's avatar
Chao Liu committed
73
    {
Chao Liu's avatar
Chao Liu committed
74
        return profile_gemm_bilinear(argc, argv);
Chao Liu's avatar
Chao Liu committed
75
    }
Chao Liu's avatar
Chao Liu committed
76
    else if(strcmp(argv[1], "gemm_add_add_fastgelu") == 0)
Chao Liu's avatar
Chao Liu committed
77
    {
Chao Liu's avatar
Chao Liu committed
78
        return profile_gemm_add_add_fastgelu(argc, argv);
Chao Liu's avatar
Chao Liu committed
79
    }
Chao Liu's avatar
Chao Liu committed
80
81
82
83
    else if(strcmp(argv[1], "gemm_reduce") == 0)
    {
        return profile_gemm_reduce(argc, argv);
    }
84
85
86
87
    else if(strcmp(argv[1], "gemm_bias_add_reduce") == 0)
    {
        return profile_gemm_bias_add_reduce(argc, argv);
    }
zjing14's avatar
zjing14 committed
88
89
90
91
    else if(strcmp(argv[1], "batched_gemm") == 0)
    {
        return profile_batched_gemm(argc, argv);
    }
92
93
94
95
96
97
98
99
    else if(strcmp(argv[1], "batched_gemm_gemm") == 0)
    {
        return profile_batched_gemm_gemm(argc, argv);
    }
    else if(strcmp(argv[1], "batched_gemm_add_relu_gemm_add") == 0)
    {
        return profile_batched_gemm_add_relu_gemm_add(argc, argv);
    }
100
101
102
103
    else if(strcmp(argv[1], "batched_gemm_reduce") == 0)
    {
        return profile_batched_gemm_reduce(argc, argv);
    }
Chao Liu's avatar
Chao Liu committed
104
105
    else if(strcmp(argv[1], "grouped_gemm") == 0)
    {
Chao Liu's avatar
Chao Liu committed
106
        return profile_grouped_gemm(argc, argv);
Chao Liu's avatar
Chao Liu committed
107
    }
Chao Liu's avatar
Chao Liu committed
108
    else if(strcmp(argv[1], "conv_fwd") == 0)
109
    {
110
        return profile_conv_fwd(argc, argv);
Chao Liu's avatar
Chao Liu committed
111
112
113
114
115
116
117
118
119
    }
    else if(strcmp(argv[1], "conv_fwd_bias_relu") == 0)
    {
        return profile_conv_fwd_bias_relu(argc, argv);
    }
    else if(strcmp(argv[1], "conv_fwd_bias_relu_add") == 0)
    {
        return profile_conv_fwd_bias_relu_add(argc, argv);
    }
120
    else if(strcmp(argv[1], "conv_bwd_data") == 0)
121
    {
122
        return profile_conv_bwd_data(argc, argv);
123
    }
124
    else if(strcmp(argv[1], "grouped_conv_fwd") == 0)
125
    {
126
        return profile_grouped_conv_fwd(argc, argv);
127
    }
128
129
130
131
    else if(strcmp(argv[1], "conv_bwd_weight") == 0)
    {
        return profile_grouped_conv_bwd_weight(argc, argv);
    }
Chao Liu's avatar
Chao Liu committed
132
    else if(strcmp(argv[1], "reduce") == 0)
133
    {
Chao Liu's avatar
Chao Liu committed
134
        return profile_reduce(argc, argv);
135
    }
136
    else if(strcmp(argv[1], "softmax") == 0)
137
    {
138
        return profile_softmax(argc, argv);
139
    }
rocking5566's avatar
rocking5566 committed
140
141
142
143
    else if(strcmp(argv[1], "layernorm") == 0)
    {
        return profile_layernorm(argc, argv);
    }
rocking5566's avatar
rocking5566 committed
144
145
146
147
    else if(strcmp(argv[1], "groupnorm") == 0)
    {
        return profile_groupnorm(argc, argv);
    }
148
149
150
151
    else if(strcmp(argv[1], "bnorm_fwd") == 0)
    {
        return profile_batchnorm_forward(argc, argv);
    }
152
153
154
155
    else if(strcmp(argv[1], "bnorm_bwd") == 0)
    {
        return profile_batchnorm_backward(argc, argv);
    }
156
157
    else
    {
158
159
160
        print_helper_message();

        return 0;
161
    }
162
}