// SPDX-License-Identifier: MIT
// Copyright (c) 2018-2022, Advanced Micro Devices, Inc. All rights reserved.

#include <cstdio>
#include <cstring>

// Entry points of the individual operation profilers. They are only declared
// in this file; main() forwards its own argc/argv to whichever one matches the
// operation name given as the first command-line argument.

// GEMM family.
int profile_gemm(int, char*[]);
int profile_gemm_splitk(int, char*[]);
int profile_gemm_bias_2d(int, char*[]);
int profile_gemm_bias_relu(int, char*[]);
int profile_gemm_bias_relu_add(int, char*[]);
int profile_gemm_bias_add_reduce(int, char*[]);
int profile_gemm_add_add_fastgelu(int, char*[]);
int profile_gemm_reduce(int, char*[]);
int profile_batched_gemm(int, char*[]);
int profile_batched_gemm_reduce(int, char*[]);
int profile_grouped_gemm(int, char*[]);

// Convolution family.
// NOTE(review): profile_conv_fwd is declared but not referenced in this file;
// the "conv_fwd" operation is dispatched to profile_convnd_fwd instead.
int profile_conv_fwd(int, char*[]);
int profile_conv_fwd_bias_relu(int, char*[]);
int profile_conv_fwd_bias_relu_add(int, char*[]);
int profile_convnd_fwd(int argc, char* argv[]);
// The third argument is passed as 1, 2 or 3 by main() for the
// conv1d/conv2d/conv3d backward-data operations respectively.
int profile_convnd_bwd_data(int, char*[], int);
int profile_conv_bwd_weight(int, char*[]);

// Normalization (used for "batchnorm", "layernorm" and "softmax") and reduction.
int profile_normalization(int, char*[]);
int profile_reduce(int, char*[]);

// Print the usage text: the list of operation names accepted as the first
// command-line argument, one "name: description" entry per line, written with
// printf. Every name dispatched by main() is listed here.
static void print_helper_message()
{
    // clang-format off
    printf("arg1: tensor operation (gemm: GEMM\n"
           "                        gemm_splitk: Split-K GEMM\n"
           "                        gemm_bias_2d: GEMM+Bias(2D)\n"
           "                        gemm_bias_relu: GEMM+Bias+ReLU\n"
           "                        gemm_bias_relu_add: GEMM+Bias+ReLU+Add\n"
           "                        gemm_add_add_fastgelu: GEMM+Add+Add+FastGeLU\n"
           "                        gemm_reduce: GEMM+Reduce\n"
           "                        gemm_bias_add_reduce: GEMM+Bias+Add+Reduce\n"
           "                        batched_gemm: Batched GEMM\n"
           "                        batched_gemm_reduce: Batched GEMM+Reduce\n"
           "                        grouped_gemm: Grouped GEMM\n"
           "                        conv_fwd: ForwardConvolution\n"
           "                        conv_fwd_bias_relu: ForwardConvolution+Bias+ReLU\n"
           "                        conv_fwd_bias_relu_add: ForwardConvolution+Bias+ReLU+Add\n"
           "                        conv1d_bwd_data: BackwardConvolution data 1 dim\n"
           "                        conv2d_bwd_data: BackwardConvolution data 2 dim\n"
           "                        conv3d_bwd_data: BackwardConvolution data 3 dim\n"
           "                        conv2d_bwd_weight: Backward Weight Convolution 2d\n"
           "                        reduce: Reduce\n"
           "                        batchnorm: BatchNorm\n"
           "                        layernorm: LayerNorm\n"
           "                        softmax: Softmax)\n");
    // clang-format on
}

int main(int argc, char* argv[])
{
51
52
53
54
55
56
57
    if(argc == 1)
    {
        print_helper_message();

        return 0;
    }

58
59
    if(strcmp(argv[1], "gemm") == 0)
    {
Chao Liu's avatar
Chao Liu committed
60
        return profile_gemm(argc, argv);
61
    }
Chao Liu's avatar
Chao Liu committed
62
63
64
65
    else if(strcmp(argv[1], "gemm_splitk") == 0)
    {
        return profile_gemm_splitk(argc, argv);
    }
66
67
68
69
    else if(strcmp(argv[1], "gemm_bias_2d") == 0)
    {
        return profile_gemm_bias_2d(argc, argv);
    }
zjing14's avatar
zjing14 committed
70
    else if(strcmp(argv[1], "gemm_bias_relu") == 0)
Chao Liu's avatar
Chao Liu committed
71
72
73
    {
        return profile_gemm_bias_relu(argc, argv);
    }
zjing14's avatar
zjing14 committed
74
    else if(strcmp(argv[1], "gemm_bias_relu_add") == 0)
Chao Liu's avatar
Chao Liu committed
75
76
77
    {
        return profile_gemm_bias_relu_add(argc, argv);
    }
Chao Liu's avatar
Chao Liu committed
78
79
80
81
    else if(strcmp(argv[1], "gemm_reduce") == 0)
    {
        return profile_gemm_reduce(argc, argv);
    }
82
83
84
85
    else if(strcmp(argv[1], "gemm_bias_add_reduce") == 0)
    {
        return profile_gemm_bias_add_reduce(argc, argv);
    }
zjing14's avatar
zjing14 committed
86
87
88
89
    else if(strcmp(argv[1], "batched_gemm") == 0)
    {
        return profile_batched_gemm(argc, argv);
    }
90
91
92
93
    else if(strcmp(argv[1], "batched_gemm_reduce") == 0)
    {
        return profile_batched_gemm_reduce(argc, argv);
    }
Chao Liu's avatar
Chao Liu committed
94
95
    else if(strcmp(argv[1], "grouped_gemm") == 0)
    {
Chao Liu's avatar
Chao Liu committed
96
        return profile_grouped_gemm(argc, argv);
Chao Liu's avatar
Chao Liu committed
97
    }
Chao Liu's avatar
Chao Liu committed
98
    else if(strcmp(argv[1], "conv_fwd") == 0)
99
    {
Chao Liu's avatar
Chao Liu committed
100
        return profile_convnd_fwd(argc, argv);
Chao Liu's avatar
Chao Liu committed
101
102
103
104
105
106
107
108
109
    }
    else if(strcmp(argv[1], "conv_fwd_bias_relu") == 0)
    {
        return profile_conv_fwd_bias_relu(argc, argv);
    }
    else if(strcmp(argv[1], "conv_fwd_bias_relu_add") == 0)
    {
        return profile_conv_fwd_bias_relu_add(argc, argv);
    }
110
    else if(strcmp(argv[1], "conv1d_bwd_data") == 0)
111
    {
112
113
114
115
116
117
118
119
120
        return profile_convnd_bwd_data(argc, argv, 1);
    }
    else if(strcmp(argv[1], "conv2d_bwd_data") == 0)
    {
        return profile_convnd_bwd_data(argc, argv, 2);
    }
    else if(strcmp(argv[1], "conv3d_bwd_data") == 0)
    {
        return profile_convnd_bwd_data(argc, argv, 3);
121
    }
122
123
124
125
    else if(strcmp(argv[1], "reduce") == 0)
    {
        return profile_reduce(argc, argv);
    }
126
127
128
129
    else if(strcmp(argv[1], "conv2d_bwd_weight") == 0)
    {
        return profile_conv_bwd_weight(argc, argv);
    }
130
131
132
133
    else if(strcmp(argv[1], "gemm_add_add_fastgelu") == 0)
    {
        return profile_gemm_add_add_fastgelu(argc, argv);
    }
134
135
136
137
138
    else if(strcmp(argv[1], "batchnorm") == 0 || strcmp(argv[1], "layernorm") == 0 ||
            strcmp(argv[1], "softmax") == 0)
    {
        return profile_normalization(argc, argv);
    }
139
140
    else
    {
141
142
143
        print_helper_message();

        return 0;
144
    }
145
}