// SPDX-License-Identifier: MIT
// Copyright (c) 2018-2022, Advanced Micro Devices, Inc. All rights reserved.

#include <cstdio>
#include <cstdlib>
#include <cstring>

// Forward declarations of the per-operation profiler entry points. They are
// defined outside this file; main() forwards its own argc/argv to whichever
// one matches the requested operation.

// GEMM family
int profile_gemm(int argc, char* argv[]);
int profile_gemm_splitk(int argc, char* argv[]);
int profile_gemm_bilinear(int argc, char* argv[]);
int profile_gemm_add_add_fastgelu(int argc, char* argv[]);
int profile_gemm_reduce(int argc, char* argv[]);
int profile_gemm_bias_add_reduce(int argc, char* argv[]);
int profile_batched_gemm(int argc, char* argv[]);
int profile_batched_gemm_reduce(int argc, char* argv[]);
int profile_grouped_gemm(int argc, char* argv[]);

// Convolution family
int profile_conv_fwd(int argc, char* argv[]);
int profile_conv_fwd_bias_relu(int argc, char* argv[]);
int profile_conv_fwd_bias_relu_add(int argc, char* argv[]);
// Disabled: the matching dispatch branch in main() is compiled out with #if 0.
// int profile_conv_bwd_data(int argc, char* argv[]);
int profile_conv_bwd_weight(int argc, char* argv[]);

// Normalization and reduction
int profile_normalization(int argc, char* argv[]);
int profile_reduce(int argc, char* argv[]);

// Prints to stdout the operation names that main() accepts as the first
// command-line argument, one "name: description" pair per line.
//
// The list is kept in step with the dispatcher in main():
//  - conv_bwd_data is not listed because its dispatch branch is disabled;
//  - batchnorm, layernorm and softmax are listed because main() accepts them.
static void print_helper_message()
{
    // clang-format off
    printf("arg1: tensor operation (gemm: GEMM\n"
           "                        gemm_splitk: Split-K GEMM\n"
           "                        gemm_bilinear: GEMM+Bilinear\n"
           "                        gemm_add_add_fastgelu: GEMM+Add+Add+FastGeLU\n"
           "                        gemm_reduce: GEMM+Reduce\n"
           "                        gemm_bias_add_reduce: GEMM+Bias+Add+Reduce\n"
           "                        batched_gemm: Batched GEMM\n"
           "                        batched_gemm_reduce: Batched GEMM+Reduce\n"
           "                        grouped_gemm: Grouped GEMM\n"
           "                        conv_fwd: Convolution Forward\n"
           "                        conv_fwd_bias_relu: ForwardConvolution+Bias+ReLU\n"
           "                        conv_fwd_bias_relu_add: ForwardConvolution+Bias+ReLU+Add\n"
           "                        conv_bwd_weight: Convolution Backward Weight\n"
           "                        reduce: Reduce\n"
           "                        batchnorm: Batch Normalization\n"
           "                        layernorm: Layer Normalization\n"
           "                        softmax: Softmax)\n"); // ')' closes the list opened after "tensor operation"
    // clang-format on
}

int main(int argc, char* argv[])
{
46
47
48
49
50
51
52
    if(argc == 1)
    {
        print_helper_message();

        return 0;
    }

53
54
    if(strcmp(argv[1], "gemm") == 0)
    {
Chao Liu's avatar
Chao Liu committed
55
        return profile_gemm(argc, argv);
56
    }
Chao Liu's avatar
Chao Liu committed
57
58
59
60
    else if(strcmp(argv[1], "gemm_splitk") == 0)
    {
        return profile_gemm_splitk(argc, argv);
    }
Chao Liu's avatar
Chao Liu committed
61
    else if(strcmp(argv[1], "gemm_bilinear") == 0)
Chao Liu's avatar
Chao Liu committed
62
    {
Chao Liu's avatar
Chao Liu committed
63
        return profile_gemm_bilinear(argc, argv);
Chao Liu's avatar
Chao Liu committed
64
    }
Chao Liu's avatar
Chao Liu committed
65
    else if(strcmp(argv[1], "gemm_add_add_fastgelu") == 0)
Chao Liu's avatar
Chao Liu committed
66
    {
Chao Liu's avatar
Chao Liu committed
67
        return profile_gemm_add_add_fastgelu(argc, argv);
Chao Liu's avatar
Chao Liu committed
68
    }
Chao Liu's avatar
Chao Liu committed
69
70
71
72
    else if(strcmp(argv[1], "gemm_reduce") == 0)
    {
        return profile_gemm_reduce(argc, argv);
    }
73
74
75
76
    else if(strcmp(argv[1], "gemm_bias_add_reduce") == 0)
    {
        return profile_gemm_bias_add_reduce(argc, argv);
    }
zjing14's avatar
zjing14 committed
77
78
79
80
    else if(strcmp(argv[1], "batched_gemm") == 0)
    {
        return profile_batched_gemm(argc, argv);
    }
81
82
83
84
    else if(strcmp(argv[1], "batched_gemm_reduce") == 0)
    {
        return profile_batched_gemm_reduce(argc, argv);
    }
Chao Liu's avatar
Chao Liu committed
85
86
    else if(strcmp(argv[1], "grouped_gemm") == 0)
    {
Chao Liu's avatar
Chao Liu committed
87
        return profile_grouped_gemm(argc, argv);
Chao Liu's avatar
Chao Liu committed
88
    }
Chao Liu's avatar
Chao Liu committed
89
    else if(strcmp(argv[1], "conv_fwd") == 0)
90
    {
Chao Liu's avatar
Chao Liu committed
91
        return profile_conv_fwd(argc, argv);
Chao Liu's avatar
Chao Liu committed
92
93
94
95
96
97
98
99
100
    }
    else if(strcmp(argv[1], "conv_fwd_bias_relu") == 0)
    {
        return profile_conv_fwd_bias_relu(argc, argv);
    }
    else if(strcmp(argv[1], "conv_fwd_bias_relu_add") == 0)
    {
        return profile_conv_fwd_bias_relu_add(argc, argv);
    }
Chao Liu's avatar
Chao Liu committed
101
#if 0
102
    else if(strcmp(argv[1], "conv_bwd_data") == 0)
103
    {
104
        return profile_conv_bwd_data(argc, argv);
105
    }
Chao Liu's avatar
Chao Liu committed
106
#endif
107
    else if(strcmp(argv[1], "conv_bwd_weight") == 0)
108
109
110
    {
        return profile_conv_bwd_weight(argc, argv);
    }
Chao Liu's avatar
Chao Liu committed
111
    else if(strcmp(argv[1], "reduce") == 0)
112
    {
Chao Liu's avatar
Chao Liu committed
113
        return profile_reduce(argc, argv);
114
    }
115
116
117
118
119
    else if(strcmp(argv[1], "batchnorm") == 0 || strcmp(argv[1], "layernorm") == 0 ||
            strcmp(argv[1], "softmax") == 0)
    {
        return profile_normalization(argc, argv);
    }
120
121
    else
    {
122
123
124
        print_helper_message();

        return 0;
125
    }
126
}