main.cpp 17.8 KB
Newer Older
kahmed10's avatar
kahmed10 committed
1
#include "verify.hpp"
Paul's avatar
Paul committed
2
3
#include "argument_parser.hpp"
#include "command.hpp"
kahmed10's avatar
kahmed10 committed
4
#include "precision.hpp"
Paul's avatar
Paul committed
5
#include "perf.hpp"
6
#include "models.hpp"
7
#include "marker_roctx.hpp"
Paul's avatar
Paul committed
8

Paul's avatar
Paul committed
9
10
11
#include <migraphx/tf.hpp>
#include <migraphx/onnx.hpp>
#include <migraphx/stringutils.hpp>
12
13
#include <migraphx/load_save.hpp>
#include <migraphx/json.hpp>
14
#include <migraphx/version.h>
Paul's avatar
Paul committed
15

16
17
18
#include <migraphx/dead_code_elimination.hpp>
#include <migraphx/eliminate_identity.hpp>
#include <migraphx/eliminate_pad.hpp>
19
20
#include <migraphx/generate.hpp>
#include <migraphx/pass_manager.hpp>
21
#include <migraphx/propagate_constant.hpp>
22
#include <migraphx/quantization.hpp>
23
#include <migraphx/register_op.hpp>
24
#include <migraphx/rewrite_batchnorm.hpp>
25
26
#include <migraphx/simplify_algebra.hpp>
#include <migraphx/simplify_reshapes.hpp>
27
#include <migraphx/register_target.hpp>
28

29
30
#include <fstream>

Paul's avatar
Paul committed
31
32
33
34
35
36
namespace migraphx {
namespace driver {
inline namespace MIGRAPHX_INLINE_NS {

struct loader
{
37
    std::string model;
Paul's avatar
Paul committed
38
    std::string file;
Paul's avatar
Paul committed
39
    std::string file_type;
40
41
42
43
44
    unsigned batch              = 1;
    bool is_nhwc                = true;
    unsigned trim               = 0;
    bool optimize               = false;
    bool skip_unknown_operators = false;
45
46
47
    bool brief                  = false;
    std::string output_type;
    std::string output;
Shucai Xiao's avatar
Shucai Xiao committed
48
    std::vector<std::string> param_dims;
kahmed10's avatar
kahmed10 committed
49
    std::vector<std::string> output_names;
Paul's avatar
Paul committed
50
51
52

    // Registers all loader options (input selection, parsing knobs and output
    // format) on the given argument parser.
    void parse(argument_parser& ap)
    {
        // --- What to load -------------------------------------------------
        ap(file, {}, ap.metavar("<input file>"));
        ap(model,
           {"--model"},
           ap.help("Load model"),
           ap.type("resnet50|inceptionv3|alexnet"));

        // --- How to interpret the input file --------------------------------
        ap(file_type,
           {"--onnx"},
           ap.help("Load as onnx"),
           ap.set_value("onnx"));
        ap(file_type,
           {"--tf"},
           ap.help("Load as tensorflow"),
           ap.set_value("tf"));
        ap(file_type,
           {"--migraphx"},
           ap.help("Load as MIGraphX"),
           ap.set_value("migraphx"));
        ap(file_type,
           {"--migraphx-json"},
           ap.help("Load as MIGraphX JSON"),
           ap.set_value("json"));

        // --- Parser tuning ---------------------------------------------------
        ap(batch,
           {"--batch"},
           ap.help("Set batch size for model"));
        ap(is_nhwc,
           {"--nhwc"},
           ap.help("Treat tensorflow format as nhwc"),
           ap.set_value(true));
        ap(skip_unknown_operators,
           {"--skip-unknown-operators"},
           ap.help("Skip unknown operators when parsing and continue to parse."),
           ap.set_value(true));
        ap(is_nhwc,
           {"--nchw"},
           ap.help("Treat tensorflow format as nchw"),
           ap.set_value(false));
        ap(trim,
           {"--trim", "-t"},
           ap.help("Trim instructions from the end"));
        ap(param_dims,
           {"--input-dim"},
           ap.help("Dim of a parameter (format: \"@name d1 d2 dn\")"),
           ap.append(),
           ap.nargs(2));
        ap(output_names,
           {"--output-names"},
           ap.help("Names of node output (format: \"name_1 name_2 name_n\")"),
           ap.append(),
           ap.nargs(2));
        ap(optimize,
           {"--optimize", "-O"},
           ap.help("Optimize when reading"),
           ap.set_value(true));

        // --- How and where to emit the loaded program -----------------------
        ap(output_type,
           {"--graphviz", "-g"},
           ap.help("Print out a graphviz representation."),
           ap.set_value("graphviz"));
        ap(brief,
           {"--brief"},
           ap.help("Make the output brief."),
           ap.set_value(true));
        ap(output_type,
           {"--cpp"},
           ap.help("Print out the program as cpp program."),
           ap.set_value("cpp"));
        ap(output_type,
           {"--json"},
           ap.help("Print out program as json."),
           ap.set_value("json"));
        ap(output_type,
           {"--text"},
           ap.help("Print out program in text format."),
           ap.set_value("text"));
        ap(output_type,
           {"--binary"},
           ap.help("Print out program in binary format."),
           ap.set_value("binary"));
        ap(output,
           {"--output", "-o"},
           ap.help("Output to file."));
    }

Shucai Xiao's avatar
Shucai Xiao committed
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
    // Converts the flat "--input-dim" token list into a map from parameter
    // name to its dimensions. A token starting with '@' selects the current
    // parameter name (without the '@'); every other token is parsed as one
    // dimension and appended to the entry of the most recently selected name.
    static auto parse_param_dims(const std::vector<std::string>& param_dims_info)
    {
        std::unordered_map<std::string, std::vector<std::size_t>> dims_by_name;
        std::string current;
        for(const auto& token : param_dims_info)
        {
            const bool is_name = not token.empty() and token.front() == '@';
            if(is_name)
            {
                current = token.substr(1);
                continue;
            }
            dims_by_name[current].push_back(value_parser<std::size_t>::apply(token));
        }

        return dims_by_name;
    }

kahmed10's avatar
kahmed10 committed
119
120
121
122
123
124
125
126
127
128
129
    // Runs every "--output-names" token through the string value parser and
    // returns the results in the same order.
    static auto parse_output_names(const std::vector<std::string>& output_names_info)
    {
        std::vector<std::string> names;
        for(const auto& token : output_names_info)
        {
            names.push_back(value_parser<std::string>::apply(token));
        }

        return names;
    }

Paul's avatar
Paul committed
130
    // Builds the program described by the parsed options.
    //
    // When no built-in model is requested the input file is read; its format
    // is taken from `file_type`, or guessed from the file extension when no
    // format flag was given (".onnx" -> onnx, ".pb" -> tf, ".json" -> json,
    // anything else -> migraphx). Otherwise one of the built-in models is
    // instantiated with the requested batch size.
    //
    // Afterwards the last `trim` instructions of the main module are removed
    // (if requested) and the optimization passes are run (if requested).
    //
    // Throws (via MIGRAPHX_THROW) when `model` names an unknown built-in model.
    program load()
    {
        program p;
        if(model.empty())
        {
            auto map_input_dims    = parse_param_dims(param_dims);
            auto output_node_names = parse_output_names(output_names);
            if(file_type.empty())
            {
                // No explicit format flag: fall back to the file extension.
                if(ends_with(file, ".onnx"))
                    file_type = "onnx";
                else if(ends_with(file, ".pb"))
                    file_type = "tf";
                else if(ends_with(file, ".json"))
                    file_type = "json";
                else
                    file_type = "migraphx";
            }
            std::cout << "Reading: " << file << std::endl;
            if(file_type == "onnx")
            {
                onnx_options options;
                options.default_dim_value      = batch;
                options.skip_unknown_operators = skip_unknown_operators;
                options.print_program_on_error = true;
                options.map_input_dims         = map_input_dims;
                p                              = parse_onnx(file, options);
            }
            else if(file_type == "tf")
            {
                p = parse_tf(file, tf_options{is_nhwc, batch, map_input_dims, output_node_names});
            }
            else if(file_type == "json")
            {
                file_options options;
                options.format = "json";
                p              = migraphx::load(file, options);
            }
            else if(file_type == "migraphx")
            {
                p = migraphx::load(file);
            }
        }
        else
        {
            if(model == "resnet50")
                p = resnet50(batch);
            else if(model == "inceptionv3")
                p = inceptionv3(batch);
            else if(model == "alexnet")
                p = alexnet(batch);
            else
                MIGRAPHX_THROW("Unknown model: " + model);
        }
        if(trim > 0)
        {
            auto* mm = p.get_main_module();
            // Never step back past the first instruction: std::prev with a
            // count larger than the sequence length is undefined behaviour,
            // so a too-large --trim value removes everything instead.
            auto available = std::distance(mm->begin(), mm->end());
            auto to_remove = static_cast<decltype(available)>(trim);
            if(to_remove > available)
                to_remove = available;
            auto last = std::prev(mm->end(), to_remove);
            mm->remove_instructions(last, mm->end());
        }
        if(optimize)
        {
            // Each rewriting pass is followed by dead code elimination.
            migraphx::run_passes(*p.get_main_module(),
                                 {
                                     migraphx::rewrite_batchnorm{},
                                     migraphx::eliminate_identity{},
                                     migraphx::dead_code_elimination{},
                                     migraphx::simplify_algebra{},
                                     migraphx::dead_code_elimination{},
                                     migraphx::simplify_reshapes{},
                                     migraphx::dead_code_elimination{},
                                     migraphx::propagate_constant{},
                                     migraphx::dead_code_elimination{},
                                     migraphx::eliminate_pad{},
                                     migraphx::dead_code_elimination{},
                                 });
        }
        return p;
    }
209
210
211
212
213
214

    // Writes the raw bytes of `buffer` to `os` without any formatting.
    static void write(std::ostream& os, const std::vector<char>& buffer)
    {
        const char* bytes = buffer.data();
        const auto count  = static_cast<std::streamsize>(buffer.size());
        os.write(bytes, count);
    }

215
    void save(const program& p) const
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
    {
        auto* os = &std::cout;
        std::ofstream fs;
        if(not output.empty())
        {
            fs.open(output);
            os = &fs;
        }

        std::string type = output_type;
        if(type.empty())
        {
            if(output.empty())
                type = "text";
            else
                type = "binary";
        }

        if(type == "cpp")
            p.print_cpp(*os);
        else if(type == "graphviz")
            p.print_graph(*os, brief);
        else if(type == "text")
            *os << p << std::endl;
        else if(type == "json")
            *os << to_json_string(p.to_value()) << std::endl;
        else if(type == "binary")
            write(*os, save_buffer(p));
    }
Paul's avatar
Paul committed
245
246
};

247
248
249
250
251
252
struct program_params
{
    std::vector<std::string> fill0{};
    std::vector<std::string> fill1{};
    void parse(argument_parser& ap)
    {
Shucai Xiao's avatar
Shucai Xiao committed
253
254
        ap(fill0, {"--fill0"}, ap.help("Fill parameter with 0s"), ap.append(), ap.nargs(2));
        ap(fill1, {"--fill1"}, ap.help("Fill parameter with 1s"), ap.append(), ap.nargs(2));
255
256
    }

257
    auto generate(const program& p, const target& t, bool offload)
258
    {
259
        parameter_map m;
260
261
262
263
        for(auto&& s : fill0)
            m[s] = fill_argument(p.get_parameter_shape(s), 0);
        for(auto&& s : fill1)
            m[s] = fill_argument(p.get_parameter_shape(s), 1);
264
        fill_param_map(m, p, t, offload);
265
266
267
268
        return m;
    }
};

269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
// Command line selection of the target to compile for.
struct compiler_target
{
    // Default target: "gpu" when built with HAVE_GPU, otherwise "cpu".
#ifdef HAVE_GPU
    std::string target_name = "gpu";
#else
    std::string target_name = "cpu";
#endif

    // Registers the mutually overriding --gpu / --cpu / --ref flags.
    void parse(argument_parser& ap)
    {
        ap(target_name,
           {"--gpu"},
           ap.help("Compile on the gpu"),
           ap.set_value("gpu"));
        ap(target_name,
           {"--cpu"},
           ap.help("Compile on the cpu"),
           ap.set_value("cpu"));
        ap(target_name,
           {"--ref"},
           ap.help("Compile on the reference implementation"),
           ap.set_value("ref"));
    }

    // Creates the target object for the currently selected name.
    target get_target() const
    {
        return make_target(target_name);
    }
};

Paul's avatar
Paul committed
290
291
292
struct compiler
{
    loader l;
293
    program_params parameters;
294
    compiler_target ct;
kahmed10's avatar
kahmed10 committed
295
296
297
    bool offload_copy  = false;
    bool fast_math     = true;
    precision quantize = precision::fp32;
298

kahmed10's avatar
kahmed10 committed
299
    std::vector<std::string> fill0;
Paul's avatar
Paul committed
300
    std::vector<std::string> fill1;
Paul's avatar
Paul committed
301
302
    void parse(argument_parser& ap)
    {
Paul's avatar
Paul committed
303
        l.parse(ap);
304
        parameters.parse(ap);
305
        ct.parse(ap);
306
307
308
        ap(offload_copy,
           {"--enable-offload-copy"},
           ap.help("Enable implicit offload copying"),
309
           ap.set_value(true));
kahmed10's avatar
kahmed10 committed
310
311
312
313
        ap(fast_math,
           {"--disable-fast-math"},
           ap.help("Disable fast math optimization"),
           ap.set_value(false));
kahmed10's avatar
kahmed10 committed
314
315
        ap(quantize, {"--fp16"}, ap.help("Quantize for fp16"), ap.set_value(precision::fp16));
        ap(quantize, {"--int8"}, ap.help("Quantize for int8"), ap.set_value(precision::int8));
Paul's avatar
Paul committed
316
317
    }

318
    auto params(const program& p) { return parameters.generate(p, ct.get_target(), offload_copy); }
319
320
321
322

    program compile()
    {
        auto p = l.load();
323
324
325
        // Dont compile if its already been compiled
        if(p.is_compiled())
            return p;
326
        auto t = ct.get_target();
kahmed10's avatar
kahmed10 committed
327
        if(quantize == precision::fp16)
328
329
330
        {
            quantize_fp16(p);
        }
kahmed10's avatar
kahmed10 committed
331
        else if(quantize == precision::int8)
332
        {
333
            quantize_int8(p, t, {params(p)});
334
        }
335
336
        compile_options options;
        options.offload_copy = offload_copy;
kahmed10's avatar
kahmed10 committed
337
        options.fast_math    = fast_math;
338
        p.compile(t, options);
339
        l.save(p);
340
341
        return p;
    }
Paul's avatar
Paul committed
342
343
};

Paul's avatar
Paul committed
344
345
346
// "read" command: loads a program and emits it through the loader's output
// options.
struct read : command<read>
{
    loader l;

    void parse(argument_parser& ap)
    {
        l.parse(ap);
    }

    void run()
    {
        const auto prog = l.load();
        l.save(prog);
    }
};

Paul's avatar
Paul committed
356
357
358
359
360
361
362
363
// "params" command: loads a program and prints one "<name>: <shape>" line
// per program parameter.
struct params : command<params>
{
    loader l;

    void parse(argument_parser& ap)
    {
        l.parse(ap);
    }

    void run()
    {
        auto prog = l.load();
        for(auto&& entry : prog.get_parameter_shapes())
        {
            const auto& name  = entry.first;
            const auto& shape = entry.second;
            std::cout << name << ": " << shape << std::endl;
        }
    }
};

Paul's avatar
Paul committed
369
370
371
// "verify" command: loads a program and runs one of the verification
// routines (per instruction, reduced program, or whole program) on it.
struct verify : command<verify>
{
    loader l;
    program_params parameters;
    compiler_target ct;
    double tolerance     = 80;
    bool per_instruction = false;
    bool reduce          = false;
    bool offload_copy    = false;
    bool fast_math       = true;
    precision quantize   = precision::fp32;

    // Registers the loader, parameter and target options followed by the
    // verification-specific flags.
    void parse(argument_parser& ap)
    {
        l.parse(ap);
        parameters.parse(ap);
        ct.parse(ap);
        ap(offload_copy,
           {"--enable-offload-copy"},
           ap.help("Enable implicit offload copying"),
           ap.set_value(true));
        ap(fast_math,
           {"--disable-fast-math"},
           ap.help("Disable fast math optimization"),
           ap.set_value(false));
        ap(tolerance,
           {"--tolerance"},
           ap.help("Tolerance for errors"));
        ap(per_instruction,
           {"-i", "--per-instruction"},
           ap.help("Verify each instruction"),
           ap.set_value(true));
        ap(reduce,
           {"-r", "--reduce"},
           ap.help("Reduce program and verify"),
           ap.set_value(true));
        ap(quantize,
           {"--fp16"},
           ap.help("Quantize for fp16"),
           ap.set_value(precision::fp16));
    }

    // Loads, saves and prints the program, then dispatches to the selected
    // verification mode. --per-instruction takes precedence over --reduce.
    void run()
    {
        auto prog = l.load();
        l.save(prog);
        std::cout << prog << std::endl;

        compile_options options;
        options.offload_copy = offload_copy;
        options.fast_math    = fast_math;

        auto tgt  = ct.get_target();
        auto pmap = parameters.generate(prog, tgt, true);

        if(per_instruction)
        {
            verify_instructions(prog, tgt, options, quantize, tolerance);
            return;
        }
        if(reduce)
        {
            verify_reduced_program(prog, tgt, options, quantize, pmap, tolerance);
            return;
        }
        verify_program(l.file, prog, tgt, options, quantize, pmap, tolerance);
    }
};

429
430
431
432
433
434
435
436
437
438
// "version" command: prints the MIGraphX major and minor version numbers.
struct version : command<version>
{
    // This command takes no options.
    void parse(const argument_parser&) {}

    void run() const
    {
        std::cout << "MIGraphX Version: ";
        std::cout << MIGRAPHX_VERSION_MAJOR << "." << MIGRAPHX_VERSION_MINOR;
        std::cout << std::endl;
    }
};

Paul's avatar
Paul committed
439
440
441
// "compile" command: announces and runs the shared compiler; the returned
// program is discarded.
struct compile : command<compile>
{
    compiler c;

    void parse(argument_parser& ap)
    {
        c.parse(ap);
    }

    void run()
    {
        std::cout << "Compiling ... " << std::endl;
        c.compile();
    }
};

// Command that compiles a program, evaluates it once with generated
// parameters and then prints the program.
struct run_cmd : command<run_cmd>
{
    compiler c;

    void parse(argument_parser& ap)
    {
        c.parse(ap);
    }

    void run()
    {
        std::cout << "Compiling ... " << std::endl;
        auto prog = c.compile();

        std::cout << "Allocating params ... " << std::endl;
        auto inputs = c.params(prog);

        prog.eval(inputs);
        std::cout << prog << std::endl;
    }
};

Paul's avatar
Paul committed
467
468
469
470
// "perf" command: compiles a program and prints a performance report for it.
struct perf : command<perf>
{
    compiler c;
    // Iteration count passed to perf_report.
    unsigned n = 100;

    void parse(argument_parser& ap)
    {
        c.parse(ap);
        ap(n,
           {"--iterations", "-n"},
           ap.help("Number of iterations to run for perf report"));
    }

    void run()
    {
        std::cout << "Compiling ... " << std::endl;
        auto prog = c.compile();

        std::cout << "Allocating params ... " << std::endl;
        auto inputs = c.params(prog);

        std::cout << "Running performance report ... " << std::endl;
        prog.perf_report(std::cout, n, inputs, c.l.batch);
    }
};

488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
// "roctx" command: compiles a program and calls its mark() with a rocTX
// marker and generated parameters.
struct roctx : command<roctx>
{
    compiler c;

    void parse(argument_parser& ap)
    {
        c.parse(ap);
    }

    void run()
    {
        std::cout << "Compiling ... " << std::endl;
        auto prog = c.compile();

        std::cout << "Allocating params ... " << std::endl;
        auto inputs = c.params(prog);

        std::cout << "rocTX:\tLoading rocTX library..." << std::endl;
        auto marker = create_marker_roctx();
        prog.mark(inputs, std::move(marker));
    }
};

505
506
507
// "op" command: either lists every operator name or prints the JSON form of
// the single operator named on the command line.
struct op : command<op>
{
    bool show_ops = false;
    std::string op_name{};

    void parse(argument_parser& ap)
    {
        ap(op_name, {}, ap.metavar("<MIGraphX operator name>"));
        ap(show_ops,
           {"--list", "-l"},
           ap.help("List all the operators of MIGraphX"),
           ap.set_value(true));
    }

    void run() const
    {
        // --list wins over a named operator.
        if(show_ops)
        {
            for(const auto& registered : get_operators())
            {
                std::cout << registered << std::endl;
            }
            return;
        }

        auto loaded = load_op(op_name);
        std::cout << op_name << ": " << std::endl;
        std::cout << to_pretty_json_string(loaded.to_value()) << std::endl;
    }
};

533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
// "onnx" command: with --list, prints every name returned by
// get_onnx_operators(); otherwise does nothing.
struct onnx : command<onnx>
{
    bool show_ops = false;

    void parse(argument_parser& ap)
    {
        ap(show_ops,
           {"--list", "-l"},
           ap.help("List all onnx operators supported by MIGraphX"),
           ap.set_value(true));
    }

    void run() const
    {
        if(not show_ops)
            return;

        for(const auto& supported : get_onnx_operators())
        {
            std::cout << supported << std::endl;
        }
    }
};

Paul's avatar
Paul committed
553
554
555
556
557
struct main_command
{
    static std::string get_command_help()
    {
        std::string result = "Commands:\n";
Paul's avatar
Paul committed
558
559
560
561
        return std::accumulate(get_commands().begin(),
                               get_commands().end(),
                               result,
                               [](auto r, auto&& p) { return r + "    " + p.first + "\n"; });
Paul's avatar
Paul committed
562
    }
Paul's avatar
Paul committed
563
    void parse(argument_parser& ap)
Paul's avatar
Paul committed
564
    {
565
566
        std::string version_str = "MIGraphX Version: " + std::to_string(MIGRAPHX_VERSION_MAJOR) +
                                  "." + std::to_string(MIGRAPHX_VERSION_MINOR);
Paul's avatar
Paul committed
567
        ap(nullptr, {"-h", "--help"}, ap.help("Show help"), ap.show_help(get_command_help()));
568
569
570
571
        ap(nullptr,
           {"-v", "--version"},
           ap.help("Show MIGraphX version"),
           ap.show_help(version_str));
Paul's avatar
Paul committed
572
573
574
575
576
    }

    void run() {}
};

Paul's avatar
Paul committed
577
578
579
580
} // namespace MIGRAPHX_INLINE_NS
} // namespace driver
} // namespace migraphx

Paul's avatar
Paul committed
581
using namespace migraphx::driver; // NOLINT
Paul's avatar
Paul committed
582
583
int main(int argc, const char* argv[])
{
Paul's avatar
Paul committed
584
    std::vector<std::string> args(argv + 1, argv + argc);
Shucai Xiao's avatar
Shucai Xiao committed
585
586

    // no argument, print the help infomration by default
Paul's avatar
Paul committed
587
    if(args.empty())
Shucai Xiao's avatar
Shucai Xiao committed
588
589
590
591
    {
        args.push_back("-h");
    }

Paul's avatar
Paul committed
592
    auto&& m = get_commands();
Paul's avatar
Paul committed
593
    auto cmd = args.front();
Paul's avatar
Paul committed
594
    if(m.count(cmd) > 0)
Paul's avatar
Paul committed
595
    {
Paul's avatar
Paul committed
596
        m.at(cmd)({args.begin() + 1, args.end()});
Paul's avatar
Paul committed
597
    }
Paul's avatar
Paul committed
598
    else
Paul's avatar
Paul committed
599
    {
Paul's avatar
Paul committed
600
        run_command<main_command>(args);
Paul's avatar
Paul committed
601
    }
Shucai Xiao's avatar
Shucai Xiao committed
602

Paul's avatar
Paul committed
603
604
    return 0;
}