// pack_int8_args.cpp
#include <migraphx/gpu/pack_int8_args.hpp>
#include <migraphx/gpu/int8_gemm_pack.hpp>
#include <migraphx/gpu/int8_conv_pack.hpp>
#include <migraphx/gpu/hip.hpp>
#include <migraphx/instruction.hpp>
#include <migraphx/program.hpp>
#include <migraphx/iterator_for.hpp>

namespace migraphx {
inline namespace MIGRAPHX_INLINE_NS {
namespace gpu {

// Rewrites int8 GEMM and convolution instructions in `p` so that their inputs are routed
// through explicit pack instructions.
//
// For every "gpu::quant_gemm" instruction:
//   - if the shape of input 1 is NOT transposed, input 1 is replaced by the result of a
//     hip_int8_gemm_pack_a instruction;
//   - if the shape of input 0 IS transposed, input 0 is replaced by the result of a
//     hip_int8_gemm_pack_b instruction.
// For every "gpu::quant_convolution" instruction, inputs 0 and 1 are each replaced by the
// result of a miopen_int8_conv_pack instruction whose output buffer is shaped by
// pack_int8_shape().
//
// Every pack instruction, together with the hip_allocate instruction providing its output
// buffer, is added with p.insert_instruction(ins, ...), i.e. positioned relative to the
// instruction being rewritten. All other instructions are left untouched.
void pack_int8_args::apply(program& p) const
{
    for(auto ins : iterator_for(p))
    {
        // Evaluate the name once; it is compared against both supported operators.
        const auto op_name = ins->name();

        if(op_name == "gpu::quant_gemm")
        {
            // Snapshot the argument list up front so the indices below keep referring to the
            // original inputs even after replace_argument() has rewired the instruction.
            auto inputs = ins->inputs();
            bool transa = inputs[0]->get_shape().transposed();
            bool transb = inputs[1]->get_shape().transposed();

            // NOTE(review): input 1 is packed with the *_pack_a operator and input 0 with the
            // *_pack_b operator. Presumably this is intentional and follows the operand order
            // expected by the GEMM backend -- confirm before "fixing" the naming.
            if(!transb)
            {
                auto packed_b = p.insert_instruction(ins, hip_allocate{inputs[1]->get_shape()});
                auto output_b =
                    p.insert_instruction(ins, hip_int8_gemm_pack_a{}, {inputs[1], packed_b});
                instruction::replace_argument(ins, inputs[1], output_b);
            }

            if(transa)
            {
                auto packed_a = p.insert_instruction(ins, hip_allocate{inputs[0]->get_shape()});
                auto output_a =
                    p.insert_instruction(ins, hip_int8_gemm_pack_b{}, {inputs[0], packed_a});
                instruction::replace_argument(ins, inputs[0], output_a);
            }
        }
        else if(op_name == "gpu::quant_convolution")
        {
            auto inputs = ins->inputs();

            // Input 0: allocate a buffer with the padded shape, pack into it, then rewire.
            auto packed_x =
                p.insert_instruction(ins, hip_allocate{pack_int8_shape(inputs[0]->get_shape())});
            auto output_x =
                p.insert_instruction(ins, miopen_int8_conv_pack{}, {inputs[0], packed_x});
            instruction::replace_argument(ins, inputs[0], output_x);

            // Input 1: same treatment as input 0.
            auto packed_w =
                p.insert_instruction(ins, hip_allocate{pack_int8_shape(inputs[1]->get_shape())});
            auto output_w =
                p.insert_instruction(ins, miopen_int8_conv_pack{}, {inputs[1], packed_w});
            instruction::replace_argument(ins, inputs[1], output_w);
        }
    }
}

// Computes the shape of the buffer that receives a packed int8 tensor.
//
// The result has the same element type as `s`. Its length in dimension 1 is the length of
// `s` in dimension 1 rounded up to the next multiple of 4, and its stride in dimension 0 is
// recomputed as strides[1] * (padded lens[1]). Every other length and stride is copied from
// `s` unchanged.
//
// Raises an error through MIGRAPHX_THROW when `s` is not of int8_type, or when it has fewer
// than two dimensions (dimension 1 would not exist).
shape pack_int8_args::pack_int8_shape(const shape& s) const
{
    if(s.type() != shape::int8_type)
    {
        MIGRAPHX_THROW("PACK_INT8_ARGS: only process int8_type");
    }

    auto lens    = s.lens();
    auto strides = s.strides();

    // Indices 0 and 1 are accessed below; reject lower-rank shapes instead of reading and
    // writing out of bounds.
    if(lens.size() < 2 || strides.size() < 2)
    {
        MIGRAPHX_THROW("PACK_INT8_ARGS: shape must have at least 2 dimensions");
    }

    // Round dimension 1 up to a multiple of 4, then widen the outermost stride to match.
    lens[1]    = (lens[1] + 3) / 4 * 4;
    strides[0] = strides[1] * lens[1];

    return {s.type(), lens, strides};
}

} // namespace gpu
} // namespace MIGRAPHX_INLINE_NS
} // namespace migraphx