// pack_int8_args.cpp
#include <migraphx/gpu/pack_int8_args.hpp>
#include <migraphx/gpu/int8_gemm_pack.hpp>
#include <migraphx/gpu/hip.hpp>
#include <migraphx/instruction.hpp>
#include <migraphx/program.hpp>
#include <migraphx/iterator_for.hpp>

namespace migraphx {
inline namespace MIGRAPHX_INLINE_NS {
namespace gpu {

// Walks every instruction in `p` and, for each "gpu::quant_gemm" instruction,
// routes its matrix operands through an int8 packing instruction when the
// operand's shape layout calls for it:
//   - second input (B): packed when its shape is NOT transposed;
//   - first input  (A): packed when its shape IS transposed.
// For each packed operand a hip_allocate instruction (using the operand's own
// shape) and a packing instruction are inserted at `ins`, and the gemm's
// argument is replaced by the packing instruction's result.
//
// "gpu::quant_convolution" instructions are recognised but currently left
// untouched.
void pack_int8_args::apply(program& p) const
{
    for(auto ins : iterator_for(p))
    {
        if(ins->name() == "gpu::quant_gemm")
        {
            // `auto` yields a local object, so the operands read below are the
            // ones the gemm had on entry, even after replace_argument is called.
            auto inputs       = ins->inputs();
            const bool transa = inputs[0]->get_shape().transposed();
            const bool transb = inputs[1]->get_shape().transposed();

            // NOTE(review): B is packed with hip_int8_gemm_pack_a and A with
            // hip_int8_gemm_pack_b. This looks deliberate (presumably tied to the
            // operand order/layout expected by the GEMM backend) -- confirm.
            if(!transb)
            {
                auto packed_b = p.insert_instruction(ins, hip_allocate{inputs[1]->get_shape()});
                auto output_b =
                    p.insert_instruction(ins, hip_int8_gemm_pack_a{}, {inputs[1], packed_b});
                instruction::replace_argument(ins, inputs[1], output_b);
            }

            if(transa)
            {
                auto packed_a = p.insert_instruction(ins, hip_allocate{inputs[0]->get_shape()});
                auto output_a =
                    p.insert_instruction(ins, hip_int8_gemm_pack_b{}, {inputs[0], packed_a});
                instruction::replace_argument(ins, inputs[0], output_a);
            }
        }
        else if(ins->name() == "gpu::quant_convolution")
        {
            // Placeholder: no packing is performed for quant_convolution here.
        }
    }
}

} // namespace gpu
} // namespace MIGRAPHX_INLINE_NS
} // namespace migraphx