"driver/include/host_tensor.hpp" did not exist on "fc98757acd68219eebecb16b15ac472172f6dd55"
Commit 96663815 authored by turneram

Formatting

parent 0ccee797
@@ -20,7 +20,7 @@ namespace op {
 struct transposectx
 {
-    int head_size = 64;
+    int head_size    = 64;
     bool reversed_bs = false;

    template <class Self, class F>
@@ -46,9 +46,9 @@ struct transposectx
        // Output: BxSxNxH
        argument result{output_shape};
        visit_all(result, args.front())([&](auto output, const auto input) {
            par_for(output_shape.elements(), [&](auto i) {
                // TODO: calculate in_offset and out_offset
                output[i] = input[i];
            });
        });
...
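The compute body above still copies output[i] = input[i] with the offset TODO unresolved, so it is only correct when the input and output layouts happen to coincide. A minimal sketch of what the offset math could look like, mirroring the non-reversed_bs indexing of the GPU kernel further down (an illustration only, not the committed implementation; the reversed_bs case is omitted):

    // Hypothetical sketch, not the committed code. Mirrors the GPU
    // kernel's default (reversed_bs == false) BxNxSxH -> BxSxNxH mapping.
    visit_all(result, args.front())([&](auto output, const auto input) {
        const auto& lens = output_shape.lens(); // {B, S, N, H}
        const std::size_t S = lens[1], N = lens[2], H = lens[3];
        par_for(output_shape.elements(), [&](auto i) {
            // Decompose the flat BxSxNxH output index i into (b, s, n, h).
            const std::size_t h = i % H;
            const std::size_t n = (i / H) % N;
            const std::size_t s = (i / (H * N)) % S;
            const std::size_t b = i / (H * N * S);
            // Read the same element from the BxNxSxH input layout.
            const std::size_t in_offset = ((b * N + n) * S + s) * H + h;
            output[i] = input[in_offset];
        });
    });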
@@ -20,7 +20,7 @@ namespace op {
 struct transposeqkv
 {
-    int head_size = 64;
+    int head_size    = 64;
     bool reversed_bs = false;

    template <class Self, class F>
@@ -47,9 +47,9 @@ struct transposeqkv
        // K is the number of identical matrices
        argument result{output_shape};
        visit_all(result, args.front())([&](auto output, const auto input) {
            par_for(output_shape.elements(), [&](auto i) {
                // TODO: calculate in_offset and out_offset
                output[i] = input[i];
            });
        });
...
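The transposeqkv reference body carries the same TODO. A corresponding sketch, again assuming the default reversed_bs == false path and the BxSxKxNxH input layout implied by the GPU kernel below (hypothetical, not the committed code):

    // Hypothetical sketch, not the committed code. Input read as
    // BxSxKxNxH, output written as KxBxNxSxH.
    visit_all(result, args.front())([&](auto output, const auto input) {
        const auto& lens = output_shape.lens(); // {K, B, N, S, H}
        const std::size_t K = lens[0];
        const std::size_t B = lens[1], N = lens[2], S = lens[3], H = lens[4];
        par_for(output_shape.elements(), [&](auto i) {
            // Decompose the flat KxBxNxSxH output index i into (k, b, n, s, h).
            const std::size_t h = i % H;
            const std::size_t s = (i / H) % S;
            const std::size_t n = (i / (H * S)) % N;
            const std::size_t b = (i / (H * S * N)) % B;
            const std::size_t k = i / (H * S * N * B);
            // Read the same element from the BxSxKxNxH input layout.
            const std::size_t in_offset = (((b * S + s) * K + k) * N + n) * H + h;
            output[i] = input[in_offset];
        });
    });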
@@ -162,8 +162,8 @@ struct parse_attention : op_parser<parse_attention>
        auto gemm4 = info.add_instruction(migraphx::make_op("dot"), softmax, v_t);
        // scratch3 is BxNxSxH, transpose to output BxSxNxH
-       gemm4 = info.add_instruction(
-           migraphx::make_op("transposectx", {{"head_size", head_size}}), gemm4);
+       gemm4 = info.add_instruction(migraphx::make_op("transposectx", {{"head_size", head_size}}),
+                                    gemm4);
        gemm4 = info.add_instruction(
            make_op("reshape", {{"dims", {batch_size, sequence_length, num_heads * head_size}}}),
            info.make_contiguous(gemm4));
...
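For context, the shape flow through this dot -> transposectx -> reshape sequence, using the dimensions from the verify tests below (B=1, N=12, S=128, H=64; the softmax and v_t shapes are the usual attention shapes and are assumed here for illustration):

    // dot:          softmax (1x12x128x128) x v_t (1x12x128x64) -> 1x12x128x64   (BxNxSxH)
    // transposectx: 1x12x128x64 -> 1x128x12x64                                  (BxSxNxH)
    // reshape:      1x128x12x64 -> {1, 128, 12 * 64} = {1, 128, 768}            (BxSx(N*H))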
@@ -89,7 +89,6 @@ __global__ void transposeqkv_kernel(void* input_p, void* output_p)
} // namespace migraphx
)__migraphx__";
-
struct transposeqkv_compiler : compiler<transposeqkv_compiler>
{
    std::vector<std::string> names() const { return {"transposeqkv"}; }
@@ -121,7 +120,6 @@ struct transposeqkv_compiler : compiler<transposeqkv_compiler>
    }
};
-
} // namespace gpu
} // namespace MIGRAPHX_INLINE_NS
} // namespace migraphx
@@ -25,32 +25,35 @@ __device__ void transposectx(const T& input_t, const U& output_t, Settings st)
    // Input: BxNxSxH
    // Output: BxSxNxH
    auto head_size = st.head_size;
    auto reversed_bs = st.reversed_bs;
    int n = threadIdx.y;
    int s = blockIdx.x;
    int b = blockIdx.y;
    int num_heads = blockDim.y;
    int sequence_length = gridDim.x;
    const int NH = num_heads * head_size;
    const int NHS = NH * sequence_length;
    const int in_offset = s * head_size + n * sequence_length * head_size + b * NHS;
    int out_offset = 0;
-   if (reversed_bs) {
+   if(reversed_bs)
+   {
        const int batch_size = gridDim.y;
        const int BNH = NH * batch_size;
        out_offset = n * head_size + b * NH + s * BNH;
-   } else {
+   }
+   else
+   {
        out_offset = n * head_size + s * NH + b * NHS;
    }
    const int i = threadIdx.x;
-   if (i < head_size) {
+   if(i < head_size)
+   {
        output_t[out_offset + i] = input_t[in_offset + i];
    }
}
...
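As a sanity check on the kernel's indexing, with the dimensions from the transposectx verify test below (B=1, N=12, S=128, H=64, assumed here) and the non-reversed_bs path:

    // One element, (b=0, n=2, s=5, h=7):
    //   NH  = 12 * 64   = 768
    //   NHS = 768 * 128 = 98304
    //   in_offset  = 5*64 + 2*128*64 + 0*98304 = 16704  // start of row (0,2,5,.) in BxNxSxH
    //   out_offset = 2*64 + 5*768    + 0*98304 = 3968   // start of row (0,5,2,.) in BxSxNxH
    // Thread h=7 copies input[16704 + 7] to output[3968 + 7]: flat index 16711
    // of the BxNxSxH input lands at flat index 3975 of the BxSxNxH output,
    // which is exactly the transpose of the N and S axes.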
@@ -26,33 +26,37 @@ __device__ void transposeqkv(const T& input_t, const U& output_t, Settings st)
    // Output: KxBxNxSxH
    // K is the number of identical matrices
    auto H = st.head_size;
    auto reversed_bs = st.reversed_bs;
    int n = threadIdx.y;
    int s = blockIdx.x;
    int b = blockIdx.y;
    int m = blockIdx.z; // matrix id
    const int num_heads = blockDim.y;
    const int sequence_length = gridDim.x;
    const int batch_size = gridDim.y;
    const int chunk_num = gridDim.z;
    const int NH = num_heads * H;
    const int NHS = NH * sequence_length;
    int in_offset = 0;
-   if (reversed_bs) {
+   if(reversed_bs)
+   {
        const int BNH = NH * batch_size;
        in_offset = n * H + (m + b * chunk_num) * NH + s * BNH * chunk_num;
-   } else {
+   }
+   else
+   {
        in_offset = n * H + (m + s * chunk_num) * NH + b * NHS * chunk_num;
    }
    const int out_offset = s * H + n * sequence_length * H + b * NHS + m * NHS * batch_size;
    const int i = threadIdx.x;
-   if (i < H) {
+   if(i < H)
+   {
        output_t[out_offset + i] = input_t[in_offset + i];
    }
}
...
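A similar check for transposeqkv. The in_offset formula implies a BxSxKxNxH input, which matches the {1, 1, 3, 12, 64} parameter in the verify test below; here hypothetical dimensions B=1, S=2, K=3 (chunk_num), N=12, H=64 are used so that the batch and sequence strides stay distinguishable:

    // Element (m=2, b=0, n=1, s=1, h=0), non-reversed_bs path:
    //   NH  = 12 * 64 = 768
    //   NHS = 768 * 2 = 1536
    //   in_offset  = 1*64 + (2 + 1*3)*768 + 0*1536*3     = 3904  // (b=0, s=1, k=2, n=1) in BxSxKxNxH
    //   out_offset = 1*64 + 1*2*64 + 0*1536 + 2*1536*1   = 3264  // (k=2, b=0, n=1, s=1) in KxBxNxSxH
    // So the kernel de-interleaves the fused QKV tensor: chunk m of each
    // (batch, sequence) slice is gathered into the m-th KxBxNxSxH matrix.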
@@ -10,7 +10,8 @@ struct test_transposectx : verify_program<test_transposectx>
    {
        migraphx::program p;
        auto* mm = p.get_main_module();
-       auto x = mm->add_parameter("x", migraphx::shape{migraphx::shape::float_type, {1, 12, 128, 64}});
+       auto x =
+           mm->add_parameter("x", migraphx::shape{migraphx::shape::float_type, {1, 12, 128, 64}});
        mm->add_instruction(migraphx::make_op("transposectx", {{"head_size", 64}}), x);
        p.debug_print();
        return p;
...
@@ -9,7 +9,8 @@ struct test_transposeqkv : verify_program<test_transposeqkv>
    {
        migraphx::program p;
        auto* mm = p.get_main_module();
-       auto x = mm->add_parameter("x", migraphx::shape{migraphx::shape::float_type, {1, 1, 3, 12, 64}});
+       auto x =
+           mm->add_parameter("x", migraphx::shape{migraphx::shape::float_type, {1, 1, 3, 12, 64}});
        mm->add_instruction(migraphx::make_op("transposeqkv", {{"head_size", 64}}), x);
        p.debug_print();
        return p;
...