// Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#pragma once

#include <stdlib.h>

#include <algorithm>
#include <chrono>
#include <cstddef>
#include <cstring>
#include <fstream>
#include <iomanip>
#include <iostream>
#include <iterator>
#include <numeric>
#include <ostream>
#include <string>
#include <vector>

#include "opencv2/core.hpp"
#include "opencv2/imgcodecs.hpp"
#include "opencv2/imgproc.hpp"

namespace migraphxSamples
{

/**
 * Result record for a single OCR text instance.
 *
 * Every numeric field carries a negative sentinel by default, so a
 * default-constructed record never exposes an indeterminate value.
 */
struct OCRPredictResult
{
    /// Box points. Utility::comparison_box reads box[0][0] and box[0][1], so a
    /// populated box must hold at least one point with two coordinates.
    /// NOTE(review): presumably four (x, y) corner points - confirm with the detector.
    std::vector<std::vector<int>> box;

    /// Text attached to this box (empty by default).
    std::string text;

    /// Score associated with `text`; -1 until set.
    float score = -1.0f;

    /// Score associated with `cls_label`; -1 until set.
    /// Initialized explicitly: it was previously left indeterminate.
    float cls_score = -1.0f;

    /// Classifier label; -1 until set.
    int cls_label = -1;
};

liucong's avatar
liucong committed
45
46
47
48
49
50
51
52
53
struct StructurePredictResult
{
    std::vector<float> box;
    std::vector<std::vector<int>> cell_box;
    std::string type;
    std::vector<OCRPredictResult> text_res;
    std::string html;
    float html_score = -1;
    float confidence;
Your Name's avatar
Your Name committed
54
55
};

liucong's avatar
liucong committed
56
57
58
59
class Utility
{
    public:
    static std::vector<std::string> ReadDict(const std::string& path);
Your Name's avatar
Your Name committed
60

liucong's avatar
liucong committed
61
62
63
    static void VisualizeBboxes(const cv::Mat& srcimg,
                                const std::vector<OCRPredictResult>& ocr_result,
                                const std::string& save_path);
Your Name's avatar
Your Name committed
64

liucong's avatar
liucong committed
65
66
67
    static void VisualizeBboxes(const cv::Mat& srcimg,
                                const StructurePredictResult& structure_result,
                                const std::string& save_path);
Your Name's avatar
Your Name committed
68

liucong's avatar
liucong committed
69
70
71
72
73
    template <class ForwardIterator>
    inline static size_t argmax(ForwardIterator first, ForwardIterator last)
    {
        return std::distance(first, std::max_element(first, last));
    }
Your Name's avatar
Your Name committed
74

liucong's avatar
liucong committed
75
    static void GetAllFiles(const char* dir_name, std::vector<std::string>& all_inputs);
Your Name's avatar
Your Name committed
76

liucong's avatar
liucong committed
77
    static cv::Mat GetRotateCropImage(const cv::Mat& srcimage, std::vector<std::vector<int>> box);
Your Name's avatar
Your Name committed
78

liucong's avatar
liucong committed
79
    static std::vector<int> argsort(const std::vector<float>& array);
Your Name's avatar
Your Name committed
80

liucong's avatar
liucong committed
81
    static std::string basename(const std::string& filename);
Your Name's avatar
Your Name committed
82

liucong's avatar
liucong committed
83
    static bool PathExists(const std::string& path);
Your Name's avatar
Your Name committed
84

liucong's avatar
liucong committed
85
    static void CreateDir(const std::string& path);
Your Name's avatar
Your Name committed
86

liucong's avatar
liucong committed
87
    static void print_result(const std::vector<OCRPredictResult>& ocr_result);
Your Name's avatar
Your Name committed
88

liucong's avatar
liucong committed
89
90
    static cv::Mat crop_image(cv::Mat& img, const std::vector<int>& area);
    static cv::Mat crop_image(cv::Mat& img, const std::vector<float>& area);
Your Name's avatar
Your Name committed
91

liucong's avatar
liucong committed
92
    static void sorted_boxes(std::vector<OCRPredictResult>& ocr_result);
Your Name's avatar
Your Name committed
93

liucong's avatar
liucong committed
94
95
    static std::vector<int> xyxyxyxy2xyxy(std::vector<std::vector<int>>& box);
    static std::vector<int> xyxyxyxy2xyxy(std::vector<int>& box);
Your Name's avatar
Your Name committed
96

liucong's avatar
liucong committed
97
98
99
100
    static float fast_exp(float x);
    static std::vector<float> activation_function_softmax(std::vector<float>& src);
    static float iou(std::vector<int>& box1, std::vector<int>& box2);
    static float iou(std::vector<float>& box1, std::vector<float>& box2);
Your Name's avatar
Your Name committed
101

liucong's avatar
liucong committed
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
    private:
    static bool comparison_box(const OCRPredictResult& result1, const OCRPredictResult& result2)
    {
        if(result1.box[0][1] < result2.box[0][1])
        {
            return true;
        }
        else if(result1.box[0][1] == result2.box[0][1])
        {
            return result1.box[0][0] < result2.box[0][0];
        }
        else
        {
            return false;
        }
Your Name's avatar
Your Name committed
117
118
119
120
    }
};

} // namespace migraphxSamples