utility.h 3.5 KB
Newer Older
littletomatodonkey's avatar
littletomatodonkey 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28
// Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#pragma once

#include <chrono>
#include <iomanip>
#include <iostream>
#include <ostream>
#include <stdlib.h>
#include <vector>

#include <algorithm>
#include <cstring>
#include <fstream>
#include <numeric>

littletomatodonkey's avatar
littletomatodonkey 已提交
29 30 31 32
#include "opencv2/core.hpp"
#include "opencv2/imgcodecs.hpp"
#include "opencv2/imgproc.hpp"

littletomatodonkey's avatar
littletomatodonkey 已提交
33 34
namespace PaddleOCR {

35 36 37 38 39 40 41 42
/// Per-region OCR result record.
///
/// Every scalar member has a default member initializer so that a
/// default-constructed result never exposes an indeterminate value.
struct OCRPredictResult {
  /// Region outline as a list of integer points. Utility::comparison_box
  /// orders results by box[0][1] and then box[0][0].
  /// NOTE(review): presumably four [x, y] corner points -- confirm against
  /// the code that fills this in.
  std::vector<std::vector<int>> box;
  /// Text attached to the region (presumably the recognizer output).
  std::string text;
  /// Score attached to `text`; defaults to -1.
  float score = -1.0f;
  /// Score attached to `cls_label`; defaults to -1 like the other members
  /// (it previously had no initializer and was indeterminate until assigned).
  float cls_score = -1.0f;
  /// Label produced by the classifier stage; defaults to -1.
  int cls_label = -1;
};

文幕地方's avatar
文幕地方 已提交
43
/// Per-region result record for the structure (layout / table) pipeline.
///
/// Both scalar members have default member initializers so that a
/// default-constructed result never exposes an indeterminate value.
struct StructurePredictResult {
  /// Bounding box of the region as floats.
  /// NOTE(review): presumably [x1, y1, x2, y2] -- confirm against the
  /// producer of this struct.
  std::vector<float> box;
  /// Integer boxes of the cells found inside the region (one inner vector per
  /// cell). NOTE(review): coordinate layout is not visible here -- confirm.
  std::vector<std::vector<int>> cell_box;
  /// Type label of the region.
  std::string type;
  /// OCR results that belong to this region.
  std::vector<OCRPredictResult> text_res;
  /// HTML string attached to the region (presumably the reconstructed table).
  std::string html;
  /// Score attached to `html`; defaults to -1.
  float html_score = -1.0f;
  /// Confidence attached to the region; defaults to -1 like `html_score`
  /// (it previously had no initializer and was indeterminate until assigned).
  float confidence = -1.0f;
};

littletomatodonkey's avatar
littletomatodonkey 已提交
53 54
class Utility {
public:
M
revert  
MissPenguin 已提交
55 56
  static std::vector<std::string> ReadDict(const std::string &path);

57 58 59
  static void VisualizeBboxes(const cv::Mat &srcimg,
                              const std::vector<OCRPredictResult> &ocr_result,
                              const std::string &save_path);
littletomatodonkey's avatar
littletomatodonkey 已提交
60

文幕地方's avatar
文幕地方 已提交
61
  static void VisualizeBboxes(const cv::Mat &srcimg,
文幕地方's avatar
fix bug  
文幕地方 已提交
62
                              const StructurePredictResult &structure_result,
文幕地方's avatar
文幕地方 已提交
63 64
                              const std::string &save_path);

littletomatodonkey's avatar
littletomatodonkey 已提交
65 66 67 68
  template <class ForwardIterator>
  inline static size_t argmax(ForwardIterator first, ForwardIterator last) {
    return std::distance(first, std::max_element(first, last));
  }
L
LDOUBLEV 已提交
69 70

  static void GetAllFiles(const char *dir_name,
M
revert  
MissPenguin 已提交
71
                          std::vector<std::string> &all_inputs);
文幕地方's avatar
文幕地方 已提交
72

M
MissPenguin 已提交
73
  static cv::Mat GetRotateCropImage(const cv::Mat &srcimage,
文幕地方's avatar
文幕地方 已提交
74 75 76
                                    std::vector<std::vector<int>> box);

  static std::vector<int> argsort(const std::vector<float> &array);
M
MissPenguin 已提交
77

文幕地方's avatar
文幕地方 已提交
78
  static std::string basename(const std::string &filename);
79 80 81

  static bool PathExists(const std::string &path);

文幕地方's avatar
文幕地方 已提交
82 83
  static void CreateDir(const std::string &path);

84
  static void print_result(const std::vector<OCRPredictResult> &ocr_result);
文幕地方's avatar
文幕地方 已提交
85

文幕地方's avatar
fix bug  
文幕地方 已提交
86 87
  static cv::Mat crop_image(cv::Mat &img, const std::vector<int> &area);
  static cv::Mat crop_image(cv::Mat &img, const std::vector<float> &area);
文幕地方's avatar
文幕地方 已提交
88 89 90

  static void sorted_boxes(std::vector<OCRPredictResult> &ocr_result);

文幕地方's avatar
文幕地方 已提交
91 92 93
  static std::vector<int> xyxyxyxy2xyxy(std::vector<std::vector<int>> &box);
  static std::vector<int> xyxyxyxy2xyxy(std::vector<int> &box);

文幕地方's avatar
文幕地方 已提交
94 95 96 97 98 99
  static float fast_exp(float x);
  static std::vector<float>
  activation_function_softmax(std::vector<float> &src);
  static float iou(std::vector<int> &box1, std::vector<int> &box2);
  static float iou(std::vector<float> &box1, std::vector<float> &box2);

文幕地方's avatar
文幕地方 已提交
100 101 102 103 104 105 106 107 108 109 110
private:
  static bool comparison_box(const OCRPredictResult &result1,
                             const OCRPredictResult &result2) {
    if (result1.box[0][1] < result2.box[0][1]) {
      return true;
    } else if (result1.box[0][1] == result2.box[0][1]) {
      return result1.box[0][0] < result2.box[0][0];
    } else {
      return false;
    }
  }
littletomatodonkey's avatar
littletomatodonkey 已提交
111 112 113
};

} // namespace PaddleOCR