transforms.h 7.1 KB
Newer Older
C
Channingss 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23
//   Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#pragma once

#include <yaml-cpp/yaml.h>

#include <memory>
#include <string>
#include <unordered_map>
#include <utility>
#include <vector>
S
syyxsxx 已提交
24
#include <iostream>
C
Channingss 已提交
25 26 27 28 29 30 31

#include <opencv2/core/core.hpp>
#include <opencv2/highgui/highgui.hpp>
#include <opencv2/imgproc/imgproc.hpp>

namespace PaddleX {

J
jack 已提交
32 33 34 35
/*
 * @brief
 * This class represents object for storing all preprocessed data
 * */
C
Channingss 已提交
36 37 38 39 40 41 42
class ImageBlob {
 public:
  // Original image height and width
  std::vector<int> ori_im_size_ = std::vector<int>(2);
  // Newest image height and width after process
  std::vector<int> new_im_size_ = std::vector<int>(2);
  // Image height and width before resize
C
Channingss 已提交
43
  std::vector<std::vector<int>> im_size_before_resize_;
C
Channingss 已提交
44 45 46 47 48 49 50 51 52 53 54 55 56 57
  // Reshape order
  std::vector<std::string> reshape_order_;
  // Resize scale
  float scale = 1.0;
  // Buffer for image data after preprocessing
  std::vector<float> im_data_;

  void clear() {
    im_size_before_resize_.clear();
    reshape_order_.clear();
    im_data_.clear();
  }
};

J
jack 已提交
58 59 60 61
/*
 * @brief
 * Abstraction of preprocessing operation class
 * */
C
Channingss 已提交
62 63 64
class Transform {
 public:
  virtual void Init(const YAML::Node& item) = 0;
J
jack 已提交
65 66 67 68 69
  /*
   * @brief
   * This method executes preprocessing operation on image matrix,
   * result will be returned at second parameter.
   * @param im: single image matrix to be preprocessed
J
jack 已提交
70
   * @param data: the raw data of single image matrix after preprocessed
J
jack 已提交
71 72
   * @return true if transform successfully
   * */
C
Channingss 已提交
73 74 75
  virtual bool Run(cv::Mat* im, ImageBlob* data) = 0;
};

J
jack 已提交
76 77 78 79
/*
 * @brief
 * This class execute normalization operation on image matrix
 * */
C
Channingss 已提交
80 81 82 83 84 85 86 87 88 89 90 91 92 93
class Normalize : public Transform {
 public:
  virtual void Init(const YAML::Node& item) {
    mean_ = item["mean"].as<std::vector<float>>();
    std_ = item["std"].as<std::vector<float>>();
  }

  virtual bool Run(cv::Mat* im, ImageBlob* data);

 private:
  std::vector<float> mean_;
  std::vector<float> std_;
};

J
jack 已提交
94 95
/*
 * @brief
J
jack 已提交
96
 * This class execute resize by short operation on image matrix. At first, it resizes
J
jack 已提交
97 98
 * the short side of image matrix to specified length. Accordingly, the long side
 * will be resized in the same proportion. If new length of long side exceeds max
J
jack 已提交
99
 * size, the long size will be resized to max size, and the short size will be
J
jack 已提交
100 101
 * resized in the same proportion
 * */
C
Channingss 已提交
102 103 104 105 106 107 108 109 110
class ResizeByShort : public Transform {
 public:
  virtual void Init(const YAML::Node& item) {
    short_size_ = item["short_size"].as<int>();
    if (item["max_size"].IsDefined()) {
      max_size_ = item["max_size"].as<int>();
    } else {
      max_size_ = -1;
    }
C
Channingss 已提交
111
  }
C
Channingss 已提交
112 113 114 115 116 117 118 119
  virtual bool Run(cv::Mat* im, ImageBlob* data);

 private:
  float GenerateScale(const cv::Mat& im);
  int short_size_;
  int max_size_;
};

J
jack 已提交
120 121 122 123 124 125
/*
 * @brief
 * This class execute resize by long operation on image matrix. At first, it resizes
 * the long side of image matrix to specified length. Accordingly, the short side
 * will be resized in the same proportion.
 * */
C
Channingss 已提交
126 127 128 129
class ResizeByLong : public Transform {
 public:
  virtual void Init(const YAML::Node& item) {
    long_size_ = item["long_size"].as<int>();
C
Channingss 已提交
130
  }
C
Channingss 已提交
131 132 133 134 135 136
  virtual bool Run(cv::Mat* im, ImageBlob* data);

 private:
  int long_size_;
};

J
jack 已提交
137 138 139 140 141
/*
 * @brief
 * This class execute resize operation on image matrix. It resizes width and height
 * to specified length.
 * */
C
Channingss 已提交
142 143 144
class Resize : public Transform {
 public:
  virtual void Init(const YAML::Node& item) {
145 146 147
    if (item["interp"].IsDefined()) {
      interp_ = item["interp"].as<std::string>();
    }
C
Channingss 已提交
148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168
    if (item["target_size"].IsScalar()) {
      height_ = item["target_size"].as<int>();
      width_ = item["target_size"].as<int>();
    } else if (item["target_size"].IsSequence()) {
      std::vector<int> target_size = item["target_size"].as<std::vector<int>>();
      width_ = target_size[0];
      height_ = target_size[1];
    }
    if (height_ <= 0 || width_ <= 0) {
      std::cerr << "[Resize] target_size should greater than 0" << std::endl;
      exit(-1);
    }
  }
  virtual bool Run(cv::Mat* im, ImageBlob* data);

 private:
  int height_;
  int width_;
  std::string interp_;
};

J
jack 已提交
169 170 171 172 173
/*
 * @brief
 * This class execute center crop operation on image matrix. It crops the center
 * of image matrix accroding to specified size.
 * */
C
Channingss 已提交
174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192
class CenterCrop : public Transform {
 public:
  virtual void Init(const YAML::Node& item) {
    if (item["crop_size"].IsScalar()) {
      height_ = item["crop_size"].as<int>();
      width_ = item["crop_size"].as<int>();
    } else if (item["crop_size"].IsSequence()) {
      std::vector<int> crop_size = item["crop_size"].as<std::vector<int>>();
      width_ = crop_size[0];
      height_ = crop_size[1];
    }
  }
  virtual bool Run(cv::Mat* im, ImageBlob* data);

 private:
  int height_;
  int width_;
};

J
jack 已提交
193 194 195 196 197
/*
 * @brief
 * This class execute padding operation on image matrix. It makes border on edge
 * of image matrix.
 * */
C
Channingss 已提交
198 199 200 201 202
class Padding : public Transform {
 public:
  virtual void Init(const YAML::Node& item) {
    if (item["coarsest_stride"].IsDefined()) {
      coarsest_stride_ = item["coarsest_stride"].as<int>();
203
      if (coarsest_stride_ < 1) {
C
Channingss 已提交
204 205 206 207
        std::cerr << "[Padding] coarest_stride should greater than 0"
                  << std::endl;
        exit(-1);
      }
208
    }
C
Channingss 已提交
209
    if (item["target_size"].IsDefined()) {
C
Channingss 已提交
210 211 212 213
      if (item["target_size"].IsScalar()) {
        width_ = item["target_size"].as<int>();
        height_ = item["target_size"].as<int>();
      } else if (item["target_size"].IsSequence()) {
214 215
        width_ = item["target_size"].as<std::vector<int>>()[0];
        height_ = item["target_size"].as<std::vector<int>>()[1];
C
Channingss 已提交
216 217
      }
    }
S
syyxsxx 已提交
218 219
    if (item["im_padding_value"].IsDefined()) {
      im_value_ = item["im_padding_value"].as<std::vector<float>>();
S
syyxsxx 已提交
220
    } else {
S
syyxsxx 已提交
221 222
      im_value_ = {0, 0, 0};
    }
C
Channingss 已提交
223 224
  }
  virtual bool Run(cv::Mat* im, ImageBlob* data);
J
jack 已提交
225

C
Channingss 已提交
226 227 228 229
 private:
  int coarsest_stride_ = -1;
  int width_ = 0;
  int height_ = 0;
S
syyxsxx 已提交
230
  std::vector<float> im_value_;
C
Channingss 已提交
231
};
J
jack 已提交
232 233 234 235 236
/*
 * @brief
 * This class is transform operations manager. It stores all neccessary
 * transform operations and run them in correct order.
 * */
C
Channingss 已提交
237 238 239 240 241
class Transforms {
 public:
  void Init(const YAML::Node& node, bool to_rgb = true);
  std::shared_ptr<Transform> CreateTransform(const std::string& name);
  bool Run(cv::Mat* im, ImageBlob* data);
J
jack 已提交
242

C
Channingss 已提交
243 244 245 246 247 248
 private:
  std::vector<std::shared_ptr<Transform>> transforms_;
  bool to_rgb_ = true;
};

}  // namespace PaddleX