transforms.h 7.1 KB
Newer Older
C
Channingss 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30
//   Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#pragma once

#include <yaml-cpp/yaml.h>

#include <memory>
#include <string>
#include <unordered_map>
#include <utility>
#include <vector>

#include <opencv2/core/core.hpp>
#include <opencv2/highgui/highgui.hpp>
#include <opencv2/imgproc/imgproc.hpp>

namespace PaddleX {

J
jack 已提交
31 32 33 34
/*
 * @brief
 * This class represents object for storing all preprocessed data
 * */
C
Channingss 已提交
35 36 37 38 39 40 41
class ImageBlob {
 public:
  // Original image height and width
  std::vector<int> ori_im_size_ = std::vector<int>(2);
  // Newest image height and width after process
  std::vector<int> new_im_size_ = std::vector<int>(2);
  // Image height and width before resize
C
Channingss 已提交
42
  std::vector<std::vector<int>> im_size_before_resize_;
C
Channingss 已提交
43 44 45 46 47 48 49 50 51 52 53 54 55 56
  // Reshape order
  std::vector<std::string> reshape_order_;
  // Resize scale
  float scale = 1.0;
  // Buffer for image data after preprocessing
  std::vector<float> im_data_;

  void clear() {
    im_size_before_resize_.clear();
    reshape_order_.clear();
    im_data_.clear();
  }
};

J
jack 已提交
57 58 59 60
/*
 * @brief
 * Abstraction of preprocessing operation class
 * */
C
Channingss 已提交
61 62 63
class Transform {
 public:
  virtual void Init(const YAML::Node& item) = 0;
J
jack 已提交
64 65 66 67 68
  /*
   * @brief
   * This method executes preprocessing operation on image matrix,
   * result will be returned at second parameter.
   * @param im: single image matrix to be preprocessed
J
jack 已提交
69
   * @param data: the raw data of single image matrix after preprocessed
J
jack 已提交
70 71
   * @return true if transform successfully
   * */
C
Channingss 已提交
72 73 74
  virtual bool Run(cv::Mat* im, ImageBlob* data) = 0;
};

J
jack 已提交
75 76 77 78
/*
 * @brief
 * This class execute normalization operation on image matrix
 * */
C
Channingss 已提交
79 80 81 82 83 84 85 86 87 88 89 90 91 92
class Normalize : public Transform {
 public:
  virtual void Init(const YAML::Node& item) {
    mean_ = item["mean"].as<std::vector<float>>();
    std_ = item["std"].as<std::vector<float>>();
  }

  virtual bool Run(cv::Mat* im, ImageBlob* data);

 private:
  std::vector<float> mean_;
  std::vector<float> std_;
};

J
jack 已提交
93 94
/*
 * @brief
J
jack 已提交
95
 * This class execute resize by short operation on image matrix. At first, it resizes
J
jack 已提交
96 97
 * the short side of image matrix to specified length. Accordingly, the long side
 * will be resized in the same proportion. If new length of long side exceeds max
J
jack 已提交
98
 * size, the long size will be resized to max size, and the short size will be
J
jack 已提交
99 100
 * resized in the same proportion
 * */
C
Channingss 已提交
101 102 103 104 105 106 107 108 109
class ResizeByShort : public Transform {
 public:
  virtual void Init(const YAML::Node& item) {
    short_size_ = item["short_size"].as<int>();
    if (item["max_size"].IsDefined()) {
      max_size_ = item["max_size"].as<int>();
    } else {
      max_size_ = -1;
    }
C
Channingss 已提交
110
  }
C
Channingss 已提交
111 112 113 114 115 116 117 118
  virtual bool Run(cv::Mat* im, ImageBlob* data);

 private:
  float GenerateScale(const cv::Mat& im);
  int short_size_;
  int max_size_;
};

J
jack 已提交
119 120 121 122 123 124
/*
 * @brief
 * This class execute resize by long operation on image matrix. At first, it resizes
 * the long side of image matrix to specified length. Accordingly, the short side
 * will be resized in the same proportion.
 * */
C
Channingss 已提交
125 126 127 128
class ResizeByLong : public Transform {
 public:
  virtual void Init(const YAML::Node& item) {
    long_size_ = item["long_size"].as<int>();
C
Channingss 已提交
129
  }
C
Channingss 已提交
130 131 132 133 134 135
  virtual bool Run(cv::Mat* im, ImageBlob* data);

 private:
  int long_size_;
};

J
jack 已提交
136 137 138 139 140
/*
 * @brief
 * This class execute resize operation on image matrix. It resizes width and height
 * to specified length.
 * */
C
Channingss 已提交
141 142 143
class Resize : public Transform {
 public:
  virtual void Init(const YAML::Node& item) {
144 145 146
    if (item["interp"].IsDefined()) {
      interp_ = item["interp"].as<std::string>();
    }
C
Channingss 已提交
147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167
    if (item["target_size"].IsScalar()) {
      height_ = item["target_size"].as<int>();
      width_ = item["target_size"].as<int>();
    } else if (item["target_size"].IsSequence()) {
      std::vector<int> target_size = item["target_size"].as<std::vector<int>>();
      width_ = target_size[0];
      height_ = target_size[1];
    }
    if (height_ <= 0 || width_ <= 0) {
      std::cerr << "[Resize] target_size should greater than 0" << std::endl;
      exit(-1);
    }
  }
  virtual bool Run(cv::Mat* im, ImageBlob* data);

 private:
  int height_;
  int width_;
  std::string interp_;
};

J
jack 已提交
168 169 170 171 172
/*
 * @brief
 * This class execute center crop operation on image matrix. It crops the center
 * of image matrix accroding to specified size.
 * */
C
Channingss 已提交
173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191
class CenterCrop : public Transform {
 public:
  virtual void Init(const YAML::Node& item) {
    if (item["crop_size"].IsScalar()) {
      height_ = item["crop_size"].as<int>();
      width_ = item["crop_size"].as<int>();
    } else if (item["crop_size"].IsSequence()) {
      std::vector<int> crop_size = item["crop_size"].as<std::vector<int>>();
      width_ = crop_size[0];
      height_ = crop_size[1];
    }
  }
  virtual bool Run(cv::Mat* im, ImageBlob* data);

 private:
  int height_;
  int width_;
};

J
jack 已提交
192 193 194 195 196
/*
 * @brief
 * This class execute padding operation on image matrix. It makes border on edge
 * of image matrix.
 * */
C
Channingss 已提交
197 198 199 200 201
class Padding : public Transform {
 public:
  virtual void Init(const YAML::Node& item) {
    if (item["coarsest_stride"].IsDefined()) {
      coarsest_stride_ = item["coarsest_stride"].as<int>();
202
      if (coarsest_stride_ < 1) {
C
Channingss 已提交
203 204 205 206
        std::cerr << "[Padding] coarest_stride should greater than 0"
                  << std::endl;
        exit(-1);
      }
207
    }
C
Channingss 已提交
208
    if (item["target_size"].IsDefined()) {
C
Channingss 已提交
209 210 211 212
      if (item["target_size"].IsScalar()) {
        width_ = item["target_size"].as<int>();
        height_ = item["target_size"].as<int>();
      } else if (item["target_size"].IsSequence()) {
213 214
        width_ = item["target_size"].as<std::vector<int>>()[0];
        height_ = item["target_size"].as<std::vector<int>>()[1];
C
Channingss 已提交
215 216
      }
    }
S
syyxsxx 已提交
217 218 219 220 221 222
    if (item["im_padding_value"].IsDefined()) {
      im_value_ = item["im_padding_value"].as<std::vector<float>>();
    }
    else {
      im_value_ = {0, 0, 0};
    }
C
Channingss 已提交
223 224
  }
  virtual bool Run(cv::Mat* im, ImageBlob* data);
J
jack 已提交
225

C
Channingss 已提交
226 227 228 229
 private:
  int coarsest_stride_ = -1;
  int width_ = 0;
  int height_ = 0;
S
syyxsxx 已提交
230
  std::vector<float> im_value_;
C
Channingss 已提交
231
};
J
jack 已提交
232 233 234 235 236
/*
 * @brief
 * This class is transform operations manager. It stores all neccessary
 * transform operations and run them in correct order.
 * */
C
Channingss 已提交
237 238 239 240 241
class Transforms {
 public:
  void Init(const YAML::Node& node, bool to_rgb = true);
  std::shared_ptr<Transform> CreateTransform(const std::string& name);
  bool Run(cv::Mat* im, ImageBlob* data);
J
jack 已提交
242

C
Channingss 已提交
243 244 245 246 247 248
 private:
  std::vector<std::shared_ptr<Transform>> transforms_;
  bool to_rgb_ = true;
};

}  // namespace PaddleX