// Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved. // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. // reference from https://github.com/RangiLyu/nanodet/tree/main/demo_openvino #ifndef _PICODET_OPENVINO_H_ #define _PICODET_OPENVINO_H_ #include #include #include #define image_size 416 typedef struct HeadInfo { std::string cls_layer; std::string dis_layer; int stride; } HeadInfo; typedef struct BoxInfo { float x1; float y1; float x2; float y2; float score; int label; } BoxInfo; class PicoDet { public: PicoDet(const char *param); ~PicoDet(); InferenceEngine::ExecutableNetwork network_; InferenceEngine::InferRequest infer_request_; // static bool hasGPU; std::vector heads_info_{ // cls_pred|dis_pred|stride {"transpose_0.tmp_0", "transpose_1.tmp_0", 8}, {"transpose_2.tmp_0", "transpose_3.tmp_0", 16}, {"transpose_4.tmp_0", "transpose_5.tmp_0", 32}, {"transpose_6.tmp_0", "transpose_7.tmp_0", 64}, }; std::vector detect(cv::Mat image, float score_threshold, float nms_threshold); private: void preprocess(cv::Mat &image, InferenceEngine::Blob::Ptr &blob); void decode_infer(const float *&cls_pred, const float *&dis_pred, int stride, float threshold, std::vector> &results); BoxInfo disPred2Bbox(const float *&dfl_det, int label, float score, int x, int y, int stride); static void nms(std::vector &result, float nms_threshold); std::string input_name_; int input_size_ = image_size; int num_class_ = 80; int reg_max_ = 7; }; #endif