resource.h 3.2 KB
Newer Older
W
wangguibao 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
// Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#pragma once
#include <map>
#include <memory>
#include <string>
#include <vector>
#include <utility>
#include "core/cube/cube-api/include/cube_api.h"
#include "core/predictor/common/inner_common.h"
#include "core/predictor/framework/infer.h"
#include "core/predictor/framework/memory.h"

namespace baidu {
namespace paddle_serving {
namespace predictor {

G
guru4elephant 已提交
30
// Plain data holder describing the feed (input) and fetch (output) variables
// of a general model. Every field is public; this header only declares the
// fields and does not populate them.
class PaddleGeneralModelConfig {
 public:
  PaddleGeneralModelConfig() {}

  ~PaddleGeneralModelConfig() {}

 public:
  // Per-feed-variable attributes.
  // NOTE(review): presumably these vectors are index-aligned (entry i of each
  // describes the same feed variable) -- confirm against the code that fills
  // them.
  std::vector<std::string> _feed_name;
  std::vector<std::string> _feed_alias_name;
  std::vector<int> _feed_type;      // 0 int64, 1 float
  std::vector<bool> _is_lod_feed;   // true lod tensor
  std::vector<bool> _is_lod_fetch;  // whether a fetch var is lod_tensor
  std::vector<int> _capacity;       // capacity for each tensor

  /*
   * _feed_shape describes the fed variables:
   * _feed_shape[i][j] is the jth dim of the ith input tensor;
   * if _is_lod_feed[i] == false, _feed_shape[i][0] = -1
   */
  std::vector<std::vector<int>> _feed_shape;

  // Per-fetch-variable attributes.
  std::vector<std::string> _fetch_name;
  std::vector<std::string> _fetch_alias_name;
  std::vector<std::vector<int>> _fetch_shape;

  // Lookup tables from a fetch variable's name / alias name to an int index.
  // NOTE(review): presumably the index is the position in the _fetch_*
  // vectors above -- confirm.
  std::map<std::string, int> _fetch_name_to_index;
  std::map<std::string, int> _fetch_alias_name_to_index;
};

W
wangguibao 已提交
57 58 59
// Forward declaration only; BaseRdDict is not defined in the visible part of
// this header.
class BaseRdDict;

class Resource {
W
wangguibao 已提交
60
 public:
W
wangguibao 已提交
61 62 63 64 65 66 67
  Resource() {
    // Reference InferManager::instance() explicitly, to make sure static
    // instance of InferManager is constructed before that of Resource, and
    // destruct after that of Resource
    // See https://stackoverflow.com/a/335746/1513460
    InferManager::instance();
  }
W
wangguibao 已提交
68

W
wangguibao 已提交
69
  ~Resource() { finalize(); }
W
wangguibao 已提交
70

W
wangguibao 已提交
71 72 73 74
  static Resource& instance() {
    static Resource ins;
    return ins;
  }
W
wangguibao 已提交
75

W
wangguibao 已提交
76
  int initialize(const std::string& path, const std::string& file);
G
guru4elephant 已提交
77

78 79
  int general_model_initialize(const std::string& path,
                               const std::string& file);
G
guru4elephant 已提交
80

W
wangguibao 已提交
81
  int thread_initialize();
W
wangguibao 已提交
82

W
wangguibao 已提交
83
  int thread_clear();
W
wangguibao 已提交
84

W
wangguibao 已提交
85
  int reload();
W
wangguibao 已提交
86

W
wangguibao 已提交
87
  int finalize();
W
wangguibao 已提交
88

89 90
  std::vector<std::shared_ptr<PaddleGeneralModelConfig>>
  get_general_model_config();
G
guru4elephant 已提交
91 92

  void print_general_model_config(
93
      const std::shared_ptr<PaddleGeneralModelConfig>& config);
G
guru4elephant 已提交
94

W
wangjiawei04 已提交
95
  size_t get_cube_quant_bits();
W
wangguibao 已提交
96

W
wangguibao 已提交
97 98
 private:
  int thread_finalize() { return 0; }
99
  std::vector<std::shared_ptr<PaddleGeneralModelConfig>> _configs;
W
wangjiawei04 已提交
100
  std::string cube_config_fullpath;
W
wangjiawei04 已提交
101
  int cube_quant_bits;  // 0 if no empty
102

W
wangguibao 已提交
103
  THREAD_KEY_T _tls_bspec_key;
W
wangguibao 已提交
104 105
};

W
wangguibao 已提交
106 107 108
}  // namespace predictor
}  // namespace paddle_serving
}  // namespace baidu