__init__.py 7.3 KB
Newer Older
G
guru4elephant 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
#   Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

from .serving_client import PredictorClient
16 17 18
from .proto import sdk_configure_pb2 as sdk
from .proto import general_model_config_pb2 as m_config
import google.protobuf.text_format
G
guru4elephant 已提交
19
import time
20
import sys
G
guru4elephant 已提交
21

G
guru4elephant 已提交
22 23 24
# Feed-variable type codes. Client compares each feed variable's
# ``feed_type`` (read from the model config) against these to decide
# whether a value goes into the int slots or the float slots.
int_type, float_type = 0, 1

M
MRXLT 已提交
25

G
guru4elephant 已提交
26 27 28 29 30 31 32 33 34 35 36 37 38 39
class SDKConfig(object):
    """Builds the ``sdk.SDKConf`` message describing the general-model predictor.

    The message is created once in ``__init__`` and filled in by
    ``gen_desc`` using the endpoints set via ``set_server_endpoints``.
    """

    def __init__(self):
        self.sdk_desc = sdk.SDKConf()
        self.endpoints = []

    def set_server_endpoints(self, endpoints):
        """Store the server endpoints used by the next ``gen_desc`` call.

        Args:
            endpoints: sequence of endpoint strings (presumably
                ``"host:port"`` -- confirm against callers).
        """
        self.endpoints = endpoints

    def gen_desc(self):
        """Fill in and return the SDK configuration message.

        Adds one predictor named ``"general_model"`` with a single variant
        pointing at ``self.endpoints``, then sets the default connection,
        naming and RPC parameters.

        NOTE: every call appends another predictor to ``self.sdk_desc``;
        the message is not cleared between calls.

        Returns:
            The populated ``sdk.SDKConf`` message (``self.sdk_desc``).
        """
        predictor_desc = sdk.Predictor()
        predictor_desc.name = "general_model"
        predictor_desc.service_name = (
            "baidu.paddle_serving.predictor.general_model.GeneralModelService")
        predictor_desc.endpoint_router = "WeightedRandomRender"
        predictor_desc.weighted_random_render_conf.variant_weight_list = "100"

        variant_desc = sdk.VariantConf()
        variant_desc.tag = "var1"
        # The list:// naming scheme takes a comma-separated server list.
        # Joining with ":" (as before) glued several "host:port" entries
        # into one unparseable address; a single endpoint is unaffected.
        variant_desc.naming_conf.cluster = "list://{}".format(",".join(
            self.endpoints))

        predictor_desc.variants.extend([variant_desc])
        self.sdk_desc.predictors.extend([predictor_desc])

        default_conf = self.sdk_desc.default_variant_conf
        default_conf.tag = "default"

        connection = default_conf.connection_conf
        connection.connect_timeout_ms = 2000
        connection.rpc_timeout_ms = 20000
        connection.connect_retry_count = 2
        connection.max_connection_per_host = 100
        connection.hedge_request_timeout_ms = -1
        connection.hedge_fetch_retry_count = 2
        connection.connection_type = "pooled"

        naming = default_conf.naming_conf
        naming.cluster_filter_strategy = "Default"
        naming.load_balance_strategy = "la"

        rpc = default_conf.rpc_parameter
        rpc.compress_type = 0
        rpc.package_size = 20
        rpc.protocol = "baidu_std"
        rpc.max_channel_per_request = 3

        return self.sdk_desc
G
guru4elephant 已提交
68

G
guru4elephant 已提交
69 70 71 72 73 74 75

class Client(object):
    """Python front end for ``PredictorClient``.

    Typical use: ``load_client_config`` -> ``connect`` -> ``predict`` /
    ``batch_predict`` -> ``release``. The methods that talk to the server
    require ``load_client_config`` to have created ``client_handle_``.
    """

    def __init__(self):
        self.feed_names_ = []
        self.fetch_names_ = []
        self.client_handle_ = None
        self.feed_shapes_ = []
        self.feed_types_ = {}
        self.feed_names_to_idx_ = {}

    def load_client_config(self, path):
        """Load the client-side model config and create the predictor handle.

        Parses the text-format ``GeneralModelConfig`` at ``path``, creates
        and initialises a ``PredictorClient`` from the same path, and
        records the feed/fetch variable names, feed shapes, feed types and
        the feed-name -> index mapping.

        Args:
            path: path to the text-format model config file.
        """
        model_conf = m_config.GeneralModelConfig()
        # Use a context manager so the config file is closed even if
        # parsing fails (the handle used to be leaked).
        with open(path, 'r') as config_file:
            model_conf = google.protobuf.text_format.Merge(
                str(config_file.read()), model_conf)

        self.client_handle_ = PredictorClient()
        self.client_handle_.init(path)
        # Let gflags pick the profiling switches up from the environment.
        read_env_flags = ["profile_client", "profile_server"]
        self.client_handle_.init_gflags(
            [sys.argv[0]] + ["--tryfromenv=" + ",".join(read_env_flags)])

        self.feed_names_ = [var.alias_name for var in model_conf.feed_var]
        self.fetch_names_ = [var.alias_name for var in model_conf.fetch_var]
        self.feed_shapes_ = [var.shape for var in model_conf.feed_var]
        # Reset both lookup tables so that reloading a different config
        # does not keep entries from the previous one.
        self.feed_names_to_idx_ = {}
        self.feed_types_ = {}
        for i, var in enumerate(model_conf.feed_var):
            self.feed_names_to_idx_[var.alias_name] = i
            self.feed_types_[var.alias_name] = var.feed_type

        return

    def connect(self, endpoints):
        """Create the predictor for the given server endpoints.

        Builds an SDK description via ``SDKConfig`` and hands its
        serialized form to the client handle.

        Args:
            endpoints: sequence of endpoint strings, passed to
                ``SDKConfig.set_server_endpoints``.
        """
        predictor_sdk = SDKConfig()
        predictor_sdk.set_server_endpoints(endpoints)
        sdk_desc = predictor_sdk.gen_desc()
        self.client_handle_.create_predictor_by_desc(
            sdk_desc.SerializeToString())

    def get_feed_names(self):
        """Return the feed variable alias names from the loaded config."""
        return self.feed_names_

    def get_fetch_names(self):
        """Return the fetch variable alias names from the loaded config."""
        return self.fetch_names_

    def _split_feed(self, feed, int_names=None, float_names=None):
        """Split one feed dict into int-typed and float-typed value lists.

        Keys not present in ``self.feed_names_`` are ignored, as are keys
        whose type is neither ``int_type`` nor ``float_type``. When a name
        list is given, the matching keys are appended to it in iteration
        order.

        Returns:
            Tuple ``(int_slot, float_slot)``.
        """
        int_slot = []
        float_slot = []
        for key in feed:
            if key not in self.feed_names_:
                continue
            feed_type = self.feed_types_[key]
            if feed_type == int_type:
                if int_names is not None:
                    int_names.append(key)
                int_slot.append(feed[key])
            elif feed_type == float_type:
                if float_names is not None:
                    float_names.append(key)
                float_slot.append(feed[key])
        return int_slot, float_slot

    def _known_fetch_names(self, fetch):
        """Return the requested fetch names that the config declares, in request order."""
        return [name for name in fetch if name in self.fetch_names_]

    @staticmethod
    def _to_result_map(fetch_names, result):
        """Pair each fetch name with the result entry at the same position."""
        return {name: result[i] for i, name in enumerate(fetch_names)}

    def predict(self, feed={}, fetch=[], profile=False):
        """Run prediction on a single sample.

        Args:
            feed: dict mapping feed variable name -> value. Unknown names
                are ignored. The default is only read, never mutated.
            fetch: list of fetch variable names; unknown names are
                ignored. The default is only read, never mutated.
            profile: currently unused by this method.

        Returns:
            Dict mapping each accepted fetch name to its result.
        """
        int_feed_names = []
        float_feed_names = []
        int_slot, float_slot = self._split_feed(feed, int_feed_names,
                                                float_feed_names)
        fetch_names = self._known_fetch_names(fetch)

        result = self.client_handle_.predict(
            float_slot, float_feed_names, int_slot, int_feed_names, fetch_names)

        # TODO(guru4elephant): the order of fetch var names should be
        #                      consistent with general_model_config; this is
        #                      not friendly. In the future the number of
        #                      fetched variables should be changeable.
        return self._to_result_map(fetch_names, result)

    def batch_predict(self, feed_batch=[], fetch=[], profile=False):
        """Run prediction on a batch of samples.

        Args:
            feed_batch: list of feed dicts, one per sample. The default is
                only read, never mutated.
            fetch: list of fetch variable names; unknown names are
                ignored. The default is only read, never mutated.
            profile: currently unused by this method.

        Returns:
            List of dicts, one per entry returned by the client handle,
            each mapping the accepted fetch names to that entry's results.
        """
        int_slot_batch = []
        float_slot_batch = []
        int_feed_names = []
        float_feed_names = []
        for sample_idx, feed in enumerate(feed_batch):
            # Feed names are taken from the first sample only.
            # NOTE(review): later samples are assumed to carry the same
            # keys in the same iteration order -- confirm with callers.
            if sample_idx == 0:
                int_slot, float_slot = self._split_feed(
                    feed, int_feed_names, float_feed_names)
            else:
                int_slot, float_slot = self._split_feed(feed)
            int_slot_batch.append(int_slot)
            float_slot_batch.append(float_slot)

        fetch_names = self._known_fetch_names(fetch)

        result_batch = self.client_handle_.batch_predict(
            float_slot_batch, float_feed_names, int_slot_batch, int_feed_names,
            fetch_names)

        return [
            self._to_result_map(fetch_names, result) for result in result_batch
        ]

    def release(self):
        """Destroy the predictor held by the client handle."""
        self.client_handle_.destroy_predictor()