envs.py 8.0 KB
Newer Older
T
tangwei 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14
# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

T
tangwei 已提交
15
from contextlib import closing
Y
yaoxuefeng 已提交
16
import yaml
T
tangwei12 已提交
17
import copy
T
tangwei 已提交
18
import os
C
chengmo 已提交
19
import socket
T
tangwei 已提交
20
import sys
C
Chengmo 已提交
21
import six
X
xionghang 已提交
22
import traceback
G
gentelyang 已提交
23
import six
24 25 26 27 28 29
import time
import logging

# Import-time side effect: install a timestamped message format and make the
# logger returned by logging.getLogger() (called without a name) emit INFO
# and above. `logger` is the module-wide handle used by the helpers below.
logging.basicConfig(format="%(asctime)s - %(levelname)s - %(message)s")
logger = logging.getLogger()
logger.setLevel(logging.INFO)
T
tangwei 已提交
30

T
tangwei12 已提交
31
# Module-level store of flattened settings (dotted key -> value); it is filled
# by set_global_envs() and read by get_global_env() / get_global_envs().
global_envs = {}
T
tangwei 已提交
32
# NOTE(review): not referenced anywhere in the visible part of this file;
# presumably kept for external callers - confirm before removing.
global_envs_flatten = {}
T
tangwei 已提交
33

X
fix  
xjqbest 已提交
34

T
tangwei 已提交
35
def flatten_environs(envs, separator="."):
    """Flatten a nested dict into a single-level dict of strings.

    The keys along each path are joined with ``separator`` and every leaf
    value is converted with ``str``; for example ``{"a": {"b": 1}}`` becomes
    ``{"a.b": "1"}``. A nested dict that is empty contributes no entries.

    Args:
        envs (dict): possibly nested mapping to flatten.
        separator (str): text placed between the components of a key path.

    Returns:
        dict: ``{joined_key: str(leaf_value)}`` for every non-dict leaf.

    Raises:
        AssertionError: if ``envs`` is not a dict.
    """
    assert isinstance(envs, dict)

    flatten_dict = {}

    def _flatten(prefix, node):
        for key, value in node.items():
            # str(key) keeps non-string keys (e.g. integers coming from a
            # YAML file) from breaking separator.join().
            path = prefix + [str(key)]
            if isinstance(value, dict):
                _flatten(path, value)
            else:
                flatten_dict[separator.join(path)] = str(value)

    _flatten([], envs)
    return flatten_dict
T
tangwei 已提交
57

T
tangwei 已提交
58 59 60

def set_runtime_environs(environs):
    """Export every entry of ``environs`` into ``os.environ``.

    Args:
        environs (dict): variable name -> value; each value is stored as
            ``str(value)``.
    """
    for name, value in environs.items():
        os.environ[name] = str(value)
T
tangwei 已提交
62

T
tangwei 已提交
63

T
tangwei 已提交
64
def get_runtime_environ(key):
    """Return the value of environment variable ``key``, or None if unset."""
    return os.getenv(key)

T
tangwei 已提交
67

T
tangwei 已提交
68
def get_trainer():
    """Return the runtime environment value stored under "train.trainer.trainer".

    The lookup goes through get_runtime_environ(), so the result is None when
    the variable is not set.
    """
    return get_runtime_environ("train.trainer.trainer")


C
Chengmo 已提交
73 74 75 76 77
def get_fleet_mode():
    """Return the runtime environment value stored under "fleet_mode"."""
    return get_runtime_environ("fleet_mode")


T
tangwei 已提交
78
def set_global_envs(envs):
    """Flatten ``envs`` into the module-level ``global_envs`` dict.

    Nested dicts are flattened into dotted keys. A list found under a
    "dataset", "phase" or "runner" key is expanded per item, using the item's
    "name" as an extra path component (e.g. ``dataset.<name>.<field>``). Any
    other value is stored unchanged under its dotted key.

    After flattening, every string value in ``global_envs`` is passed through
    workspace_adapter() and os_path_adapter(). Finally, the "type" of every
    dataset is forced to "DataLoader" unless the platform is LINUX running
    Python 2.

    Args:
        envs (dict): parsed configuration.

    Raises:
        AssertionError: if ``envs`` is not a dict.
        ValueError: if an item of a dataset/phase/runner list has no "name".
    """
    assert isinstance(envs, dict)

    named_list_keys = ("dataset", "phase", "runner")

    def _flatten(prefix, node):
        for key, value in node.items():
            if isinstance(value, dict):
                _flatten(prefix + [key], value)
            elif key in named_list_keys and isinstance(value, list):
                for item in value:
                    item_name = item.get("name")
                    if item_name is None:
                        raise ValueError(
                            "name must be in {} list ".format(key), value)
                    _flatten(prefix + [key, item_name], item)
            else:
                global_envs[".".join(prefix + [key])] = value

    _flatten([], envs)

    # Iterate over a snapshot: entries are rewritten inside the loop.
    for name, value in list(global_envs.items()):
        if isinstance(value, str):
            global_envs[name] = os_path_adapter(workspace_adapter(value))

    on_linux = get_platform() == "LINUX"
    if on_linux and not six.PY3:
        # Only this combination keeps the dataset types from the config.
        return

    if on_linux:
        logger.info("QueueDataset can not support PY3, change to DataLoader")

    # A config without a "dataset" section simply has nothing to override.
    for dataset in envs.get("dataset") or []:
        name = ".".join(["dataset", dataset["name"], "type"])
        global_envs[name] = "DataLoader"

X
fix  
xjqbest 已提交
118

T
tangwei12 已提交
119
def get_global_env(env_name, default_value=None, namespace=None):
    """Look up a flattened setting in the module-level ``global_envs`` dict.

    Args:
        env_name (str): dotted key, relative to ``namespace`` when given.
        default_value: value returned when the key is absent.
        namespace (str): optional prefix; the key looked up is then
            ``namespace + "." + env_name``.

    Returns:
        The stored value, or ``default_value`` if the key is missing.
    """
    if namespace is not None:
        env_name = ".".join([namespace, env_name])
    return global_envs.get(env_name, default_value)


T
tangwei 已提交
128 129 130 131
def get_global_envs():
    """Return the module-level ``global_envs`` dict itself (not a copy)."""
    return global_envs


T
tangwei 已提交
132
def paddlerec_adapter(path):
    """Map a "paddlerec."-prefixed dotted name to a path under PACKAGE_BASE.

    A value such as ``paddlerec.a.b`` becomes ``<PACKAGE_BASE>/a/b``, where
    PACKAGE_BASE is read through get_runtime_environ(). Any other value is
    returned unchanged.

    Args:
        path (str): dotted built-in name or an ordinary path.

    Returns:
        str: the resolved path.
    """
    prefix = "paddlerec."
    if not path.startswith(prefix):
        return path

    package = get_runtime_environ("PACKAGE_BASE")
    # Strip only the leading prefix; splitting on "paddlerec." would cut the
    # name short if the same text appeared again later in it.
    relative = path[len(prefix):].replace(".", "/")
    return os.path.join(package, relative)
T
tangwei 已提交
139 140


T
tangwei 已提交
141 142 143 144 145 146
def os_path_adapter(value):
    """Rewrite the path separators in ``value`` for the current platform.

    On WINDOWS every "/" becomes a backslash; on any other platform every
    backslash becomes "/".
    """
    on_windows = get_platform() == "WINDOWS"
    old_sep, new_sep = ("/", "\\") if on_windows else ("\\", "/")
    return value.replace(old_sep, new_sep)
T
tangwei 已提交
147 148


T
tangwei 已提交
149
def workspace_adapter(value):
    """Expand "{workspace}" in ``value`` using the "workspace" global setting.

    The workspace is read from ``global_envs`` and the substitution itself is
    delegated to workspace_adapter_by_specific().
    """
    return workspace_adapter_by_specific(value, global_envs.get("workspace"))


def workspace_adapter_by_specific(value, workspace):
    """Replace every "{workspace}" placeholder in ``value``.

    Args:
        value (str): text that may contain the "{workspace}" placeholder.
        workspace (str): workspace location; it is first resolved through
            paddlerec_adapter().

    Returns:
        str: ``value`` with the placeholder substituted, or ``value`` itself
        when it contains no placeholder.
    """
    placeholder = "{workspace}"
    if placeholder not in value:
        # Nothing to substitute, so the workspace does not need to be
        # resolved (or even configured) for this value.
        return value
    return value.replace(placeholder, paddlerec_adapter(workspace))
T
tangwei 已提交
158

T
tangwei 已提交
159

T
tangwei 已提交
160 161 162 163 164 165 166 167 168
def reader_adapter():
    """On WINDOWS, set ``type`` to "DataLoader" on each "dataset" entry.

    Does nothing on other platforms. The entries are read from the "dataset"
    key of ``global_envs`` and modified in place.
    """
    if get_platform() != "WINDOWS":
        return

    # The key may be absent; treat that as "no datasets" instead of failing
    # on iteration over None.
    for dataset in global_envs.get("dataset") or []:
        dataset["type"] = "DataLoader"


T
tangwei12 已提交
169
def pretty_print_envs(envs, header=None):
    """Render ``envs`` as a two-column text table.

    The key column is at least 45 characters wide and grows to fit the
    longest key; the value column is 50 characters wide. String values of 50
    characters or more are shortened to "... " followed by their tail so that
    they fill the value column exactly. Other values are printed with ``str``.

    Args:
        envs (dict): string key -> value pairs to display.
        header (sequence): optional pair of column titles; defaults to
            ("paddlerec Global Envs", "Value").

    Returns:
        str: the table, preceded and followed by a newline.
    """
    spacing = 5
    max_v = 50
    ellipsis = "... "
    max_k = max([45] + [len(k) for k in envs])

    gap = " " * spacing
    h_format = "{{:^{}s}}{}{{:<{}s}}\n".format(max_k, gap, max_v)
    l_format = "{{:<{}s}}{}{{:<{}s}}\n".format(max_k, gap, max_v)
    length = max_k + max_v + spacing

    border = "=" * length
    line = "-" * length

    if header:
        title = h_format.format(header[0], header[1])
    else:
        title = h_format.format("paddlerec Global Envs", "Value")

    rows = []
    for k, v in envs.items():
        if isinstance(v, str) and len(v) >= max_v:
            # Keep the tail of the value; ellipsis + tail is max_v wide.
            v = ellipsis + v[-(max_v - len(ellipsis)):]
        rows.append(l_format.format(k, str(v)))

    draws = "".join([border, "\n", title, line, "\n"] + rows + [border])
    return "\n{}\n".format(draws)
T
tangwei 已提交
206 207


T
tangwei 已提交
208
def lazy_instance_by_package(package, class_name):
    """Import ``package`` and return its attribute named ``class_name``.

    Args:
        package (str): dotted module path to import.
        class_name (str): name of the attribute to fetch from that module.

    Returns:
        The attribute, or None if the import or the lookup raised. In that
        case the traceback is printed and the error is logged, not re-raised.
    """
    try:
        # A non-empty fromlist makes __import__ return the leaf module
        # instead of the top-level package.
        model_package = __import__(package,
                                   globals(), locals(), package.split("."))
        return getattr(model_package, class_name)
    except Exception as err:
        traceback.print_exc()
        logger.info('Catch Exception:%s' % str(err))
        return None
T
tangwei 已提交
218 219


T
tangwei 已提交
220
def lazy_instance_by_fliename(abs, class_name):
    """Import the Python file at ``abs`` and return its ``class_name`` attribute.

    The file's directory is added to ``sys.path`` (once) and the file is then
    imported by its base name without extension.

    Args:
        abs (str): path of the Python source file.
        class_name (str): name of the attribute to fetch from the module.

    Returns:
        The attribute, or None if the import or the lookup raised. In that
        case the traceback is printed and the error is logged, not re-raised.
    """
    try:
        dirname = os.path.dirname(abs)
        # Avoid growing sys.path with duplicates on repeated calls.
        if dirname not in sys.path:
            sys.path.append(dirname)
        package = os.path.splitext(os.path.basename(abs))[0]

        model_package = __import__(package,
                                   globals(), locals(), package.split("."))
        return getattr(model_package, class_name)
    except Exception as err:
        traceback.print_exc()
        logger.info('Catch Exception:%s' % str(err))
        return None
T
tangwei 已提交
234 235


T
tangwei 已提交
236 237 238 239 240 241 242 243 244
def get_platform():
    """Classify the host OS from ``platform.platform()``.

    Returns:
        "LINUX", "DARWIN" or "WINDOWS" for the first of 'Linux', 'Darwin',
        'Windows' found in the platform string (checked in that order), or
        None when none of them is present.
    """
    import platform

    description = platform.platform()
    known = (("Linux", "LINUX"), ("Darwin", "DARWIN"), ("Windows", "WINDOWS"))
    for marker, label in known:
        if marker in description:
            return label
    return None
C
chengmo 已提交
245 246 247 248


def find_free_port():
    """Return a TCP port number that was free at the time of the call.

    A socket is bound to port 0 so that the operating system picks an unused
    port; that port number is returned. The socket is closed before
    returning, so the port is not reserved for the caller.

    Returns:
        int: the port number chosen by the operating system.
    """
    with closing(socket.socket(socket.AF_INET, socket.SOCK_STREAM)) as sock:
        sock.bind(('', 0))
        return sock.getsockname()[1]
X
test  
xjqbest 已提交
255 256 257 258 259 260 261 262 263 264 265 266 267 268 269


def load_yaml(config):
    """Parse the YAML file at ``config`` and return the loaded object.

    ``yaml.FullLoader`` is used when the installed PyYAML provides it (it was
    introduced in PyYAML 5.1); otherwise ``yaml.load`` is called without an
    explicit loader, as older releases require.

    Args:
        config (str): path of the YAML file, read as UTF-8.

    Returns:
        The Python object produced by ``yaml.load``.

    Raises:
        ValueError: if ``config`` is not an existing file.
    """
    import io

    if not os.path.isfile(config):
        raise ValueError("config {} can not be supported".format(config))

    # Feature detection instead of parsing yaml.__version__: int() on the
    # version parts fails for pre-release versions such as "5.1b1".
    full_loader = getattr(yaml, "FullLoader", None)

    # io.open accepts `encoding` on both Python 2 and Python 3.
    with io.open(config, 'r', encoding="utf-8") as stream:
        content = stream.read()

    if full_loader is not None:
        return yaml.load(content, Loader=full_loader)

    # NOTE(review): on PyYAML < 5.1 this uses the legacy default loader,
    # which can construct arbitrary Python objects - only load trusted files.
    return yaml.load(content)