envs.py 7.5 KB
Newer Older
T
tangwei 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14
# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

T
tangwei 已提交
15
from contextlib import closing
Y
yaoxuefeng 已提交
16
import yaml
T
tangwei12 已提交
17
import copy
T
tangwei 已提交
18
import os
C
chengmo 已提交
19
import socket
T
tangwei 已提交
20
import sys
X
xionghang 已提交
21
import traceback
G
gentelyang 已提交
22
import six
T
tangwei 已提交
23

T
tangwei12 已提交
24
# Flat registry of configuration values keyed by dotted names ("a.b.c").
# Filled by set_global_envs() and read by get_global_env()/get_global_envs().
global_envs = {}
T
tangwei 已提交
25
# NOTE(review): no function visible in this file reads or writes this dict;
# presumably reserved for a flattened view of the envs -- confirm before use.
global_envs_flatten = {}
T
tangwei 已提交
26

X
fix  
xjqbest 已提交
27

T
tangwei 已提交
28
def flatten_environs(envs, separator="."):
    """
    Collapse a nested dict into a single-level dict of strings.

    Each leaf is stored under the keys of its ancestors joined with
    ``separator`` and its value is converted with ``str``. Empty nested
    dicts contribute no entries.

    Args:
        envs (dict): nested mapping to flatten.
        separator (str): text placed between the key components.

    Returns:
        dict: joined key -> ``str(value)``.
    """
    assert isinstance(envs, dict)
    flattened = {}

    def _walk(path, node):
        # Leaves are written out; dicts are descended into with a longer path.
        if not isinstance(node, dict):
            flattened[separator.join(path)] = str(node)
            return
        for key, child in node.items():
            _walk(path + [key], child)

    for top_key, top_value in envs.items():
        _walk([top_key], top_value)

    return flattened
T
tangwei 已提交
50

T
tangwei 已提交
51 52 53

def set_runtime_environs(environs):
    """
    Export every entry of ``environs`` into the process environment.

    Values are converted with ``str`` before being written to ``os.environ``.
    """
    process_env = os.environ
    for name, raw_value in environs.items():
        process_env[name] = str(raw_value)
T
tangwei 已提交
55

T
tangwei 已提交
56

T
tangwei 已提交
57
def get_runtime_environ(key):
    """
    Return the process environment value stored under ``key``, or ``None``
    when the variable is not set.
    """
    return os.environ.get(key)

T
tangwei 已提交
60

T
tangwei 已提交
61
def get_trainer():
    """
    Return the runtime environment entry "train.trainer.trainer"
    (``None`` when it is not set).
    """
    return get_runtime_environ("train.trainer.trainer")


C
Chengmo 已提交
66 67 68 69 70
def get_fleet_mode():
    """
    Return the runtime environment entry "fleet_mode"
    (``None`` when it is not set).
    """
    return get_runtime_environ("fleet_mode")


T
tangwei 已提交
71
def set_global_envs(envs):
    """
    Flatten ``envs`` into the module-level ``global_envs`` registry.

    Nested dicts become dotted keys ("a.b.c"). A list stored under the key
    "dataset", "phase" or "runner" is expanded element by element, with the
    element's "name" inserted into the key ("dataset.<name>.<field>"). Any
    other value is stored unchanged under its dotted key.

    After flattening, every string value in the registry is passed through
    ``workspace_adapter`` and ``os_path_adapter``. On any platform other
    than Linux, each dataset's "type" entry is then overwritten with
    "DataLoader".

    Args:
        envs (dict): nested configuration.

    Raises:
        ValueError: an element of a "dataset"/"phase"/"runner" list has no
            "name".
    """
    assert isinstance(envs, dict)

    named_list_keys = ("dataset", "phase", "runner")

    def _flatten(prefix, node):
        for key, value in node.items():
            if isinstance(value, dict):
                _flatten(prefix + [key], value)
            elif key in named_list_keys and isinstance(value, list):
                for item in value:
                    if item.get("name") is None:
                        raise ValueError("name must be in dataset list ",
                                         value)
                    # The element's name becomes part of the dotted key.
                    _flatten(prefix + [key, item["name"]], item)
            else:
                global_envs[".".join(prefix + [key])] = value

    _flatten([], envs)

    # Iterate over a snapshot: values are rewritten in place during the loop.
    for name, value in list(global_envs.items()):
        if isinstance(value, str):
            global_envs[name] = os_path_adapter(workspace_adapter(value))

    if get_platform() != "LINUX":
        # A config without a "dataset" section must not fail here.
        for dataset in envs.get("dataset") or []:
            type_key = ".".join(["dataset", dataset["name"], "type"])
            global_envs[type_key] = "DataLoader"

X
fix  
xjqbest 已提交
105

T
tangwei12 已提交
106
def get_global_env(env_name, default_value=None, namespace=None):
    """
    Look up a value in the flattened ``global_envs`` registry.

    When ``namespace`` is given, the key searched is
    "<namespace>.<env_name>"; otherwise ``env_name`` is used as is.
    ``default_value`` is returned when the key is absent.
    """
    if namespace is None:
        lookup_key = env_name
    else:
        lookup_key = ".".join([namespace, env_name])
    return global_envs.get(lookup_key, default_value)


T
tangwei 已提交
115 116 117 118
def get_global_envs():
    """
    Return the module-level ``global_envs`` dict itself (not a copy).
    """
    return global_envs


T
tangwei 已提交
119
def paddlerec_adapter(path):
    """
    Translate a "paddlerec."-prefixed dotted name into a filesystem path.

    A ``path`` that starts with "paddlerec." has that prefix removed, its
    remaining dots replaced by "/", and the result joined onto the
    "PACKAGE_BASE" runtime environment value. Any other ``path`` is
    returned unchanged.

    Args:
        path (str): dotted package name or ordinary path.

    Returns:
        str: the resolved path.
    """
    prefix = "paddlerec."
    if not path.startswith(prefix):
        return path

    package = get_runtime_environ("PACKAGE_BASE")
    # Strip only the leading prefix. Splitting on "paddlerec." and taking
    # element [1] would drop everything after a second occurrence of it.
    relative = path[len(prefix):].replace(".", "/")
    return os.path.join(package, relative)
T
tangwei 已提交
126 127


T
tangwei 已提交
128 129 130 131 132 133
def os_path_adapter(value):
    """
    Rewrite the path separators in ``value`` for the current platform:
    "/" becomes "\\" when get_platform() reports "WINDOWS", otherwise
    "\\" becomes "/".
    """
    on_windows = get_platform() == "WINDOWS"
    old_sep, new_sep = ("/", "\\") if on_windows else ("\\", "/")
    return value.replace(old_sep, new_sep)
T
tangwei 已提交
134 135


T
tangwei 已提交
136
def workspace_adapter(value):
    """
    Expand "{workspace}" in ``value`` using the "workspace" entry of the
    ``global_envs`` registry.
    """
    return workspace_adapter_by_specific(value, global_envs.get("workspace"))


def workspace_adapter_by_specific(value, workspace):
    """
    Replace every "{workspace}" placeholder in ``value``.

    ``workspace`` is first resolved through ``paddlerec_adapter`` and the
    result is substituted for the placeholder. A ``value`` without the
    placeholder is returned unchanged and ``workspace`` is not looked at,
    so configurations that define no workspace still work.

    Args:
        value (str): text that may contain "{workspace}".
        workspace (str or None): workspace location or "paddlerec." name.

    Returns:
        str: ``value`` with the placeholder expanded.

    Raises:
        ValueError: ``value`` contains the placeholder but ``workspace``
            is None.
    """
    placeholder = "{workspace}"
    if placeholder not in value:
        # Nothing to substitute; avoids failing on a missing workspace.
        return value
    if workspace is None:
        raise ValueError(
            "'{}' uses {} but no workspace is configured".format(
                value, placeholder))
    return value.replace(placeholder, paddlerec_adapter(workspace))
T
tangwei 已提交
145

T
tangwei 已提交
146

T
tangwei 已提交
147 148 149 150 151 152 153 154 155
def reader_adapter():
    """
    On Windows, set the "type" of every entry of ``global_envs["dataset"]``
    to "DataLoader". Does nothing on other platforms, or when the registry
    has no "dataset" entry.
    """
    if get_platform() != "WINDOWS":
        return

    # .get() yields None when the key is absent; iterate nothing in that case.
    for dataset in global_envs.get("dataset") or []:
        dataset["type"] = "DataLoader"


T
tangwei12 已提交
156
def pretty_print_envs(envs, header=None):
    """
    Render ``envs`` as a two-column text table.

    The key column is at least 45 characters wide and grows to fit the
    longest key; the value column is 50 characters wide. A value whose
    string form is 50 characters or longer is shortened to "... " followed
    by its tail. This applies to every value type, so long lists or dicts
    cannot break the table width.

    Args:
        envs (dict): string keys mapped to the values to display.
        header (sequence, optional): two column titles; defaults to
            ("paddlerec Global Envs", "Value").

    Returns:
        str: the table, preceded and followed by a newline.
    """
    spacing = 5
    max_v = 50
    ellipsis = "... "
    max_k = max([45] + [len(k) for k in envs])

    gap = " " * spacing
    h_format = "{{:^{}s}}{}{{:<{}s}}".format(max_k, gap, max_v)
    l_format = "{{:<{}s}}{}{{:<{}s}}".format(max_k, gap, max_v)
    length = max_k + max_v + spacing

    border = "=" * length
    line = "-" * length

    if header:
        titles = (header[0], header[1])
    else:
        titles = ("paddlerec Global Envs", "Value")

    rows = [border, h_format.format(*titles), line]
    for k, v in envs.items():
        str_v = str(v)
        if len(str_v) >= max_v:
            # Keep the tail so the shortened text fills the column exactly.
            str_v = ellipsis + str_v[-(max_v - len(ellipsis)):]
        rows.append(l_format.format(k, str_v))
    rows.append(border)

    return "\n{}\n".format("\n".join(rows))
T
tangwei 已提交
193 194


T
tangwei 已提交
195
def lazy_instance_by_package(package, class_name):
    """
    Import the module named ``package`` and return its attribute
    ``class_name``.

    Any exception raised while importing or looking up the attribute is
    printed (with traceback) and ``None`` is returned instead.
    """
    try:
        # A non-empty fromlist makes __import__ hand back the leaf module
        # of a dotted name rather than its top-level package.
        fromlist = package.split(".")
        module = __import__(package, globals(), locals(), fromlist)
        return getattr(module, class_name)
    except Exception as err:
        traceback.print_exc()
        print('Catch Exception:%s' % str(err))
        return None
T
tangwei 已提交
205 206


T
tangwei 已提交
207
def lazy_instance_by_fliename(abs, class_name):
    """
    Import the Python file at path ``abs`` and return its attribute
    ``class_name``.

    The file's directory is added to ``sys.path`` (once) and the file is
    imported by its base name without extension. Any exception raised on
    the way is printed (with traceback) and ``None`` is returned instead.

    Args:
        abs (str): path of the ``.py`` file to import.
        class_name (str): attribute to fetch from the imported module.
    """
    try:
        dirname = os.path.dirname(abs)
        # Repeated calls for the same directory must not keep growing
        # sys.path with duplicate entries.
        if dirname not in sys.path:
            sys.path.append(dirname)
        package = os.path.splitext(os.path.basename(abs))[0]

        model_package = __import__(package,
                                   globals(), locals(), package.split("."))
        return getattr(model_package, class_name)
    except Exception as err:
        traceback.print_exc()
        print('Catch Exception:%s' % str(err))
        return None
T
tangwei 已提交
221 222


T
tangwei 已提交
223 224 225 226 227 228 229 230 231
def get_platform():
    """
    Identify the host operating system.

    Returns:
        str or None: "LINUX", "DARWIN" or "WINDOWS"; ``None`` for any
        other system.
    """
    import platform

    # platform.system() gives the bare OS name. The longer
    # platform.platform() string starts with "macOS-" instead of "Darwin-"
    # on Python 3.8+, so substring checks against it miss macOS.
    names = {"Linux": "LINUX", "Darwin": "DARWIN", "Windows": "WINDOWS"}
    return names.get(platform.system())
C
chengmo 已提交
232 233 234 235


def find_free_port():
    """
    Return a TCP port number that was free at the time of the call.

    A socket is bound to port 0 so the OS assigns a port, the assigned
    number is read back, and the socket is closed again.
    """
    with closing(socket.socket(socket.AF_INET, socket.SOCK_STREAM)) as sock:
        sock.bind(('', 0))
        bound_address = sock.getsockname()
        return bound_address[1]
X
test  
xjqbest 已提交
242 243 244 245 246 247 248 249 250 251 252 253 254 255 256


def load_yaml(config):
    """
    Read the YAML file at ``config`` and return the parsed content.

    ``yaml.FullLoader`` is used when the installed PyYAML provides it;
    otherwise ``yaml.load`` is called without an explicit loader. On
    Python 3 the file is opened as UTF-8.

    Args:
        config (str): path of the YAML file.

    Returns:
        The object produced by ``yaml.load``.

    Raises:
        ValueError: ``config`` is not an existing file.
    """
    if not os.path.isfile(config):
        raise ValueError("config {} can not be supported".format(config))

    # Detect the loader directly instead of parsing yaml.__version__, which
    # fails on version strings with non-numeric components.
    full_loader = getattr(yaml, "FullLoader", None)

    # Python 2's built-in open() has no ``encoding`` argument.
    open_kwargs = {} if six.PY2 else {"encoding": "utf-8"}
    with open(config, 'r', **open_kwargs) as rb:
        content = rb.read()

    # NOTE(security): neither call is hardened against untrusted YAML;
    # only load configuration files from trusted sources.
    if full_loader is not None:
        return yaml.load(content, Loader=full_loader)
    return yaml.load(content)