envs.py 7.1 KB
Newer Older
T
tangwei 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14
# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

T
tangwei 已提交
15
from contextlib import closing
Y
yaoxuefeng 已提交
16
import yaml
T
tangwei12 已提交
17
import copy
T
tangwei 已提交
18
import os
C
chengmo 已提交
19
import socket
T
tangwei 已提交
20
import sys
X
xionghang 已提交
21
import traceback
T
tangwei 已提交
22

T
tangwei12 已提交
23
# Process-wide configuration store: dotted key -> value.
# Filled by set_global_envs() and read by get_global_env()/get_global_envs().
global_envs = {}
# Second module-level dict; no code visible in this module writes to it.
global_envs_flatten = {}
T
tangwei 已提交
25

X
fix  
xjqbest 已提交
26

T
tangwei 已提交
27
def flatten_environs(envs, separator="."):
    """Flatten a nested dict into a single-level dict of strings.

    Nested dict keys are joined with ``separator`` to form the flat key and
    every leaf value is converted with ``str()``. Only ``dict`` values are
    descended into; lists and other containers are treated as leaves. An
    empty nested dict contributes no entry.

    Args:
        envs (dict): possibly nested configuration mapping.
        separator (str): string placed between the levels of a flat key.

    Returns:
        dict: mapping of joined key path -> ``str(leaf_value)``.

    Raises:
        AssertionError: if ``envs`` is not a dict.
    """
    assert isinstance(envs, dict)
    flatten_dict = {}

    def _flatten(prefix, node):
        if not isinstance(node, dict):
            flatten_dict[separator.join(prefix)] = str(node)
            return
        for key, value in node.items():
            # str(key) keeps non-string keys (e.g. integer YAML keys) from
            # breaking separator.join(); prefix + [...] builds a fresh list,
            # so sibling branches never share state.
            _flatten(prefix + [str(key)], value)

    _flatten([], envs)
    return flatten_dict
T
tangwei 已提交
49

T
tangwei 已提交
50 51 52

def set_runtime_environs(environs):
    """Export every item of ``environs`` into ``os.environ``.

    Args:
        environs (dict): variable name -> value. Values are converted with
            ``str()`` because ``os.environ`` only stores strings.
    """
    for name, value in environs.items():
        os.environ[name] = str(value)
T
tangwei 已提交
54

T
tangwei 已提交
55

T
tangwei 已提交
56
def get_runtime_environ(key):
    """Return the value of environment variable ``key``, or None if unset."""
    return os.getenv(key)

T
tangwei 已提交
59

T
tangwei 已提交
60
def get_trainer():
    """Return the ``train.trainer.trainer`` environment variable (None if unset)."""
    return get_runtime_environ("train.trainer.trainer")


C
Chengmo 已提交
65 66 67 68 69
def get_fleet_mode():
    """Return the ``fleet_mode`` environment variable (None if unset)."""
    return get_runtime_environ("fleet_mode")


T
tangwei 已提交
70
def set_global_envs(envs):
    """Flatten ``envs`` into the module-level ``global_envs`` store.

    Nested dicts become dotted keys ("a.b.c"). Lists found under the keys
    "dataset", "phase" or "runner" are expanded per entry, using the entry's
    "name" field as an extra key level (e.g. "dataset.<name>.batch_size").
    Any other value, including other lists, is stored unchanged.

    After flattening, every string value stored in ``global_envs`` is passed
    through workspace_adapter() and os_path_adapter(). On platforms other
    than Linux the "type" of every dataset is then forced to "DataLoader".

    Args:
        envs (dict): parsed configuration.

    Raises:
        AssertionError: if ``envs`` is not a dict.
        ValueError: if an entry of a dataset/phase/runner list has no "name".
    """
    assert isinstance(envs, dict)

    # Sections whose list entries are keyed by their "name" field.
    named_list_sections = ("dataset", "phase", "runner")

    def fatten_env_namespace(namespace_nests, local_envs):
        for k, v in local_envs.items():
            if isinstance(v, dict):
                fatten_env_namespace(namespace_nests + [k], v)
            elif k in named_list_sections and isinstance(v, list):
                for item in v:
                    if item.get("name") is None:
                        # Name the section actually being processed instead
                        # of always saying "dataset".
                        raise ValueError(
                            "name must be in {} list ".format(k), v)
                    fatten_env_namespace(
                        namespace_nests + [k, item["name"]], item)
            else:
                global_envs[".".join(namespace_nests + [k])] = v

    fatten_env_namespace([], envs)

    # Iterate over a snapshot: values are rewritten in place below.
    for name, value in list(global_envs.items()):
        if isinstance(value, str):
            global_envs[name] = os_path_adapter(workspace_adapter(value))

    if get_platform() != "LINUX":
        # A config without a dataset list must not fail with KeyError here.
        datasets = envs.get("dataset")
        if isinstance(datasets, list):
            for dataset in datasets:
                name = ".".join(["dataset", dataset["name"], "type"])
                global_envs[name] = "DataLoader"

X
fix  
xjqbest 已提交
104

T
tangwei12 已提交
105
def get_global_env(env_name, default_value=None, namespace=None):
    """Look up a value in the module-level ``global_envs`` store.

    Args:
        env_name (str): key to look up.
        default_value: returned when the key is not present.
        namespace (str, optional): when given, the key looked up is
            "<namespace>.<env_name>".

    Returns:
        The stored value, or ``default_value`` if the key is missing.
    """
    if namespace is not None:
        env_name = ".".join([namespace, env_name])
    return global_envs.get(env_name, default_value)


T
tangwei 已提交
114 115 116 117
def get_global_envs():
    """Return the module-level ``global_envs`` dict itself (not a copy)."""
    return global_envs


T
tangwei 已提交
118
def paddlerec_adapter(path):
    """Map a "paddlerec."-prefixed dotted path onto the package directory.

    A path such as "paddlerec.models.rank.dnn" becomes
    "<PACKAGE_BASE>/models/rank/dnn", where PACKAGE_BASE is read from the
    environment. Any path that does not start with "paddlerec." is returned
    unchanged.

    Args:
        path (str): dotted paddlerec path or an ordinary path.

    Returns:
        str: the resolved filesystem path.
    """
    prefix = "paddlerec."
    if not path.startswith(prefix):
        return path

    package = get_runtime_environ("PACKAGE_BASE")
    # Strip only the leading prefix. Splitting on every "paddlerec." would
    # truncate a path in which that text appears again further along.
    relative = path[len(prefix):].replace(".", "/")
    return os.path.join(package, relative)
T
tangwei 已提交
125 126


T
tangwei 已提交
127 128 129 130 131 132
def os_path_adapter(value):
    """Normalise path separators in ``value`` for the current platform.

    On Windows every "/" becomes a backslash; on every other platform every
    backslash becomes "/".
    """
    on_windows = get_platform() == "WINDOWS"
    foreign_sep, native_sep = ("/", "\\") if on_windows else ("\\", "/")
    return value.replace(foreign_sep, native_sep)
T
tangwei 已提交
133 134


T
tangwei 已提交
135
def workspace_adapter(value):
    """Expand the "{workspace}" placeholder in ``value``.

    The replacement is the "workspace" entry of ``global_envs`` after it has
    been resolved by paddlerec_adapter().

    Args:
        value (str): string that may contain "{workspace}".

    Returns:
        str: ``value`` with every placeholder replaced; returned unchanged
        when it contains no placeholder.

    Raises:
        ValueError: if ``value`` contains the placeholder but no workspace
            is configured.
    """
    placeholder = "{workspace}"
    if placeholder not in value:
        # Nothing to expand: do not require a workspace to be configured.
        return value

    workspace = global_envs.get("workspace")
    if workspace is None:
        raise ValueError(
            "'{}' uses {} but no workspace is configured".format(
                value, placeholder))
    return value.replace(placeholder, paddlerec_adapter(workspace))
T
tangwei 已提交
140

T
tangwei 已提交
141

T
tangwei 已提交
142 143 144 145 146 147 148 149 150
def reader_adapter():
    """On Windows, force the "type" of every dataset entry to "DataLoader".

    Does nothing on other platforms. The entries are read from the "dataset"
    key of ``global_envs`` and modified in place.
    """
    if get_platform() != "WINDOWS":
        return

    # NOTE(review): set_global_envs() flattens dataset lists into
    # "dataset.<name>.<field>" keys, so a plain "dataset" key may be absent;
    # treat that as "no datasets" instead of iterating over None.
    for dataset in global_envs.get("dataset") or []:
        dataset["type"] = "DataLoader"


T
tangwei12 已提交
151
def pretty_print_envs(envs, header=None):
    """Render ``envs`` as a two-column text table.

    The key column is at least 45 characters wide and grows to fit the
    longest key; the value column is 50 characters wide. String values of 50
    characters or more are shortened to "... " followed by their tail so
    that they fit the value column.

    Args:
        envs (dict): key -> value pairs to display.
        header (sequence, optional): two column titles; defaults to
            ("paddlerec Global Envs", "Value").

    Returns:
        str: the table, preceded and followed by a newline.
    """
    spacing = 5
    max_v = 50
    ellipsis = "... "
    # Tail length that makes ellipsis + tail exactly fill the value column.
    tail_len = max_v - len(ellipsis)

    # str() so that non-string keys can be measured and formatted.
    rows = [(str(k), v) for k, v in envs.items()]
    max_k = max([45] + [len(k) for k, _ in rows])

    gap = " " * spacing
    h_format = "{{:^{}s}}{}{{:<{}s}}\n".format(max_k, gap, max_v)
    l_format = "{{:<{}s}}{}{{:<{}s}}\n".format(max_k, gap, max_v)
    length = max_k + max_v + spacing

    border = "=" * length
    line = "-" * length

    if header:
        titles = (header[0], header[1])
    else:
        titles = ("paddlerec Global Envs", "Value")

    parts = [border, "\n", h_format.format(*titles), line, "\n"]
    for k, v in rows:
        if isinstance(v, str) and len(v) >= max_v:
            v = ellipsis + v[-tail_len:]
        parts.append(l_format.format(k, str(v)))
    parts.append(border)

    return "\n{}\n".format("".join(parts))
T
tangwei 已提交
188 189


T
tangwei 已提交
190
def lazy_instance_by_package(package, class_name):
    """Import ``package`` and return its attribute named ``class_name``.

    Args:
        package (str): dotted module path, e.g. "pkg.sub.module".
        class_name (str): attribute to fetch from the imported module.

    Returns:
        The attribute, or None if the import or the lookup fails. On failure
        the traceback and the exception message are printed.
    """
    import importlib

    try:
        # import_module returns the leaf module of a dotted path directly.
        model_package = importlib.import_module(package)
        return getattr(model_package, class_name)
    except Exception as err:
        # Deliberate best effort: report the problem, hand back None.
        traceback.print_exc()
        print('Catch Exception:%s' % str(err))
        return None
T
tangwei 已提交
200 201


T
tangwei 已提交
202
def lazy_instance_by_fliename(abs, class_name):
    """Import the Python file ``abs`` and return its attribute ``class_name``.

    The file's directory is added to ``sys.path`` (once) and the file is
    imported under its base name without extension. Because the import is by
    bare module name, a module of the same name that is already imported or
    that sits earlier on ``sys.path`` takes precedence.

    Args:
        abs (str): path to a Python source file.
        class_name (str): attribute to fetch from the imported module.

    Returns:
        The attribute, or None if the import or the lookup fails. On failure
        the traceback and the exception message are printed.
    """
    import importlib

    try:
        dirname = os.path.dirname(abs)
        # Avoid growing sys.path with a duplicate entry on every call.
        if dirname not in sys.path:
            sys.path.append(dirname)
        package = os.path.splitext(os.path.basename(abs))[0]

        model_package = importlib.import_module(package)
        return getattr(model_package, class_name)
    except Exception as err:
        # Deliberate best effort: report the problem, hand back None.
        traceback.print_exc()
        print('Catch Exception:%s' % str(err))
        return None
T
tangwei 已提交
216 217


T
tangwei 已提交
218 219 220 221 222 223 224 225 226
def get_platform():
    """Identify the host operating system.

    Returns:
        str or None: "LINUX", "DARWIN" or "WINDOWS"; None when the platform
        is none of these.
    """
    import platform

    known_systems = (
        ("Linux", "LINUX"),
        ("Darwin", "DARWIN"),
        ("Windows", "WINDOWS"), )

    # platform.system() is checked first: on macOS, platform.platform() may
    # report a "macOS-..." string that does not contain "Darwin".
    system = platform.system()
    for marker, label in known_systems:
        if system == marker:
            return label

    # Fall back to the original substring match on the full platform string.
    plats = platform.platform()
    for marker, label in known_systems:
        if marker in plats:
            return label
    return None
C
chengmo 已提交
227 228 229 230


def find_free_port():
    """Return a TCP port number that was free at the time of the call.

    A socket is bound to port 0 so that the OS picks an unused port; the
    socket is closed again before returning, so the port is not reserved and
    another process may take it before the caller binds to it.

    Returns:
        int: the port number chosen by the OS.
    """
    with closing(socket.socket(socket.AF_INET, socket.SOCK_STREAM)) as sock:
        sock.bind(('', 0))
        return sock.getsockname()[1]
X
test  
xjqbest 已提交
237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259


def load_yaml(config):
    """Parse the YAML file at ``config`` and return the resulting object.

    Args:
        config (str): path to a YAML file.

    Returns:
        The Python object produced by the YAML parser.

    Raises:
        ValueError: if ``config`` is not an existing file.
    """
    if not os.path.isfile(config):
        raise ValueError("config {} can not be supported".format(config))

    # yaml.FullLoader only exists from PyYAML 5.1 on. Detecting it directly
    # selects the same loader as comparing version numbers, without parsing
    # yaml.__version__ (int() fails on pre-release strings such as "5.1b1").
    full_loader = getattr(yaml, "FullLoader", None)

    with open(config, 'r') as stream:
        content = stream.read()

    # NOTE(review): yaml.load is not meant for untrusted input; if configs
    # can come from outside, consider yaml.safe_load instead.
    if full_loader is None:
        return yaml.load(content)
    return yaml.load(content, Loader=full_loader)