__init__.py 4.5 KB
Newer Older
1
#   Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
D
dzhwinter 已提交
2
#
D
dzhwinter 已提交
3 4 5
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
D
dzhwinter 已提交
6
#
D
dzhwinter 已提交
7
#     http://www.apache.org/licenses/LICENSE-2.0
D
dzhwinter 已提交
8
#
D
dzhwinter 已提交
9 10 11 12 13 14
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

Y
Yang Yu 已提交
15
from __future__ import print_function
16
# import all classes inside framework into the fluid module
17 18
from . import framework
from .framework import *
Y
Yang Yu 已提交
19
# import all classes inside executor into the fluid module
20 21 22 23
from . import executor
from .executor import *
from . import trainer
from . import inferencer
H
Helin Wang 已提交
24

25 26 27 28 29 30 31 32 33 34 35 36 37 38 39
from . import io
from . import evaluator
from . import initializer
from . import layers
from . import contrib
from . import nets
from . import optimizer
from . import backward
from . import regularizer
from . import average
from . import metrics
from . import transpiler
from .param_attr import ParamAttr, WeightNormParamAttr
from .data_feeder import DataFeeder
from .core import LoDTensor, LoDTensorArray, CPUPlace, CUDAPlace, CUDAPinnedPlace, Scope
40
from .transpiler import DistributeTranspiler, \
G
gongweibao 已提交
41
    memory_optimize, release_memory, DistributeTranspilerConfig
42 43 44 45 46 47 48
from .lod_tensor import create_lod_tensor, create_random_int_lodtensor
from . import clip
from . import profiler
from . import unique_name
from . import recordio_writer
from . import parallel_executor
from .parallel_executor import *
X
Xin Pan 已提交
49
from paddle.fluid.layers.math_op_patch import monkey_patch_variable
50 51

# `Tensor` is a second name for the LoDTensor class imported from .core;
# both names are listed in `__all__`.
Tensor = LoDTensor
Y
Yang Yu 已提交
52

W
Wu Yi 已提交
53
# Public names of this package: everything the listed submodules export via
# their own `__all__`, followed by the submodules and core types named
# explicitly below.
# `lod_tensor` is usable here because importing from `.lod_tensor` above
# binds the submodule as an attribute of this package.
# NOTE(review): 'learning_rate_decay' is exported but is not imported
# explicitly anywhere in this file -- confirm that a submodule or a
# star-imported name provides it, otherwise a star import of this package
# fails on that entry.
__all__ = (
    framework.__all__ + executor.__all__ + trainer.__all__ +
    inferencer.__all__ + transpiler.__all__ + parallel_executor.__all__ +
    lod_tensor.__all__ + [
        'io',
        'initializer',
        'layers',
        'contrib',
        'transpiler',
        'nets',
        'optimizer',
        'learning_rate_decay',
        'backward',
        'regularizer',
        'LoDTensor',
        'LoDTensorArray',
        'CPUPlace',
        'CUDAPlace',
        'CUDAPinnedPlace',
        'Tensor',
        'ParamAttr',
        'WeightNormParamAttr',
        'DataFeeder',
        'clip',
        'profiler',
        'unique_name',
        'recordio_writer',
        'Scope',
    ])
81 82


Y
Yang Yu 已提交
83
def __bootstrap__():
    """
    Set up the core runtime so that gflags can be read from environment
    variables.

    Steps, in order:
      1. Parse OMP_NUM_THREADS (anything that is not an integer counts as
         1), warn on stderr when it is greater than 1, and write the parsed
         value back into the environment.
      2. Collect the names of the gflags that may come from the
         environment, adding the RPC flags when core reports a distributed
         build and the GPU flags when core reports a CUDA build.
      3. Pass those names to core.init_gflags through ``--tryfromenv``,
         then call core.init_glog and core.init_devices.

    Returns:
        None
    """
    import sys
    import os
    from . import core

    running_unittest = 'unittest' in sys.modules

    omp_setting = os.getenv('OMP_NUM_THREADS', '1')
    try:
        thread_count = int(omp_setting)
    except ValueError:
        # A non-numeric setting is treated as a single thread.
        thread_count = 1

    if thread_count > 1:
        omp_warning = (
            'WARNING: OMP_NUM_THREADS set to {0}, not 1. The computation '
            'speed will not be optimized if you use data parallel. It will '
            'fail if this PaddlePaddle binary is compiled with OpenBlas since'
            ' OpenBlas does not support multi-threads.').format(thread_count)
        print(omp_warning, file=sys.stderr)
        print('PLEASE USE OMP_NUM_THREADS WISELY.', file=sys.stderr)

    # Always export the parsed value, including the default of 1 when the
    # variable was unset or invalid.
    os.environ['OMP_NUM_THREADS'] = str(thread_count)

    env_flag_names = [
        'use_pinned_memory',
        'check_nan_inf',
        'benchmark',
        'warpctc_dir',
        'eager_delete_scope',
        'use_mkldnn',
        'initial_cpu_memory_in_mb',
        'init_allocated_mem',
        'free_idle_memory',
        'paddle_num_threads',
        'dist_threadpool_size',
        'cpu_deterministic',
        'eager_delete_tensor_gb',
        'reader_queue_speed_test_mode',
    ]

    # RPC-related flags are only registered for distributed builds.
    if core.is_compiled_with_dist():
        env_flag_names.extend([
            'rpc_deadline',
            'rpc_server_profile_period',
            'rpc_server_profile_path',
            'enable_rpc_profiler',
            'rpc_send_thread_num',
            'rpc_get_thread_num',
            'rpc_prefetch_thread_num',
        ])

    # GPU-related flags are only registered for CUDA builds.
    if core.is_compiled_with_cuda():
        env_flag_names.extend(
            ['fraction_of_gpu_memory_to_use', 'cudnn_deterministic'])

    tryfromenv_arg = "--tryfromenv=" + ",".join(env_flag_names)
    core.init_gflags([sys.argv[0], tryfromenv_arg])
    core.init_glog(sys.argv[0])
    # don't init_p2p when in unittest to save time.
    core.init_devices(not running_unittest)
D
dzhwinter 已提交
137

138

X
Xin Pan 已提交
139 140
# TODO(panyx0718): Avoid doing complex initialization logic in __init__.py.
# Consider paddle.init(args) or paddle.main(args)
X
Xin Pan 已提交
141
# Executed once at import time, before __bootstrap__(); the function comes
# from paddle.fluid.layers.math_op_patch.
# NOTE(review): presumably attaches math operators to Variable -- confirm
# in math_op_patch.
monkey_patch_variable()
Y
Yang Yu 已提交
142
# Import-time side effect: initialize gflags, glog and devices through core
# as soon as this package is imported.
__bootstrap__()