setup.py 6.3 KB
Newer Older
H
Hui Zhang 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13
# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
H
Hui Zhang 已提交
14 15
import contextlib
import inspect
H
Hui Zhang 已提交
16 17
import io
import os
H
Hui Zhang 已提交
18
import subprocess as sp
H
Hui Zhang 已提交
19
import sys
H
Hui Zhang 已提交
20
from pathlib import Path
H
Hui Zhang 已提交
21

H
Hui Zhang 已提交
22
from setuptools import Command
H
Hui Zhang 已提交
23 24
from setuptools import find_packages
from setuptools import setup
H
Hui Zhang 已提交
25 26 27
from setuptools.command.develop import develop
from setuptools.command.install import install

H
Hui Zhang 已提交
28
HERE = Path(os.path.abspath(os.path.dirname(__file__)))
H
Hui Zhang 已提交
29

H
huangyuxin 已提交
30 31 32 33 34 35 36 37 38 39 40 41 42 43 44
requirements = {
    "install": [
        "editdistance",
        "g2p_en",
        "g2pM",
        "h5py",
        "inflect",
        "jieba",
        "jsonlines",
        "kaldiio",
        "librosa",
        "loguru",
        "matplotlib",
        "nara_wpe",
        "pandas",
K
KP 已提交
45
        "paddleaudio",
46
        "paddlenlp",
H
huangyuxin 已提交
47
        "paddlespeech_feat",
48
        "praatio==5.0.0",
H
huangyuxin 已提交
49 50 51 52 53 54 55 56 57 58 59 60 61 62
        "pypinyin",
        "python-dateutil",
        "pyworld",
        "resampy==0.2.2",
        "sacrebleu",
        "scipy",
        "sentencepiece~=0.1.96",
        "soundfile~=0.10",
        "textgrid",
        "timer",
        "tqdm",
        "typeguard",
        "visualdl",
        "webrtcvad",
63
        "yacs~=0.1.8",
L
liangym 已提交
64 65 66
        # fastapi server
        "fastapi",
        "uvicorn",
H
huangyuxin 已提交
67 68 69 70 71
    ],
    "develop": [
        "ConfigArgParse",
        "coverage",
        "gpustat",
H
huangyuxin 已提交
72
        "paddlespeech_ctcdecoders",
H
huangyuxin 已提交
73 74 75
        "phkit",
        "Pillow",
        "pybind11",
76
        "pypi-kenlm",
H
huangyuxin 已提交
77
        "snakeviz",
78 79
        "sox",
        "soxbindings",
H
huangyuxin 已提交
80 81 82
        "unidecode",
        "yq",
        "pre-commit",
H
huangyuxin 已提交
83
        "zhon",
H
huangyuxin 已提交
84 85 86
    ]
}

87

H
Hui Zhang 已提交
88 89 90 91
@contextlib.contextmanager
def pushd(new_dir):
    old_dir = os.getcwd()
    os.chdir(new_dir)
92
    print(new_dir)
H
Hui Zhang 已提交
93 94
    yield
    os.chdir(old_dir)
95
    print(old_dir)
H
Hui Zhang 已提交
96 97


H
Hui Zhang 已提交
98
def read(*names, **kwargs):
H
Hui Zhang 已提交
99 100 101
    with io.open(
            os.path.join(os.path.dirname(__file__), *names),
            encoding=kwargs.get("encoding", "utf8")) as fp:
H
Hui Zhang 已提交
102 103 104
        return fp.read()


H
Hui Zhang 已提交
105
def check_call(cmd: str, shell=False, executable=None):
H
Hui Zhang 已提交
106
    try:
H
Hui Zhang 已提交
107 108 109 110
        sp.check_call(
            cmd.split(),
            shell=shell,
            executable="/bin/bash" if shell else executable)
H
Hui Zhang 已提交
111 112 113 114 115
    except sp.CalledProcessError as e:
        print(
            f"{__file__}:{inspect.currentframe().f_lineno}: CMD: {cmd}, Error:",
            e.output,
            file=sys.stderr)
H
Hui Zhang 已提交
116
        raise e
H
Hui Zhang 已提交
117 118


119 120 121 122 123 124
def _remove(files: str):
    for f in files:
        f.unlink()


def _post_install(install_lib_dir):
H
Hui Zhang 已提交
125 126
    # tools/make
    tool_dir = HERE / "tools"
127
    _remove(tool_dir.glob("*.done"))
H
Hui Zhang 已提交
128
    with pushd(tool_dir):
H
Hui Zhang 已提交
129
        check_call("make")
H
Hui Zhang 已提交
130
    print("tools install.")
H
Hui Zhang 已提交
131

H
Hui Zhang 已提交
132
    # ctcdecoder
133
    ctcdecoder_dir = HERE / 'third_party/ctc_decoders'
H
Hui Zhang 已提交
134 135 136 137
    with pushd(ctcdecoder_dir):
        check_call("bash -e setup.sh")
    print("ctcdecoder install.")

H
Hui Zhang 已提交
138

H
Hui Zhang 已提交
139 140 141
class DevelopCommand(develop):
    def run(self):
        develop.run(self)
142
        # must after develop.run, or pkg install by shell will not see
H
Hui Zhang 已提交
143 144 145 146 147 148 149 150
        self.execute(_post_install, (self.install_lib, ), msg="Post Install...")


class InstallCommand(install):
    def run(self):
        install.run(self)


151
    # cmd: python setup.py upload
H
Hui Zhang 已提交
152 153 154 155 156 157 158 159 160 161 162 163 164
class UploadCommand(Command):
    description = "Build and publish the package."
    user_options = []

    def initialize_options(self):
        pass

    def finalize_options(self):
        pass

    def run(self):
        try:
            print("Removing previous dist/ ...")
H
Hui Zhang 已提交
165
            shutil.rmtree(str(HERE / "dist"))
H
Hui Zhang 已提交
166 167 168 169 170 171 172 173 174
        except OSError:
            pass
        print("Building source distribution...")
        sp.check_call([sys.executable, "setup.py", "sdist"])
        print("Uploading package to PyPi...")
        sp.check_call(["twine", "upload", "dist/*"])
        sys.exit()


H
Hui Zhang 已提交
175 176
setup_info = dict(
    # Metadata
H
Hui Zhang 已提交
177
    name='paddlespeech',
H
huangyuxin 已提交
178
    version='0.1.1',
179 180 181 182
    author='PaddlePaddle Speech and Language Team',
    author_email='paddlesl@baidu.com',
    url='https://github.com/PaddlePaddle/PaddleSpeech',
    license='Apache 2.0',
H
Hui Zhang 已提交
183
    description='Speech tools and models based on Paddlepaddle',
H
Hui Zhang 已提交
184
    long_description=read("README.md"),
H
Hui Zhang 已提交
185
    long_description_content_type="text/markdown",
H
Hui Zhang 已提交
186 187 188 189
    keywords=[
        "speech",
        "asr",
        "tts",
190 191
        "speaker verfication",
        "speech classfication",
H
Hui Zhang 已提交
192 193 194
        "text frontend",
        "MFA",
        "paddlepaddle",
195 196 197
        "beam search",
        "ctcdecoder",
        "deepspeech2",
H
Hui Zhang 已提交
198 199 200 201 202 203 204
        "transformer",
        "conformer",
        "fastspeech",
        "vocoder",
        "pwgan",
        "gan",
    ],
H
huangyuxin 已提交
205
    python_requires='>=3.7',
H
huangyuxin 已提交
206
    install_requires=requirements["install"],
H
Hui Zhang 已提交
207
    extras_require={
H
huangyuxin 已提交
208 209
        'develop':
        requirements["develop"],
H
Hui Zhang 已提交
210 211 212 213
        'doc': [
            "sphinx", "sphinx-rtd-theme", "numpydoc", "myst_parser",
            "recommonmark>=0.5.0", "sphinx-markdown-tables", "sphinx-autobuild"
        ],
H
Hui Zhang 已提交
214
    },
H
Hui Zhang 已提交
215 216 217 218 219
    cmdclass={
        'develop': DevelopCommand,
        'install': InstallCommand,
        'upload': UploadCommand,
    },
H
Hui Zhang 已提交
220 221

    # Package info
J
Jackwaterveg 已提交
222
    packages=find_packages(include=('paddlespeech*')),
H
Hui Zhang 已提交
223 224
    zip_safe=True,
    classifiers=[
225
        'Development Status :: 5 - Production/Stable',
H
Hui Zhang 已提交
226 227 228 229
        'Intended Audience :: Developers',
        'Intended Audience :: Science/Research',
        'Topic :: Scientific/Engineering :: Artificial Intelligence',
        'License :: OSI Approved :: Apache Software License',
H
Hui Zhang 已提交
230 231
        'Programming Language :: Python',
        'Programming Language :: Python :: 3',
H
Hui Zhang 已提交
232
        'Programming Language :: Python :: 3.7',
H
Hui Zhang 已提交
233
        'Programming Language :: Python :: 3.8',
234
        'Programming Language :: Python :: 3.9',
K
KP 已提交
235 236
    ],
    entry_points={
L
lym0302 已提交
237 238
        'console_scripts': [
            'paddlespeech=paddlespeech.cli.entry:_execute',
L
lym0302 已提交
239 240
            'paddlespeech_server=paddlespeech.server.entry:server_execute',
            'paddlespeech_client=paddlespeech.server.entry:client_execute'
L
lym0302 已提交
241
        ]
K
KP 已提交
242
    })
H
Hui Zhang 已提交
243 244

setup(**setup_info)