setup.py 6.0 KB
Newer Older
H
Hui Zhang 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13
# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
H
Hui Zhang 已提交
14 15
import contextlib
import inspect
H
Hui Zhang 已提交
16 17
import io
import os
H
Hui Zhang 已提交
18
import subprocess as sp
H
Hui Zhang 已提交
19
import sys
H
Hui Zhang 已提交
20
from pathlib import Path
H
Hui Zhang 已提交
21

H
Hui Zhang 已提交
22
from setuptools import Command
H
Hui Zhang 已提交
23 24
from setuptools import find_packages
from setuptools import setup
H
Hui Zhang 已提交
25 26 27
from setuptools.command.develop import develop
from setuptools.command.install import install

H
Hui Zhang 已提交
28
HERE = Path(os.path.abspath(os.path.dirname(__file__)))
H
Hui Zhang 已提交
29

H
huangyuxin 已提交
30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45
requirements = {
    "install": [
        "editdistance",
        "g2p_en",
        "g2pM",
        "h5py",
        "inflect",
        "jieba",
        "jsonlines",
        "kaldiio",
        "librosa",
        "loguru",
        "matplotlib",
        "nara_wpe",
        "nltk",
        "pandas",
K
KP 已提交
46
        "paddleaudio",
47
        "paddlenlp",
H
huangyuxin 已提交
48
        "paddlespeech_feat",
49
        "praatio==5.0.0",
H
huangyuxin 已提交
50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69
        "pypinyin",
        "python-dateutil",
        "pyworld",
        "resampy==0.2.2",
        "sacrebleu",
        "scipy",
        "sentencepiece~=0.1.96",
        "soundfile~=0.10",
        "textgrid",
        "timer",
        "tqdm",
        "typeguard",
        "visualdl",
        "webrtcvad",
        "yacs",
    ],
    "develop": [
        "ConfigArgParse",
        "coverage",
        "gpustat",
H
huangyuxin 已提交
70
        "paddlespeech_ctcdecoders",
H
huangyuxin 已提交
71 72 73
        "phkit",
        "Pillow",
        "pybind11",
74
        "pypi-kenlm",
H
huangyuxin 已提交
75
        "snakeviz",
76 77
        "sox",
        "soxbindings",
H
huangyuxin 已提交
78 79 80 81 82 83
        "unidecode",
        "yq",
        "pre-commit",
    ]
}

84

H
Hui Zhang 已提交
85 86 87 88
@contextlib.contextmanager
def pushd(new_dir):
    old_dir = os.getcwd()
    os.chdir(new_dir)
89
    print(new_dir)
H
Hui Zhang 已提交
90 91
    yield
    os.chdir(old_dir)
92
    print(old_dir)
H
Hui Zhang 已提交
93 94


H
Hui Zhang 已提交
95
def read(*names, **kwargs):
H
Hui Zhang 已提交
96 97 98
    with io.open(
            os.path.join(os.path.dirname(__file__), *names),
            encoding=kwargs.get("encoding", "utf8")) as fp:
H
Hui Zhang 已提交
99 100 101
        return fp.read()


H
Hui Zhang 已提交
102
def check_call(cmd: str, shell=False, executable=None):
H
Hui Zhang 已提交
103
    try:
H
Hui Zhang 已提交
104 105 106 107
        sp.check_call(
            cmd.split(),
            shell=shell,
            executable="/bin/bash" if shell else executable)
H
Hui Zhang 已提交
108 109 110 111 112
    except sp.CalledProcessError as e:
        print(
            f"{__file__}:{inspect.currentframe().f_lineno}: CMD: {cmd}, Error:",
            e.output,
            file=sys.stderr)
H
Hui Zhang 已提交
113
        raise e
H
Hui Zhang 已提交
114 115


116 117 118 119 120 121
def _remove(files: str):
    for f in files:
        f.unlink()


def _post_install(install_lib_dir):
H
Hui Zhang 已提交
122 123
    # tools/make
    tool_dir = HERE / "tools"
124
    _remove(tool_dir.glob("*.done"))
H
Hui Zhang 已提交
125
    with pushd(tool_dir):
H
Hui Zhang 已提交
126
        check_call("make")
H
Hui Zhang 已提交
127
    print("tools install.")
H
Hui Zhang 已提交
128

H
Hui Zhang 已提交
129
    # ctcdecoder
130
    ctcdecoder_dir = HERE / 'paddlespeech/s2t/decoders/ctcdecoder/swig'
H
Hui Zhang 已提交
131 132 133 134
    with pushd(ctcdecoder_dir):
        check_call("bash -e setup.sh")
    print("ctcdecoder install.")

H
Hui Zhang 已提交
135

H
Hui Zhang 已提交
136 137 138
class DevelopCommand(develop):
    def run(self):
        develop.run(self)
139
        # must after develop.run, or pkg install by shell will not see
H
Hui Zhang 已提交
140 141 142 143 144 145 146 147
        self.execute(_post_install, (self.install_lib, ), msg="Post Install...")


class InstallCommand(install):
    def run(self):
        install.run(self)


148
    # cmd: python setup.py upload
H
Hui Zhang 已提交
149 150 151 152 153 154 155 156 157 158 159 160 161
class UploadCommand(Command):
    description = "Build and publish the package."
    user_options = []

    def initialize_options(self):
        pass

    def finalize_options(self):
        pass

    def run(self):
        try:
            print("Removing previous dist/ ...")
H
Hui Zhang 已提交
162
            shutil.rmtree(str(HERE / "dist"))
H
Hui Zhang 已提交
163 164 165 166 167 168 169 170 171
        except OSError:
            pass
        print("Building source distribution...")
        sp.check_call([sys.executable, "setup.py", "sdist"])
        print("Uploading package to PyPi...")
        sp.check_call(["twine", "upload", "dist/*"])
        sys.exit()


H
Hui Zhang 已提交
172 173
setup_info = dict(
    # Metadata
H
Hui Zhang 已提交
174
    name='paddlespeech',
175
    version='0.1.0',
176 177 178 179
    author='PaddlePaddle Speech and Language Team',
    author_email='paddlesl@baidu.com',
    url='https://github.com/PaddlePaddle/PaddleSpeech',
    license='Apache 2.0',
H
Hui Zhang 已提交
180
    description='Speech tools and models based on Paddlepaddle',
H
Hui Zhang 已提交
181
    long_description=read("README.md"),
H
Hui Zhang 已提交
182
    long_description_content_type="text/markdown",
H
Hui Zhang 已提交
183 184 185 186
    keywords=[
        "speech",
        "asr",
        "tts",
187 188
        "speaker verfication",
        "speech classfication",
H
Hui Zhang 已提交
189 190 191
        "text frontend",
        "MFA",
        "paddlepaddle",
192 193 194
        "beam search",
        "ctcdecoder",
        "deepspeech2",
H
Hui Zhang 已提交
195 196 197 198 199 200 201
        "transformer",
        "conformer",
        "fastspeech",
        "vocoder",
        "pwgan",
        "gan",
    ],
H
huangyuxin 已提交
202
    python_requires='>=3.7',
H
huangyuxin 已提交
203
    install_requires=requirements["install"],
H
Hui Zhang 已提交
204
    extras_require={
H
huangyuxin 已提交
205 206
        'develop':
        requirements["develop"],
H
Hui Zhang 已提交
207 208 209 210
        'doc': [
            "sphinx", "sphinx-rtd-theme", "numpydoc", "myst_parser",
            "recommonmark>=0.5.0", "sphinx-markdown-tables", "sphinx-autobuild"
        ],
H
Hui Zhang 已提交
211
    },
H
Hui Zhang 已提交
212 213 214 215 216
    cmdclass={
        'develop': DevelopCommand,
        'install': InstallCommand,
        'upload': UploadCommand,
    },
H
Hui Zhang 已提交
217 218

    # Package info
J
Jackwaterveg 已提交
219
    packages=find_packages(include=('paddlespeech*')),
H
Hui Zhang 已提交
220 221
    zip_safe=True,
    classifiers=[
222
        'Development Status :: 5 - Production/Stable',
H
Hui Zhang 已提交
223 224 225 226
        'Intended Audience :: Developers',
        'Intended Audience :: Science/Research',
        'Topic :: Scientific/Engineering :: Artificial Intelligence',
        'License :: OSI Approved :: Apache Software License',
H
Hui Zhang 已提交
227 228
        'Programming Language :: Python',
        'Programming Language :: Python :: 3',
H
Hui Zhang 已提交
229
        'Programming Language :: Python :: 3.7',
H
Hui Zhang 已提交
230
        'Programming Language :: Python :: 3.8',
231
        'Programming Language :: Python :: 3.9',
K
KP 已提交
232 233 234 235
    ],
    entry_points={
        'console_scripts': ['paddlespeech=paddlespeech.cli.entry:_execute']
    })
H
Hui Zhang 已提交
236 237

setup(**setup_info)