setup.py 6.0 KB
Newer Older
H
Hui Zhang 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13
# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
H
Hui Zhang 已提交
14 15
import contextlib
import inspect
H
Hui Zhang 已提交
16 17
import io
import os
H
Hui Zhang 已提交
18
import subprocess as sp
H
Hui Zhang 已提交
19
import sys
H
Hui Zhang 已提交
20
from pathlib import Path
H
Hui Zhang 已提交
21

H
Hui Zhang 已提交
22
from setuptools import Command
H
Hui Zhang 已提交
23 24
from setuptools import find_packages
from setuptools import setup
H
Hui Zhang 已提交
25 26 27
from setuptools.command.develop import develop
from setuptools.command.install import install

H
Hui Zhang 已提交
28
HERE = Path(os.path.abspath(os.path.dirname(__file__)))
H
Hui Zhang 已提交
29

H
huangyuxin 已提交
30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45
requirements = {
    "install": [
        "editdistance",
        "g2p_en",
        "g2pM",
        "h5py",
        "inflect",
        "jieba",
        "jsonlines",
        "kaldiio",
        "librosa",
        "loguru",
        "matplotlib",
        "nara_wpe",
        "nltk",
        "pandas",
K
KP 已提交
46
        "paddleaudio",
H
huangyuxin 已提交
47
        "paddlespeech_feat",
48
        "praatio==5.0.0",
H
huangyuxin 已提交
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68
        "pypinyin",
        "python-dateutil",
        "pyworld",
        "resampy==0.2.2",
        "sacrebleu",
        "scipy",
        "sentencepiece~=0.1.96",
        "soundfile~=0.10",
        "textgrid",
        "timer",
        "tqdm",
        "typeguard",
        "visualdl",
        "webrtcvad",
        "yacs",
    ],
    "develop": [
        "ConfigArgParse",
        "coverage",
        "gpustat",
H
huangyuxin 已提交
69
        "paddlespeech_ctcdecoders",
H
huangyuxin 已提交
70 71 72
        "phkit",
        "Pillow",
        "pybind11",
73
        "pypi-kenlm",
H
huangyuxin 已提交
74
        "snakeviz",
75 76
        "sox",
        "soxbindings",
H
huangyuxin 已提交
77 78 79 80 81 82
        "unidecode",
        "yq",
        "pre-commit",
    ]
}

83

H
Hui Zhang 已提交
84 85 86 87
@contextlib.contextmanager
def pushd(new_dir):
    old_dir = os.getcwd()
    os.chdir(new_dir)
88
    print(new_dir)
H
Hui Zhang 已提交
89 90
    yield
    os.chdir(old_dir)
91
    print(old_dir)
H
Hui Zhang 已提交
92 93


H
Hui Zhang 已提交
94
def read(*names, **kwargs):
H
Hui Zhang 已提交
95 96 97
    with io.open(
            os.path.join(os.path.dirname(__file__), *names),
            encoding=kwargs.get("encoding", "utf8")) as fp:
H
Hui Zhang 已提交
98 99 100
        return fp.read()


H
Hui Zhang 已提交
101
def check_call(cmd: str, shell=False, executable=None):
H
Hui Zhang 已提交
102
    try:
H
Hui Zhang 已提交
103 104 105 106
        sp.check_call(
            cmd.split(),
            shell=shell,
            executable="/bin/bash" if shell else executable)
H
Hui Zhang 已提交
107 108 109 110 111
    except sp.CalledProcessError as e:
        print(
            f"{__file__}:{inspect.currentframe().f_lineno}: CMD: {cmd}, Error:",
            e.output,
            file=sys.stderr)
H
Hui Zhang 已提交
112
        raise e
H
Hui Zhang 已提交
113 114


115 116 117 118 119 120
def _remove(files: str):
    for f in files:
        f.unlink()


def _post_install(install_lib_dir):
H
Hui Zhang 已提交
121 122
    # tools/make
    tool_dir = HERE / "tools"
123
    _remove(tool_dir.glob("*.done"))
H
Hui Zhang 已提交
124
    with pushd(tool_dir):
H
Hui Zhang 已提交
125
        check_call("make")
H
Hui Zhang 已提交
126
    print("tools install.")
H
Hui Zhang 已提交
127

H
Hui Zhang 已提交
128
    # ctcdecoder
129
    ctcdecoder_dir = HERE / 'paddlespeech/s2t/decoders/ctcdecoder/swig'
H
Hui Zhang 已提交
130 131 132 133
    with pushd(ctcdecoder_dir):
        check_call("bash -e setup.sh")
    print("ctcdecoder install.")

H
Hui Zhang 已提交
134

H
Hui Zhang 已提交
135 136 137
class DevelopCommand(develop):
    def run(self):
        develop.run(self)
138
        # must after develop.run, or pkg install by shell will not see
H
Hui Zhang 已提交
139 140 141 142 143 144 145 146
        self.execute(_post_install, (self.install_lib, ), msg="Post Install...")


class InstallCommand(install):
    def run(self):
        install.run(self)


147
    # cmd: python setup.py upload
H
Hui Zhang 已提交
148 149 150 151 152 153 154 155 156 157 158 159 160
class UploadCommand(Command):
    description = "Build and publish the package."
    user_options = []

    def initialize_options(self):
        pass

    def finalize_options(self):
        pass

    def run(self):
        try:
            print("Removing previous dist/ ...")
H
Hui Zhang 已提交
161
            shutil.rmtree(str(HERE / "dist"))
H
Hui Zhang 已提交
162 163 164 165 166 167 168 169 170
        except OSError:
            pass
        print("Building source distribution...")
        sp.check_call([sys.executable, "setup.py", "sdist"])
        print("Uploading package to PyPi...")
        sp.check_call(["twine", "upload", "dist/*"])
        sys.exit()


H
Hui Zhang 已提交
171 172
setup_info = dict(
    # Metadata
H
Hui Zhang 已提交
173
    name='paddlespeech',
174
    version='0.1.0',
175 176 177 178
    author='PaddlePaddle Speech and Language Team',
    author_email='paddlesl@baidu.com',
    url='https://github.com/PaddlePaddle/PaddleSpeech',
    license='Apache 2.0',
H
Hui Zhang 已提交
179
    description='Speech tools and models based on Paddlepaddle',
H
Hui Zhang 已提交
180
    long_description=read("README.md"),
H
Hui Zhang 已提交
181
    long_description_content_type="text/markdown",
H
Hui Zhang 已提交
182 183 184 185
    keywords=[
        "speech",
        "asr",
        "tts",
186 187
        "speaker verfication",
        "speech classfication",
H
Hui Zhang 已提交
188 189 190
        "text frontend",
        "MFA",
        "paddlepaddle",
191 192 193
        "beam search",
        "ctcdecoder",
        "deepspeech2",
H
Hui Zhang 已提交
194 195 196 197 198 199 200
        "transformer",
        "conformer",
        "fastspeech",
        "vocoder",
        "pwgan",
        "gan",
    ],
H
huangyuxin 已提交
201
    python_requires='>=3.7',
H
huangyuxin 已提交
202
    install_requires=requirements["install"],
H
Hui Zhang 已提交
203
    extras_require={
H
huangyuxin 已提交
204 205
        'develop':
        requirements["develop"],
H
Hui Zhang 已提交
206 207 208 209
        'doc': [
            "sphinx", "sphinx-rtd-theme", "numpydoc", "myst_parser",
            "recommonmark>=0.5.0", "sphinx-markdown-tables", "sphinx-autobuild"
        ],
H
Hui Zhang 已提交
210
    },
H
Hui Zhang 已提交
211 212 213 214 215
    cmdclass={
        'develop': DevelopCommand,
        'install': InstallCommand,
        'upload': UploadCommand,
    },
H
Hui Zhang 已提交
216 217

    # Package info
J
Jackwaterveg 已提交
218
    packages=find_packages(include=('paddlespeech*')),
H
Hui Zhang 已提交
219 220
    zip_safe=True,
    classifiers=[
221
        'Development Status :: 5 - Production/Stable',
H
Hui Zhang 已提交
222 223 224 225
        'Intended Audience :: Developers',
        'Intended Audience :: Science/Research',
        'Topic :: Scientific/Engineering :: Artificial Intelligence',
        'License :: OSI Approved :: Apache Software License',
H
Hui Zhang 已提交
226 227
        'Programming Language :: Python',
        'Programming Language :: Python :: 3',
H
Hui Zhang 已提交
228
        'Programming Language :: Python :: 3.7',
H
Hui Zhang 已提交
229
        'Programming Language :: Python :: 3.8',
230
        'Programming Language :: Python :: 3.9',
K
KP 已提交
231 232 233 234
    ],
    entry_points={
        'console_scripts': ['paddlespeech=paddlespeech.cli.entry:_execute']
    })
H
Hui Zhang 已提交
235 236

setup(**setup_info)