PaddleSpeech/setup.py

# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import contextlib
import inspect
import io
import os
import shlex
import shutil
import subprocess as sp
import sys
from pathlib import Path
from typing import Iterable

from setuptools import Command
from setuptools import find_packages
from setuptools import setup
from setuptools.command.develop import develop
from setuptools.command.install import install
from setuptools.command.test import test

# Absolute path of the directory that contains this setup script.
HERE = Path(os.path.dirname(os.path.abspath(__file__)))

# Version string handed to setup() and stamped into the package file.
VERSION = '0.0.0'
# Placeholder commit id.
COMMITID = 'none'

# Runtime dependencies. Entries carrying ``==``, ``~=``, ``<=`` or a range
# are version-constrained; the rest accept any released version.
base = [
    "editdistance",
    "g2p_en",
    "g2pM",
    "h5py",
    "inflect",
    "jieba",
    "jsonlines",
    "kaldiio",
    "librosa==0.8.1",
    "loguru",
    "matplotlib",
    "nara_wpe",
    "onnxruntime==1.10.0",
    "opencc",
    "pandas",
    "paddlenlp",
    "paddlespeech_feat",
    "Pillow>=9.0.0",
    "praatio==5.0.0",
    "protobuf>=3.1.0, <=3.20.0",
    "pypinyin<=0.44.0",
    "pypinyin-dict",
    "python-dateutil",
    "pyworld==0.2.12",
    "resampy==0.2.2",
    "sacrebleu",
    "scipy",
    "sentencepiece~=0.1.96",
    "soundfile~=0.10",
    "textgrid",
    "timer",
    "tqdm",
    "typeguard",
    "visualdl",
    "webrtcvad",
    "yacs~=0.1.8",
    "prettytable",
    "zhon",
    "colorlog",
    "pathos == 0.2.8",
    "braceexpand",
    "pyyaml",
    "pybind11",
]

# Additional packages that are combined with ``base`` for a default install.
server = [
    "fastapi",
    "uvicorn",
    "pattern_singleton",
    "websockets",
]

# Requirement sets keyed by purpose: "install" feeds install_requires,
# "develop" feeds the ``develop`` extra.
requirements = dict(
    install=[*base, *server],
    develop=[
        "ConfigArgParse",
        "coverage",
        "gpustat",
        "paddlespeech_ctcdecoders",
        "phkit",
        "pypi-kenlm",
        "snakeviz",
        "sox",
        "soxbindings",
        "unidecode",
        "yq",
        "pre-commit",
    ],
)


def check_call(cmd: str, shell=False, executable=None):
    """Run ``cmd`` and raise if it exits with a non-zero status.

    Args:
        cmd: The command line as a single string.
        shell: When true, ``cmd`` is passed unmodified to ``/bin/bash`` so
            that shell syntax in the string is interpreted by bash.
        executable: Replacement program to execute. Ignored when ``shell``
            is true, because ``/bin/bash`` is forced in that case.

    Raises:
        subprocess.CalledProcessError: If the command exits non-zero. The
            failing command and its return code are printed to stderr
            before the exception is re-raised.
    """
    # With shell=True subprocess expects the whole command as one string; a
    # list would make bash run only its first item and treat the rest as
    # positional parameters. Without a shell, tokenize with shlex so quoted
    # arguments stay intact (non-POSIX mode on Windows keeps backslashes).
    args = cmd if shell else shlex.split(cmd, posix=os.name != "nt")
    try:
        sp.check_call(
            args,
            shell=shell,
            executable="/bin/bash" if shell else executable)
    except sp.CalledProcessError as e:
        # check_call() does not capture output, so e.output is always None;
        # the return code is the only useful detail available here.
        print(
            f"{__file__}:{inspect.currentframe().f_lineno}: CMD: {cmd}, Error:",
            e.returncode,
            file=sys.stderr)
        raise


def check_output(cmd: str, shell=False):
    """Run ``cmd`` and return its stdout, stripped and decoded as UTF-8.

    This is best-effort: a non-zero exit status does not raise. Whatever
    the command wrote to stdout before failing is returned, and the failure
    is reported on stderr.

    Args:
        cmd: The command line as a single string.
        shell: When true, ``cmd`` is passed unmodified to the system shell;
            otherwise it is tokenized and executed directly.

    Returns:
        The captured standard output with surrounding whitespace removed.
    """
    # A shell needs the raw string; direct execution needs a token list.
    # shlex keeps quoted arguments together (non-POSIX mode on Windows so
    # backslashes in paths are preserved).
    args = cmd if shell else shlex.split(cmd, posix=os.name != "nt")
    try:
        out_bytes = sp.check_output(args, shell=shell)
    except sp.CalledProcessError as e:
        out_bytes = e.output  # Output generated before error
        print(
            f"{__file__}:{inspect.currentframe().f_lineno}: CMD: {cmd}, Error:",
            out_bytes,
            file=sys.stderr)
    return out_bytes.strip().decode('utf8')


@contextlib.contextmanager
def pushd(new_dir):
    """Temporarily change the working directory to ``new_dir``.

    The directory that was current on entry is restored when the ``with``
    block exits, whether it finishes normally or raises. Both directory
    changes are echoed to stdout.

    Args:
        new_dir: Directory to switch into for the duration of the block.
    """
    old_dir = os.getcwd()
    os.chdir(new_dir)
    print(new_dir)
    try:
        yield
    finally:
        # Restore even on failure so later steps do not run in the wrong
        # directory.
        os.chdir(old_dir)
        print(old_dir)


def read(*names, **kwargs):
    """Return the text of a file addressed relative to this script.

    Args:
        *names: Path components joined onto the directory that contains
            this file.
        **kwargs: Only ``encoding`` is consulted (default ``"utf8"``); any
            other keyword is ignored.

    Returns:
        The entire file content as a string.
    """
    script_dir = os.path.dirname(__file__)
    target = os.path.join(script_dir, *names)
    encoding = kwargs.get("encoding", "utf8")
    with io.open(target, encoding=encoding) as handle:
        text = handle.read()
    return text


def _remove(files: Iterable[Path]):
    """Delete every path yielded by ``files``.

    Args:
        files: Iterable of path objects exposing ``unlink()``, such as the
            result of ``Path.glob``.
    """
    for f in files:
        f.unlink()


################################# Install ##################################


def _post_install(install_lib_dir):
    """Run the extra build steps that follow the Python-level install.

    Deletes the ``*.done`` files under ``tools/``, runs ``make`` there, and
    then runs ``bash -e setup.sh`` inside ``third_party/ctc_decoders``.

    Args:
        install_lib_dir: Passed in by the caller but currently unused.
    """
    tools_root = HERE / "tools"
    _remove(tools_root.glob("*.done"))

    # (working directory, command, message printed once the step is done)
    build_steps = (
        (tools_root, "make", "tools install."),
        (HERE / 'third_party/ctc_decoders', "bash -e setup.sh",
         "ctcdecoder install."),
    )
    for workdir, command, done_msg in build_steps:
        with pushd(workdir):
            check_call(command)
        print(done_msg)


class DevelopCommand(develop):
    """``develop`` command that also runs the post-install build steps."""

    def run(self):
        """Run the stock develop step, then execute ``_post_install``."""
        super().run()
        # The hook has to come after the base run(); otherwise packages
        # installed by the shell scripts will not be visible.
        hook_args = (self.install_lib, )
        self.execute(_post_install, hook_args, msg="Post Install...")


class InstallCommand(install):
    """``install`` command; currently a plain pass-through to the base class."""

    def run(self):
        """Delegate to the standard install implementation."""
        super().run()


class TestCommand(test):
    """``test`` command that hands the run over to nose."""

    def finalize_options(self):
        """Finalize base options, then clear the test args and set the suite flag."""
        super().finalize_options()
        self.test_args = []
        self.test_suite = True

    def run_tests(self):
        """Invoke nose against the ``tests`` directory and exit with its status."""
        # Imported lazily so nose is only needed when tests are actually run.
        import nose

        # argv mimics a direct ``nosetests -w tests`` invocation.
        nose_argv = ['nosetests', '-w', 'tests']
        nose.run_exit(argv=nose_argv)


# cmd: python setup.py upload
class UploadCommand(Command):
    """Custom ``upload`` command: rebuild the sdist and publish it with twine."""

    description = "Build and publish the package."
    user_options = []

    def initialize_options(self):
        """No options to initialise."""
        pass

    def finalize_options(self):
        """No options to finalise."""
        pass

    def run(self):
        """Clean ``dist/``, build a source distribution, upload it, and exit.

        Raises:
            subprocess.CalledProcessError: If the sdist build or the twine
                upload exits with a non-zero status.
            SystemExit: Always raised at the end via ``sys.exit()``.
        """
        print("Removing previous dist/ ...")
        try:
            shutil.rmtree(str(HERE / "dist"))
        except OSError:
            # Best-effort cleanup, e.g. there may be no dist/ directory yet.
            pass

        # Run both steps from the project root so the dist/ directory that
        # was just cleaned is the one that gets rebuilt and uploaded.
        project_root = str(HERE)
        print("Building source distribution...")
        sp.check_call([sys.executable, "setup.py", "sdist"], cwd=project_root)
        print("Uploading package to PyPi...")
        sp.check_call(["twine", "upload", "dist/*"], cwd=project_root)
        sys.exit()


################################# Version ##################################
def write_version_py(filename='paddlespeech/__init__.py'):
    """Append ``__version__`` and ``__commit__`` assignments to ``filename``.

    Nothing is written when the importable ``paddlespeech`` package already
    exposes a ``__version__`` equal to ``VERSION``. The commit id is taken
    from ``git rev-parse HEAD``.

    Args:
        filename: File to append to, resolved against the current working
            directory.
    """
    import paddlespeech

    already_stamped = (hasattr(paddlespeech, "__version__") and
                       paddlespeech.__version__ == VERSION)
    if already_stamped:
        return

    with open(filename, "a") as target:
        version_stmt = f"\n__version__ = '{VERSION}'\n"
        print(version_stmt)
        target.write(version_stmt)

    # Local name on purpose: the module-level COMMITID is left untouched.
    commit_id = check_output("git rev-parse HEAD")
    with open(filename, 'a') as target:
        commit_stmt = f"\n__commit__ = '{commit_id}'\n"
        print(commit_stmt)
        target.write(commit_stmt)

    print(f"{inspect.currentframe().f_code.co_name} done")


def remove_version_py(filename='paddlespeech/__init__.py'):
    """Strip every line mentioning ``__version__`` or ``__commit__``.

    The file is read completely, then rewritten in place without the
    matching lines.

    Args:
        filename: File to clean, resolved against the current working
            directory.
    """
    markers = ("__version__", "__commit__")
    with open(filename, "r") as src:
        original_lines = src.readlines()

    kept_lines = [
        text for text in original_lines
        if not any(marker in text for marker in markers)
    ]
    with open(filename, "w") as dst:
        dst.writelines(kept_lines)
    print(f"{inspect.currentframe().f_code.co_name} done")


@contextlib.contextmanager
def version_info():
    """Stamp version info into the package for the duration of the block.

    Calls ``write_version_py()`` on entry and ``remove_version_py()`` on
    exit. The removal runs even when the body raises (including
    ``SystemExit``), so the package file is not left modified after a
    failed or aborted run.
    """
    write_version_py()
    try:
        yield
    finally:
        remove_version_py()


################################# Setup ##################################
# Keyword arguments for setuptools.setup(), kept in a dict so the metadata is
# assembled before the version-stamping context is entered below.
setup_info = dict(
    # Metadata
    name='paddlespeech',
    version=VERSION,
    author='PaddlePaddle Speech and Language Team',
    author_email='paddlesl@baidu.com',
    url='https://github.com/PaddlePaddle/PaddleSpeech',
    license='Apache 2.0',
    description='Speech tools and models based on Paddlepaddle',
    long_description=read("README.md"),
    long_description_content_type="text/markdown",
    keywords=[
        "speech",
        "asr",
        "tts",
        "speaker verification",
        "speech classification",
        "text frontend",
        "MFA",
        "paddlepaddle",
        "beam search",
        "ctcdecoder",
        "deepspeech2",
        "transformer",
        "conformer",
        "fastspeech",
        "vocoder",
        "pwgan",
        "gan",
    ],
    python_requires='>=3.7',
    install_requires=requirements["install"],
    extras_require={
        'develop':
        requirements["develop"],
        'doc': [
            "sphinx", "sphinx-rtd-theme", "numpydoc", "myst_parser",
            "recommonmark>=0.5.0", "sphinx-markdown-tables", "sphinx-autobuild"
        ],
        'test': ['nose', 'torchaudio==0.10.2'],
    },
    cmdclass={
        'develop': DevelopCommand,
        'install': InstallCommand,
        'upload': UploadCommand,
        'test': TestCommand,
    },

    # Package info
    # The trailing comma matters: ('paddlespeech*') is just a string, which
    # find_packages would iterate character by character, and the lone '*'
    # pattern would then match every package in the tree.
    packages=find_packages(include=('paddlespeech*', )),
    zip_safe=True,
    classifiers=[
        'Development Status :: 5 - Production/Stable',
        'Intended Audience :: Developers',
        'Intended Audience :: Science/Research',
        'Topic :: Scientific/Engineering :: Artificial Intelligence',
        'License :: OSI Approved :: Apache Software License',
        'Programming Language :: Python',
        'Programming Language :: Python :: 3',
        'Programming Language :: Python :: 3.7',
        'Programming Language :: Python :: 3.8',
        'Programming Language :: Python :: 3.9',
    ],
    entry_points={
        'console_scripts': [
            'paddlespeech=paddlespeech.cli.entry:_execute',
            'paddlespeech_server=paddlespeech.server.entry:server_execute',
            'paddlespeech_client=paddlespeech.server.entry:client_execute'
        ]
    })

# The version/commit lines are written into the package only while setup()
# runs; version_info() is responsible for removing them afterwards.
with version_info():
    setup(**setup_info, include_package_data=True)
merge parakeet repo into deepspeech 3 years ago			`# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.`
			`#`
			`# Licensed under the Apache License, Version 2.0 (the "License");`
			`# you may not use this file except in compliance with the License.`
			`# You may obtain a copy of the License at`
			`#`
			`# http://www.apache.org/licenses/LICENSE-2.0`
			`#`
			`# Unless required by applicable law or agreed to in writing, software`
			`# distributed under the License is distributed on an "AS IS" BASIS,`
			`# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`# See the License for the specific language governing permissions and`
			`# limitations under the License.`
recog into decoders, format code 3 years ago			`import contextlib`
			`import inspect`
merge parakeet repo into deepspeech 3 years ago			`import io`
			`import os`
recog into decoders, format code 3 years ago			`import subprocess as sp`
setup.py install cpp deps 3 years ago			`import sys`
tools make 3 years ago			`from pathlib import Path`
merge parakeet repo into deepspeech 3 years ago
recog into decoders, format code 3 years ago			`from setuptools import Command`
merge parakeet repo into deepspeech 3 years ago			`from setuptools import find_packages`
			`from setuptools import setup`
setup with ubuntu deps 3 years ago			`from setuptools.command.develop import develop`
			`from setuptools.command.install import install`
Refactor paddleaudio to paddlespeech.audio 2 years ago			`from setuptools.command.test import test`
setup with ubuntu deps 3 years ago
tools make 3 years ago			`HERE = Path(os.path.abspath(os.path.dirname(__file__)))`
merge parakeet repo into deepspeech 3 years ago
dev using 0.0.0 as version 3 years ago			`VERSION = '0.0.0'`
add commmit to version info 3 years ago			`COMMITID = 'none'`
refactor the version 3 years ago
format, test=doct 3 years ago			`base = [`
fix version of pyworld 2 years ago			`"editdistance",`
			`"g2p_en",`
			`"g2pM",`
			`"h5py",`
			`"inflect",`
			`"jieba",`
			`"jsonlines",`
			`"kaldiio",`
			`"librosa==0.8.1",`
			`"loguru",`
			`"matplotlib",`
			`"nara_wpe",`
onnxruntime doesn't support gpu for mac 2 years ago			`"onnxruntime==1.10.0",`
Add g2pW to Chinese frontend 2 years ago			`"opencc",`
fix version of pyworld 2 years ago			`"pandas",`
			`"paddlenlp",`
			`"paddlespeech_feat",`
Update setup.py 2 years ago			`"Pillow>=9.0.0",`
fix version of pyworld 2 years ago			`"praatio==5.0.0",`
fix protobuf version 2 years ago			`"protobuf>=3.1.0, <=3.20.0",`
Added pre-install doc for G2P and TN modules and updated the dependency version of pypinyin second, test=doc 2 years ago			`"pypinyin<=0.44.0",`
fix version of pyworld 2 years ago			`"pypinyin-dict",`
			`"python-dateutil",`
			`"pyworld==0.2.12",`
			`"resampy==0.2.2",`
			`"sacrebleu",`
			`"scipy",`
			`"sentencepiece~=0.1.96",`
			`"soundfile~=0.10",`
			`"textgrid",`
			`"timer",`
			`"tqdm",`
			`"typeguard",`
			`"visualdl",`
			`"webrtcvad",`
			`"yacs~=0.1.8",`
			`"prettytable",`
			`"zhon",`
			`"colorlog",`
Merge branch 'develop' into webdataset 2 years ago			`"pathos == 0.2.8",`
			`"braceexpand",`
refactor attention cache 2 years ago			`"pyyaml",`
			`"pybind11",`
format, test=doct 3 years ago			`]`

format paddlespeech with pre-commit (#2331) 2 years ago			`server = ["fastapi", "uvicorn", "pattern_singleton", "websockets"]`
refactor the version 3 years ago
optimize the setup.py and setup.sh 3 years ago			`requirements = {`
format, test=doct 3 years ago			`"install":`
			`base + server,`
optimize the setup.py and setup.sh 3 years ago			`"develop": [`
			`"ConfigArgParse",`
			`"coverage",`
			`"gpustat",`
Separate the ctcdecoders 3 years ago			`"paddlespeech_ctcdecoders",`
optimize the setup.py and setup.sh 3 years ago			`"phkit",`
move pypi-kenlm from install requirements to develop requirements 3 years ago			`"pypi-kenlm",`
optimize the setup.py and setup.sh 3 years ago			`"snakeviz",`
separate the sox and soxbindings with the requirements 3 years ago			`"sox",`
			`"soxbindings",`
optimize the setup.py and setup.sh 3 years ago			`"unidecode",`
			`"yq",`
			`"pre-commit",`
			`]`
			`}`

using setup.py to install pkgs by shell script 3 years ago
add commmit to version info 3 years ago			`def check_call(cmd: str, shell=False, executable=None):`
			`try:`
			`sp.check_call(`
			`cmd.split(),`
			`shell=shell,`
			`executable="/bin/bash" if shell else executable)`
			`except sp.CalledProcessError as e:`
			`print(`
			`f"{__file__}:{inspect.currentframe().f_lineno}: CMD: {cmd}, Error:",`
			`e.output,`
			`file=sys.stderr)`
			`raise e`
Merge branch 'develop' of https://github.com/PaddlePaddle/DeepSpeech into Setup 3 years ago
format 3 years ago
add commmit to version info 3 years ago			`def check_output(cmd: str, shell=False):`
			`try:`
			`out_bytes = sp.check_output(cmd.split())`
			`except sp.CalledProcessError as e:`
format 3 years ago			`out_bytes = e.output # Output generated before error`
			`code = e.returncode # Return code`
add commmit to version info 3 years ago			`print(`
			`f"{__file__}:{inspect.currentframe().f_lineno}: CMD: {cmd}, Error:",`
			`out_bytes,`
			`file=sys.stderr)`
			`return out_bytes.strip().decode('utf8')`
add remove_version_py 3 years ago
refactor the version 3 years ago
tools make 3 years ago			`@contextlib.contextmanager`
			`def pushd(new_dir):`
			`old_dir = os.getcwd()`
			`os.chdir(new_dir)`
using setup.py to install pkgs by shell script 3 years ago			`print(new_dir)`
setup.py install cpp deps 3 years ago			`yield`
			`os.chdir(old_dir)`
using setup.py to install pkgs by shell script 3 years ago			`print(old_dir)`
tools make 3 years ago

fix not found pushd 3 years ago			`def read(names, *kwargs):`
recog into decoders, format code 3 years ago			`with io.open(`
			`os.path.join(os.path.dirname(__file__), *names),`
			`encoding=kwargs.get("encoding", "utf8")) as fp:`
fix not found pushd 3 years ago			`return fp.read()`


using setup.py to install pkgs by shell script 3 years ago			`def _remove(files: str):`
			`for f in files:`
			`f.unlink()`

format 3 years ago
add commmit to version info 3 years ago			`################################# Install ##################################`

using setup.py to install pkgs by shell script 3 years ago
			`def _post_install(install_lib_dir):`
tools make 3 years ago			`# tools/make`
			`tool_dir = HERE / "tools"`
using setup.py to install pkgs by shell script 3 years ago			`_remove(tool_dir.glob("*.done"))`
tools make 3 years ago			`with pushd(tool_dir):`
fix not found pushd 3 years ago			`check_call("make")`
setup.py install cpp deps 3 years ago			`print("tools install.")`
setup with ubuntu deps 3 years ago
tools make 3 years ago			`# ctcdecoder`
mv the ctcdecoders to third_part (#1313) 3 years ago			`ctcdecoder_dir = HERE / 'third_party/ctc_decoders'`
setup.py install cpp deps 3 years ago			`with pushd(ctcdecoder_dir):`
			`check_call("bash -e setup.sh")`
			`print("ctcdecoder install.")`

fix install 3 years ago
setup with ubuntu deps 3 years ago			`class DevelopCommand(develop):`
			`def run(self):`
			`develop.run(self)`
using setup.py to install pkgs by shell script 3 years ago			`# must after develop.run, or pkg install by shell will not see`
setup with ubuntu deps 3 years ago			`self.execute(_post_install, (self.install_lib, ), msg="Post Install...")`


			`class InstallCommand(install):`
			`def run(self):`
			`install.run(self)`


Refactor paddleaudio to paddlespeech.audio 2 years ago			`class TestCommand(test):`
			`def finalize_options(self):`
			`test.finalize_options(self)`
			`self.test_args = []`
			`self.test_suite = True`

			`def run_tests(self):`
			`# Run nose ensuring that argv simulates running nosetests directly`
			`import nose`
			`nose.run_exit(argv=['nosetests', '-w', 'tests'])`


			`# cmd: python setup.py upload`
setup with ubuntu deps 3 years ago			`class UploadCommand(Command):`
			`description = "Build and publish the package."`
			`user_options = []`

			`def initialize_options(self):`
			`pass`

			`def finalize_options(self):`
			`pass`

			`def run(self):`
			`try:`
			`print("Removing previous dist/ ...")`
tools make 3 years ago			`shutil.rmtree(str(HERE / "dist"))`
setup with ubuntu deps 3 years ago			`except OSError:`
			`pass`
			`print("Building source distribution...")`
			`sp.check_call([sys.executable, "setup.py", "sdist"])`
			`print("Uploading package to PyPi...")`
			`sp.check_call(["twine", "upload", "dist/*"])`
			`sys.exit()`


add commmit to version info 3 years ago			`################################# Version ##################################`
			`def write_version_py(filename='paddlespeech/__init__.py'):`
			`import paddlespeech`
			`if hasattr(paddlespeech,`
			`"__version__") and paddlespeech.__version__ == VERSION:`
			`return`
			`with open(filename, "a") as f:`
			`out_str = f"\n__version__ = '{VERSION}'\n"`
			`print(out_str)`
			`f.write(f"\n__version__ = '{VERSION}'\n")`

			`COMMITID = check_output("git rev-parse HEAD")`
			`with open(filename, 'a') as f:`
			`out_str = f"\n__commit__ = '{COMMITID}'\n"`
			`print(out_str)`
			`f.write(f"\n__commit__ = '{COMMITID}'\n")`

			`print(f"{inspect.currentframe().f_code.co_name} done")`


			`def remove_version_py(filename='paddlespeech/__init__.py'):`
			`with open(filename, "r") as f:`
			`lines = f.readlines()`
			`with open(filename, "w") as f:`
			`for line in lines:`
			`if "__version__" in line or "__commit__" in line:`
			`continue`
			`f.write(line)`
			`print(f"{inspect.currentframe().f_code.co_name} done")`


			`@contextlib.contextmanager`
			`def version_info():`
			`write_version_py()`
			`yield`
			`remove_version_py()`

refactor the version 3 years ago
add commmit to version info 3 years ago			`################################# Steup ##################################`
merge parakeet repo into deepspeech 3 years ago			`setup_info = dict(`
			`# Metadata`
fix setup 3 years ago			`name='paddlespeech',`
refacto the code 3 years ago			`version=VERSION,`
Update the setup.py for paddlespeech (#1009) 3 years ago			`author='PaddlePaddle Speech and Language Team',`
			`author_email='paddlesl@baidu.com',`
			`url='https://github.com/PaddlePaddle/PaddleSpeech',`
			`license='Apache 2.0',`
setup.py deps from requirements.txt 3 years ago			`description='Speech tools and models based on Paddlepaddle',`
fix not found pushd 3 years ago			`long_description=read("README.md"),`
merge parakeet repo into deepspeech 3 years ago			`long_description_content_type="text/markdown",`
setup with ubuntu deps 3 years ago			`keywords=[`
			`"speech",`
			`"asr",`
			`"tts",`
remve .travis; fix install doc; more kws in setup.py 3 years ago			`"speaker verfication",`
			`"speech classfication",`
setup with ubuntu deps 3 years ago			`"text frontend",`
			`"MFA",`
			`"paddlepaddle",`
remve .travis; fix install doc; more kws in setup.py 3 years ago			`"beam search",`
			`"ctcdecoder",`
			`"deepspeech2",`
setup with ubuntu deps 3 years ago			`"transformer",`
			`"conformer",`
			`"fastspeech",`
			`"vocoder",`
			`"pwgan",`
			`"gan",`
			`],`
change the require py version 3 years ago			`python_requires='>=3.7',`
optimize the setup.py and setup.sh 3 years ago			`install_requires=requirements["install"],`
merge parakeet repo into deepspeech 3 years ago			`extras_require={`
optimize the setup.py and setup.sh 3 years ago			`'develop':`
			`requirements["develop"],`
setup.py deps from requirements.txt 3 years ago			`'doc': [`
			`"sphinx", "sphinx-rtd-theme", "numpydoc", "myst_parser",`
			`"recommonmark>=0.5.0", "sphinx-markdown-tables", "sphinx-autobuild"`
			`],`
Refactor paddleaudio to paddlespeech.audio 2 years ago			`'test': ['nose', 'torchaudio==0.10.2'],`
merge parakeet repo into deepspeech 3 years ago			`},`
setup with ubuntu deps 3 years ago			`cmdclass={`
			`'develop': DevelopCommand,`
			`'install': InstallCommand,`
			`'upload': UploadCommand,`
Refactor paddleaudio to paddlespeech.audio 2 years ago			`'test': TestCommand,`
setup with ubuntu deps 3 years ago			`},`
merge parakeet repo into deepspeech 3 years ago
			`# Package info`
fix the setup.py (#1076) 3 years ago			`packages=find_packages(include=('paddlespeech*')),`
merge parakeet repo into deepspeech 3 years ago			`zip_safe=True,`
			`classifiers=[`
change the paddlespeech version (#1163) 3 years ago			`'Development Status :: 5 - Production/Stable',`
merge parakeet repo into deepspeech 3 years ago			`'Intended Audience :: Developers',`
			`'Intended Audience :: Science/Research',`
			`'Topic :: Scientific/Engineering :: Artificial Intelligence',`
			`'License :: OSI Approved :: Apache Software License',`
setup with ubuntu deps 3 years ago			`'Programming Language :: Python',`
			`'Programming Language :: Python :: 3',`
merge parakeet repo into deepspeech 3 years ago			`'Programming Language :: Python :: 3.7',`
setup.py deps from requirements.txt 3 years ago			`'Programming Language :: Python :: 3.8',`
Update the setup.py for paddlespeech (#1009) 3 years ago			`'Programming Language :: Python :: 3.9',`
Add paddlespeech.cli. 3 years ago			`],`
			`entry_points={`
add cli, test=doc 3 years ago			`'console_scripts': [`
			`'paddlespeech=paddlespeech.cli.entry:_execute',`
improve cli code, test=doc 3 years ago			`'paddlespeech_server=paddlespeech.server.entry:server_execute',`
			`'paddlespeech_client=paddlespeech.server.entry:client_execute'`
add cli, test=doc 3 years ago			`]`
Add paddlespeech.cli. 3 years ago			`})`
merge parakeet repo into deepspeech 3 years ago
add commmit to version info 3 years ago			`with version_info():`
format paddlespeech with pre-commit (#2331) 2 years ago			`setup(**setup_info, include_package_data=True)`