PaddleSpeech/third_party/phkit/run_local.py

#!/usr/bin/env python
# -*- coding: utf-8 -*-
# author: kuangdd
# date: 2019/12/1
"""
local
"""
import logging

# Configure the root logger at import time so messages at INFO level and above are emitted.
logging.basicConfig(level=logging.INFO)


def run_text2phoneme():
    """Demo of the Chinese front-end: print phonemes, then the ID sequence.

    The same mixed Chinese/English sentence is passed first to
    ``text2phoneme`` and then to ``text2sequence``; each result is printed.
    """
    from phkit.chinese.sequence import text2phoneme, text2sequence

    # Other inputs that were tried in this script: "岂有此理", "我的儿子玩会儿"
    sample = "汉字转音素，TTS：《Text to speech》。"

    # Run both converters in order on the same input and show each result.
    for convert in (text2phoneme, text2sequence):
        print(convert(sample))

    # Sample output recorded for text2phoneme:
    # ['h', 'an', '4', '-', 'z', 'iy', '4', '-', 'zh', 'uan', '3', '-', 'ii', 'in', '1', '-', 's', 'u', '4', '-', ',',
    # 'Tt', 'Tt', 'Ss', ':', '(', 'T', 'E', 'X', 'T', '#', 'T', 'O', '#', 'S', 'P', 'E', 'E', 'C', 'H', ')', '.', '-',
    #  '~', '_']
    #
    # Sample output recorded for text2sequence:
    # [11, 32, 76, 2, 28, 51, 76, 2, 29, 59, 75, 2, 12, 46, 73, 2, 22, 56, 76, 2, 133, 97, 97, 96, 135, 138, 123, 108,
    # 127, 123, 137, 123, 118, 137, 122, 119, 108, 108, 106, 111, 139, 132, 2, 1, 0]


def run_english():
    """Demo of the English front-end: encode a phrase, then decode it back.

    Builds a ``CMUDict`` from ``phkit/english/cmu_dictionary``, prints the
    sequence returned by ``text_to_sequence`` for "text to speech", and then
    prints the text that ``sequence_to_text`` recovers from that sequence.

    NOTE(review): the dictionary path is relative, so it presumably has to be
    resolvable from the current working directory -- confirm against CMUDict.
    """
    from phkit.english import sequence_to_text, text_to_sequence
    from phkit.english.cmudict import CMUDict

    pronouncing_dict = CMUDict('phkit/english/cmu_dictionary')
    encoded = text_to_sequence(
        "text to speech",
        cleaner_names=["english_cleaners"],
        dictionary=pronouncing_dict,
    )
    print(encoded)

    # Round-trip: turn the encoded sequence back into text.
    print(sequence_to_text(encoded))


if __name__ == "__main__":
    # Echo the script path, then run the Chinese demo followed by the English demo.
    print(__file__)
    for demo in (run_text2phoneme, run_english):
        demo()