|
|
|
|
#!usr/bin/env python
|
|
|
|
|
# -*- coding: utf-8 -*-
|
|
|
|
|
# author: kuangdd
|
|
|
|
|
# date: 2019/12/1
|
|
|
|
|
"""
|
|
|
|
|
local
|
|
|
|
|
"""
|
|
|
|
|
import logging
|
|
|
|
|
|
|
|
|
|
logging.basicConfig(level=logging.INFO)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def run_text2phoneme():
|
|
|
|
|
from phkit.chinese.sequence import text2phoneme, text2sequence
|
|
|
|
|
text = "汉字转音素,TTS:《Text to speech》。"
|
|
|
|
|
# text = "岂有此理"
|
|
|
|
|
# text = "我的儿子玩会儿"
|
|
|
|
|
out = text2phoneme(text)
|
|
|
|
|
print(out)
|
|
|
|
|
# ['h', 'an', '4', '-', 'z', 'iy', '4', '-', 'zh', 'uan', '3', '-', 'ii', 'in', '1', '-', 's', 'u', '4', '-', ',',
|
|
|
|
|
# 'Tt', 'Tt', 'Ss', ':', '(', 'T', 'E', 'X', 'T', '#', 'T', 'O', '#', 'S', 'P', 'E', 'E', 'C', 'H', ')', '.', '-',
|
|
|
|
|
# '~', '_']
|
|
|
|
|
out = text2sequence(text)
|
|
|
|
|
print(out)
|
|
|
|
|
# [11, 32, 76, 2, 28, 51, 76, 2, 29, 59, 75, 2, 12, 46, 73, 2, 22, 56, 76, 2, 133, 97, 97, 96, 135, 138, 123, 108,
|
|
|
|
|
# 127, 123, 137, 123, 118, 137, 122, 119, 108, 108, 106, 111, 139, 132, 2, 1, 0]
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def run_english():
|
|
|
|
|
from phkit.english import text_to_sequence, sequence_to_text
|
|
|
|
|
from phkit.english.cmudict import CMUDict
|
|
|
|
|
text = "text to speech"
|
|
|
|
|
cmupath = 'phkit/english/cmu_dictionary'
|
|
|
|
|
cmudict = CMUDict(cmupath)
|
|
|
|
|
seq = text_to_sequence(text, cleaner_names=["english_cleaners"], dictionary=cmudict)
|
|
|
|
|
print(seq)
|
|
|
|
|
txt = sequence_to_text(seq)
|
|
|
|
|
print(txt)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
if __name__ == "__main__":
|
|
|
|
|
print(__file__)
|
|
|
|
|
run_text2phoneme()
|
|
|
|
|
run_english()
|