# RedditVideoMakerBot/video_creation/TTSwrapper.py

import base64
import os
import random
import re
from urllib.parse import quote

import requests
import sox
from moviepy.audio.AudioClip import concatenate_audioclips, CompositeAudioClip
from moviepy.audio.io.AudioFileClip import AudioFileClip
from requests.adapters import HTTPAdapter, Retry

# from profanity_filter import ProfanityFilter
# pf = ProfanityFilter()
# Code by @JasonLovesDoggo
# https://twitter.com/scanlime/status/1512598559769702406

# Character / novelty voices (this group was labelled "DISNEY VOICES").
nonhuman = [
    "en_us_ghostface",  # Ghost Face
    "en_us_chewbacca",  # Chewbacca
    "en_us_c3po",  # C3PO
    "en_us_stitch",  # Stitch
    "en_us_stormtrooper",  # Stormtrooper
    "en_us_rocket",  # Rocket
]

# English voices that sound like ordinary human speakers.
human = [
    "en_au_001",  # English AU - Female
    "en_au_002",  # English AU - Male
    "en_uk_001",  # English UK - Male 1
    "en_uk_003",  # English UK - Male 2
    "en_us_001",  # English US - Female (Int. 1)
    "en_us_002",  # English US - Female (Int. 2)
    "en_us_006",  # English US - Male 1
    "en_us_007",  # English US - Male 2
    "en_us_009",  # English US - Male 3
    "en_us_010",  # NOTE(review): unlabelled here; presumably another English US voice - confirm
]

# Every English voice: the character voices followed by the human ones.
voices = [*nonhuman, *human]

# Voices for languages other than English.
noneng = [
    "fr_001",  # French - Male 1
    "fr_002",  # French - Male 2
    "de_001",  # German - Female
    "de_002",  # German - Male
    "es_002",  # Spanish - Male
    # AMERICA VOICES
    "es_mx_002",  # Spanish MX - Male
    "br_001",  # Portuguese BR - Female 1
    "br_003",  # Portuguese BR - Female 2
    "br_004",  # Portuguese BR - Female 3
    "br_005",  # Portuguese BR - Male
    # ASIA VOICES
    "id_001",  # Indonesian - Female
    "jp_001",  # Japanese - Female 1
    "jp_003",  # Japanese - Female 2
    "jp_005",  # Japanese - Female 3
    "jp_006",  # Japanese - Male
    "kr_002",  # Korean - Male 1
    "kr_003",  # Korean - Female
    "kr_004",  # Korean - Male 2
]


# good_voices = {'good': ['en_us_002', 'en_us_006'],
#               'ok': ['en_au_002', 'en_uk_001']}  # less en_us_stormtrooper more less en_us_rocket en_us_ghostface


class TTTTSWrapper:  # TikTok Text-to-Speech Wrapper
    """Client for the TikTok text-to-speech HTTP endpoint.

    Text is split into chunks, each chunk is synthesised with one request,
    and the resulting MP3 fragments are concatenated into a single file.
    """

    # Largest chunk (in characters) sent in a single request.
    MAX_CHUNK_LENGTH = 300

    def __init__(self):
        self.URI_BASE = "https://api16-normal-useast5.us.tiktokv.com/media/api/text/speech/invoke/?text_speaker="

    def tts(
            self,
            req_text: str = "TikTok Text To Speech",
            filename: str = "title.mp3",
            random_speaker: bool = False,
            censer=False,
    ):
        """Synthesise ``req_text`` and write the audio to ``filename``.

        Args:
            req_text: Text to speak. "+" is spoken as "plus" and "&" as "and".
            filename: Output path. One intermediate file per chunk is written
                next to it, named ``<stem>-<index><ext>``.
            random_speaker: When true, pick the voice with ``randomvoice()``;
                otherwise use the ``VOICE`` environment variable, falling back
                to a random entry of ``human``.
            censer: Currently has no effect (the profanity filter call is
                commented out).

        Raises:
            ValueError: If ``req_text`` contains nothing to speak.
        """
        # "." in the chunking pattern does not match a line break, so fold line
        # breaks into spaces; otherwise the text in front of them is dropped.
        req_text = re.sub(r"[\r\n]+", " ", req_text)
        req_text = req_text.replace("+", "plus").replace(" ", "+").replace("&", "and")
        if censer:
            # req_text = pf.censor(req_text)
            pass
        voice = (
            self.randomvoice()
            if random_speaker
            else (os.getenv("VOICE") or random.choice(human))
        )

        chunks = self._split_text(req_text, self.MAX_CHUNK_LENGTH)
        if not chunks:
            # Fail before any request is made instead of with an IndexError
            # on the empty clip list further down.
            raise ValueError("req_text contains no text to synthesise")

        stem, ext = os.path.splitext(filename)
        audio_clips = []
        for chunk_id, chunk in enumerate(chunks):
            response = self._request_speech(voice, chunk)
            audio = base64.b64decode(response.json()["data"]["v_str"])

            chunk_path = f"{stem}-{chunk_id}{ext}"
            with open(chunk_path, "wb") as out:
                out.write(audio)
            audio_clips.append(chunk_path)

        try:
            if len(audio_clips) > 1:
                cbn = sox.Combiner()
                cbn.set_input_format(file_type=["mp3"] * len(audio_clips))
                cbn.convert(samplerate=44100, n_channels=2)
                cbn.build(audio_clips, filename, "concatenate")
            else:
                # os.replace overwrites an existing target on every platform.
                os.replace(audio_clips[0], filename)

        except sox.core.SoxError:  # https://github.com/JasonLovesDoggo/RedditVideoMakerBot/issues/67#issuecomment-1150466339
            # Fall back to moviepy when sox cannot combine the fragments.
            clips = []
            try:
                for path in audio_clips:
                    clips.append(AudioFileClip(path))
                audio_concat = concatenate_audioclips(clips)
                audio_composite = CompositeAudioClip([audio_concat])
                audio_composite.write_audiofile(filename, 44100, 2, 2000, None)
            finally:
                # Release the readers opened for the fragments.
                for clip in clips:
                    clip.close()

    def _request_speech(self, voice, chunk):
        """POST one chunk to the endpoint and return the response.

        On an SSL error the request is repeated once through a session whose
        adapter retries failed connections.
        """
        # Percent-encode everything except "+" (which stands for a space) so
        # characters such as "#" or "?" cannot truncate or corrupt the query.
        encoded = quote(chunk, safe="+")
        url = f"{self.URI_BASE}{voice}&req_text={encoded}&speaker_map_type=0"
        try:
            return requests.post(url)
        except requests.exceptions.SSLError:
            # https://stackoverflow.com/a/47475019/18516611
            with requests.Session() as session:
                adapter = HTTPAdapter(max_retries=Retry(connect=3, backoff_factor=0.5))
                session.mount("http://", adapter)
                session.mount("https://", adapter)
                return session.post(url)

    @staticmethod
    def _split_text(text: str, limit: int = 300) -> list:
        """Split ``text`` into chunks of at most ``limit`` characters.

        Each chunk is the longest run that ends with a period or at the end
        of the text. When no such run fits, the chunk ends after the last "+"
        (the encoded space) within the limit, and as a last resort it is cut
        at exactly ``limit`` characters, so no text is skipped. Chunks that
        are empty after stripping whitespace are omitted.

        Raises:
            ValueError: If ``limit`` is smaller than 1.
        """
        if limit < 1:
            raise ValueError("limit must be at least 1")
        head = limit - 1
        pattern = (
            rf" *(?:.{{0,{head}}}(?:\.|.$)"  # sentence end or end of text
            rf"|.{{0,{head}}}\+"  # otherwise break after a word separator
            rf"|.{{1,{limit}}})"  # otherwise hard cut
        )
        pieces = (m.group().strip() for m in re.finditer(pattern, text))
        return [piece for piece in pieces if piece]

    @staticmethod
    def randomvoice():
        """Return a random voice id, favouring the ``human`` voices.

        One call in ten draws from ``voices`` (character and human voices);
        the rest draw from ``human`` only.
        """
        # randrange(10) yields 0..9, so this branch is taken 1 time in 10.
        if random.randrange(10) == 0:
            return random.choice(voices)
        return random.choice(human)
adds voice config closes #28 3 years ago			`import base64`
			`import os`
			`import random`
fix: improved TTS requests fixes #64 3 years ago			`import re`

adds voice config closes #28 3 years ago			`import requests`
chore: reformatted docs: added better comment documentation 3 years ago			`import sox`
fix: i think 3 years ago			`from moviepy.audio.AudioClip import concatenate_audioclips, CompositeAudioClip`
fix: fixes #66 3 years ago			`from moviepy.audio.io.AudioFileClip import AudioFileClip`
fix: improved TTS requests fixes #64 3 years ago			`from requests.adapters import HTTPAdapter, Retry`
fixed #60 and reformatted project with the black formatter 3 years ago
			`# from profanity_filter import ProfanityFilter`
			`# pf = ProfanityFilter()`
tried to implement smth 3 years ago			`# Code by @JasonLovesDoggo`
I hope i don't get a virus 3 years ago			`# https://twitter.com/scanlime/status/1512598559769702406`
fix: fixed audio error fix: mp3 error fixes #76 fixes #71 3 years ago
adds voice config closes #28 3 years ago			`nonhuman = [ # DISNEY VOICES`
fixed #60 and reformatted project with the black formatter 3 years ago			`"en_us_ghostface", # Ghost Face`
			`"en_us_chewbacca", # Chewbacca`
			`"en_us_c3po", # C3PO`
			`"en_us_stitch", # Stitch`
			`"en_us_stormtrooper", # Stormtrooper`
			`"en_us_rocket", # Rocket`
I hope i don't get a virus 3 years ago			`# ENGLISH VOICES`
adds voice config closes #28 3 years ago			`]`
fixed #60 and reformatted project with the black formatter 3 years ago			`human = [`
			`"en_au_001", # English AU - Female`
			`"en_au_002", # English AU - Male`
			`"en_uk_001", # English UK - Male 1`
			`"en_uk_003", # English UK - Male 2`
			`"en_us_001", # English US - Female (Int. 1)`
			`"en_us_002", # English US - Female (Int. 2)`
			`"en_us_006", # English US - Male 1`
			`"en_us_007", # English US - Male 2`
			`"en_us_009", # English US - Male 3`
			`"en_us_010",`
			`]`
adds voice config closes #28 3 years ago			`voices = nonhuman + human`

			`noneng = [`
fixed #60 and reformatted project with the black formatter 3 years ago			`"fr_001", # French - Male 1`
			`"fr_002", # French - Male 2`
			`"de_001", # German - Female`
			`"de_002", # German - Male`
			`"es_002", # Spanish - Male`
I hope i don't get a virus 3 years ago			`# AMERICA VOICES`
fixed #60 and reformatted project with the black formatter 3 years ago			`"es_mx_002", # Spanish MX - Male`
			`"br_001", # Portuguese BR - Female 1`
			`"br_003", # Portuguese BR - Female 2`
			`"br_004", # Portuguese BR - Female 3`
			`"br_005", # Portuguese BR - Male`
I hope i don't get a virus 3 years ago			`# ASIA VOICES`
fixed #60 and reformatted project with the black formatter 3 years ago			`"id_001", # Indonesian - Female`
			`"jp_001", # Japanese - Female 1`
			`"jp_003", # Japanese - Female 2`
			`"jp_005", # Japanese - Female 3`
			`"jp_006", # Japanese - Male`
			`"kr_002", # Korean - Male 1`
			`"kr_003", # Korean - Female`
			`"kr_004", # Korean - Male 2`
I hope i don't get a virus 3 years ago			`]`
adds voice config closes #28 3 years ago

			`# good_voices = {'good': ['en_us_002', 'en_us_006'],`
			`# 'ok': ['en_au_002', 'en_uk_001']} # less en_us_stormtrooper more less en_us_rocket en_us_ghostface`
I hope i don't get a virus 3 years ago

			`class TTTTSWrapper: # TikTok Text-to-Speech Wrapper`
			`def __init__(self):`
fixed #60 and reformatted project with the black formatter 3 years ago			`self.URI_BASE = "https://api16-normal-useast5.us.tiktokv.com/media/api/text/speech/invoke/?text_speaker="`

			`def tts(`
fix: fixed audio error fix: mp3 error fixes #76 fixes #71 3 years ago			`self,`
			`req_text: str = "TikTok Text To Speech",`
			`filename: str = "title.mp3",`
			`random_speaker: bool = False,`
			`censer=False,`
fixed #60 and reformatted project with the black formatter 3 years ago			`):`
Error fix Moved the character limit checker cause it was being buggy and making it so some longer comments went thru but not others and it looks like that's fixed now also deleted another character limit check cause it wasn't needed anymore. and for some reason the text replace thingy was in an if statement even tho I don't think it should have been in there. 3 years ago			`req_text = req_text.replace("+", "plus").replace(" ", "+").replace("&", "and")`
tried to implement smth 3 years ago			`if censer:`
fixed #60 and reformatted project with the black formatter 3 years ago			`# req_text = pf.censor(req_text)`
tried to implement smth 3 years ago			`pass`
fixed #60 and reformatted project with the black formatter 3 years ago			`voice = (`
			`self.randomvoice()`
			`if random_speaker`
			`else (os.getenv("VOICE") or random.choice(human))`
			`)`
I hope i don't get a virus 3 years ago
fixed #60 and reformatted project with the black formatter 3 years ago			`chunks = [`
fix: fixed audio error fix: mp3 error fixes #76 fixes #71 3 years ago			`m.group().strip() for m in re.finditer(r" *((.{0,299})(\.\|.$))", req_text)`
fixed #60 and reformatted project with the black formatter 3 years ago			`]`
Unlimited comment length I added unlimited comment length by splitting the tts is parts in a way that doesn't make it sound weird. It works great for me but if someone experiences and issues just contact me. 3 years ago
			`audio_clips = []`
Changed to tts chunk combiner to sox This helps performance and improves audio quality as movie.py adds a lot of audio glitches also there where a few small mistakes in the old version that I fixed and seem to work. 3 years ago			`cbn = sox.Combiner()`
fix: fixed audio error fix: mp3 error fixes #76 fixes #71 3 years ago			`cbn.set_input_format(file_type=["mp3" for _ in chunks])`
Unlimited comment length I added unlimited comment length by splitting the tts is parts in a way that doesn't make it sound weird. It works great for me but if someone experiences and issues just contact me. 3 years ago
			`chunkId = 0`
			`for chunk in chunks:`
fix: improved TTS requests fixes #64 3 years ago			`try:`
			`r = requests.post(`
			`f"{self.URI_BASE}{voice}&req_text={chunk}&speaker_map_type=0"`
			`)`
			`except requests.exceptions.SSLError:`
			`# https://stackoverflow.com/a/47475019/18516611`
			`session = requests.Session()`
			`retry = Retry(connect=3, backoff_factor=0.5)`
			`adapter = HTTPAdapter(max_retries=retry)`
reformatted 3 years ago			`session.mount("http://", adapter)`
			`session.mount("https://", adapter)`
			`r = session.post(`
			`f"{self.URI_BASE}{voice}&req_text={chunk}&speaker_map_type=0"`
			`)`
Unlimited comment length I added unlimited comment length by splitting the tts is parts in a way that doesn't make it sound weird. It works great for me but if someone experiences and issues just contact me. 3 years ago			`vstr = [r.json()["data"]["v_str"]][0]`
			`b64d = base64.b64decode(vstr)`

Changed to tts chunk combiner to sox This helps performance and improves audio quality as movie.py adds a lot of audio glitches also there where a few small mistakes in the old version that I fixed and seem to work. 3 years ago			`with open(filename.replace(".mp3", f"-{chunkId}.mp3"), "wb") as out:`
Unlimited comment length I added unlimited comment length by splitting the tts is parts in a way that doesn't make it sound weird. It works great for me but if someone experiences and issues just contact me. 3 years ago			`out.write(b64d)`

Changed to tts chunk combiner to sox This helps performance and improves audio quality as movie.py adds a lot of audio glitches also there where a few small mistakes in the old version that I fixed and seem to work. 3 years ago			`audio_clips.append(filename.replace(".mp3", f"-{chunkId}.mp3"))`
I hope i don't get a virus 3 years ago
adds voice config closes #28 3 years ago			`chunkId = chunkId + 1`
fix: i think 3 years ago			`try:`
			`if len(audio_clips) > 1:`
			`cbn.convert(samplerate=44100, n_channels=2)`
			`cbn.build(audio_clips, filename, "concatenate")`
			`else:`
			`os.rename(audio_clips[0], filename)`
chore: reformatted docs: added better comment documentation 3 years ago
			`except sox.core.SoxError: # https://github.com/JasonLovesDoggo/RedditVideoMakerBot/issues/67#issuecomment-1150466339`
fix: fixes #66 3 years ago			`for clip in audio_clips:`
			`i = audio_clips.index(clip) # get the index of the clip`
chore: reformatted docs: added better comment documentation 3 years ago			`audio_clips = (`
fix: fixed audio error fix: mp3 error fixes #76 fixes #71 3 years ago			`audio_clips[:i] + [AudioFileClip(clip)] + audio_clips[i + 1:]`
chore: reformatted docs: added better comment documentation 3 years ago			`) # replace the clip with an AudioFileClip`
fix: i think 3 years ago			`audio_concat = concatenate_audioclips(audio_clips)`
			`audio_composite = CompositeAudioClip([audio_concat])`
			`audio_composite.write_audiofile(filename, 44100, 2, 2000, None)`
I hope i don't get a virus 3 years ago
			`@staticmethod`
			`def randomvoice():`
			`ok_or_good = random.randrange(1, 10)`
			`if ok_or_good == 1: # 1/10 chance of ok voice`
adds voice config closes #28 3 years ago			`return random.choice(voices)`
			`return random.choice(human) # 9/10 chance of good voice`