# RedditVideoMakerBot/TTS/engine_wrapper.py

import os
import re
import subprocess
from pathlib import Path
from typing import Tuple

import numpy as np
import translators
from moviepy.audio.AudioClip import AudioClip
from moviepy.audio.fx.volumex import volumex
from moviepy.editor import AudioFileClip
from rich.progress import track

from utils import settings
from utils.console import print_step, print_substep
from utils.voice import sanitize_text


# Default cap on the total TTS audio length; TTSEngine.run compares it against the
# summed clip durations. Edit this at your own risk: other values should work, but
# they are not supported.
DEFAULT_MAX_LENGTH: int = 50


class TTSEngine:

    """Calls the given TTS engine to reduce code duplication and allow multiple TTS engines.

    Args:
        tts_module                  : The TTS module class. It is instantiated here with no arguments;
                                      the instance handles the TTS itself and saves to the given path
                                      in its run method.
        reddit_object               : The reddit object that contains the posts to read.
        path (Optional)             : Base directory for the mp3 files. The sanitized thread id and
                                      "/mp3" are appended directly, so it must end with a slash.
        max_length (Optional)       : The maximum length of the mp3 files in total.
        last_clip_length (Optional) : Initial value for the duration of the most recent clip;
                                      overwritten by every successful call_tts.

    Notes:
        The tts_module instance must expose a ``max_chars`` attribute and a
        ``run(text, filepath=..., random_voice=...)`` method.
    """

    def __init__(
        self,
        tts_module,
        reddit_object: dict,
        path: str = "assets/temp/",
        max_length: int = DEFAULT_MAX_LENGTH,
        last_clip_length: int = 0,
    ):
        self.tts_module = tts_module()
        self.reddit_object = reddit_object

        # Keep only word characters, whitespace and dashes so the id is safe as a directory name.
        self.redditid = re.sub(r"[^\w\s-]", "", reddit_object["thread_id"])
        self.path = path + self.redditid + "/mp3"
        self.max_length = max_length
        self.length = 0  # running total of the clip durations added by call_tts
        self.last_clip_length = last_clip_length

    def add_periods(self):
        """Normalise every comment body in place so the TTS does not blend sentences.

        Links are removed, newlines become sentence breaks, "AI"/"AGI" are spelled
        out with dots, a trailing period is ensured, and the runs of periods those
        steps create are collapsed again.
        """
        # Compiled once instead of once per comment.
        url_pattern = re.compile(
            r"((http|https)\:\/\/)?[a-zA-Z0-9\.\/\?\:@\-_=#]+\.([a-zA-Z]){2,6}([a-zA-Z0-9\.\&\/\?\:@\-_=#])*"
        )
        for comment in self.reddit_object["comments"]:
            body = url_pattern.sub(" ", comment["comment_body"])  # remove links
            body = body.replace("\n", ". ")
            body = re.sub(r"\bAI\b", "A.I", body)
            body = re.sub(r"\bAGI\b", "A.G.I", body)
            # endswith() instead of body[-1]: an empty body must not raise IndexError.
            if not body.endswith("."):
                body += "."
            body = body.replace(". . .", ".")
            body = body.replace(".. . ", ".")
            body = body.replace(". . ", ".")
            body = re.sub(r'\."\.', '".', body)
            comment["comment_body"] = body

    def run(self) -> Tuple[int, int]:
        """Generate the mp3 files for the title and the post/comments.

        Returns:
            A ``(length, idx)`` tuple: the total duration accumulated by call_tts
            and the index of the last loop item handled (0 when no loop ran).
        """
        Path(self.path).mkdir(parents=True, exist_ok=True)
        print_step("Saving Text to MP3 files...")

        self.add_periods()
        self.call_tts("title", process_text(self.reddit_object["thread_title"]))
        idx = 0

        if settings.config["settings"]["storymode"]:
            if settings.config["settings"]["storymodemethod"] == 0:
                # Method 0: the whole post becomes a single "postaudio" file.
                if len(self.reddit_object["thread_post"]) > self.tts_module.max_chars:
                    self.split_post(self.reddit_object["thread_post"], "postaudio")
                else:
                    self.call_tts("postaudio", process_text(self.reddit_object["thread_post"]))
            elif settings.config["settings"]["storymodemethod"] == 1:
                # Method 1: thread_post is iterated item by item, one file per item.
                for idx, text in track(enumerate(self.reddit_object["thread_post"])):
                    self.call_tts(f"postaudio-{idx}", process_text(text))

        else:
            for idx, comment in track(enumerate(self.reddit_object["comments"]), "Saving..."):
                # ! Stop creating mp3 files if the length is greater than max length.
                if self.length > self.max_length and idx > 1:
                    # Drop the clip that pushed the total over the limit.
                    self.length -= self.last_clip_length
                    idx -= 1
                    break
                if len(comment["comment_body"]) > self.tts_module.max_chars:
                    # Too long for one TTS request: split it and stitch the parts together.
                    self.split_post(comment["comment_body"], idx)
                else:
                    self.call_tts(f"{idx}", process_text(comment["comment_body"]))

        print_substep("Saved Text to MP3 files successfully.", style="bold green")
        return self.length, idx

    def split_post(self, text: str, idx):
        """Synthesise a text longer than ``max_chars`` in parts and join them into ``{idx}.mp3``.

        Args:
            text: The text to split and read.
            idx: Base name of the output file (a comment index or "postaudio").
        """
        max_chars = self.tts_module.max_chars
        # Chunks of at most max_chars characters that end on a period (or at the end of the text).
        chunk_pattern = rf" *(((.|\n){{0,{max_chars}}})(\.|.$))"
        split_text = [match.group().strip() for match in re.finditer(chunk_pattern, text)]
        self.create_silence_mp3()

        # Only parts that were actually synthesised are recorded; listing a skipped
        # (blank) part would make the ffmpeg concat fail on the missing file.
        part_names = []
        for idy, text_cut in enumerate(split_text):
            newtext = process_text(text_cut)
            if not newtext or newtext.isspace():
                print("newtext was blank because sanitized split text resulted in none")
                continue
            self.call_tts(f"{idx}-{idy}.part", newtext)
            part_names.append(f"{idx}-{idy}.part.mp3")

        if part_names:
            list_path = f"{self.path}/list.txt"
            # Entries are bare file names; list.txt sits in the same directory as the parts.
            with open(list_path, "w") as f:
                f.writelines(f"file '{name}'\n" for name in part_names)
                f.write("file 'silence.mp3'\n")

            # Argument list instead of a shell string, so paths with spaces work.
            command = [
                "ffmpeg",
                "-f",
                "concat",
                "-y",
                "-hide_banner",
                "-loglevel",
                "panic",
                "-safe",
                "0",
                "-i",
                list_path,
                "-c",
                "copy",
                f"{self.path}/{idx}.mp3",
            ]
            try:
                failed = subprocess.run(command, check=False).returncode != 0
            except OSError:
                # e.g. ffmpeg is not installed; stay best-effort like the old os.system call.
                failed = True
            if failed:
                print(f"ffmpeg could not concatenate the parts of {idx}.mp3")

        # Remove the intermediate parts; one failure must not stop the rest of the cleanup.
        for name in part_names:
            try:
                os.unlink(f"{self.path}/{name}")
            except FileNotFoundError as e:
                print("File not found: " + str(e.filename))
            except OSError:
                print("OSError")

    def call_tts(self, filename: str, text: str):
        """Synthesise ``text`` into ``{self.path}/{filename}.mp3`` and add its duration to the total.

        Args:
            filename: Output file name without the ".mp3" extension.
            text: The text handed to the TTS module.
        """
        filepath = f"{self.path}/{filename}.mp3"
        self.tts_module.run(
            text,
            filepath=filepath,
            random_voice=settings.config["settings"]["tts"]["random_voice"],
        )
        clip = None
        try:
            clip = AudioFileClip(filepath)
            self.last_clip_length = clip.duration
            self.length += clip.duration
        except Exception:
            # Exception rather than a bare except, so Ctrl-C and SystemExit still propagate.
            print(f"Could not read the duration of {filepath}")
            # NOTE(review): existing contingency kept as is - an unreadable clip resets
            # the whole running total, which also resets the max_length check in run().
            self.length = 0
        finally:
            if clip is not None:
                clip.close()

    def create_silence_mp3(self):
        """Write ``silence.mp3`` into ``self.path``, lasting the configured ``silence_duration``."""
        silence_duration = settings.config["settings"]["tts"]["silence_duration"]
        silence = AudioClip(
            make_frame=lambda t: np.sin(440 * 2 * np.pi * t),
            duration=silence_duration,
            fps=44100,
        )
        # Volume factor 0 turns the generated sine tone into silence.
        silence = volumex(silence, 0)
        silence.write_audiofile(f"{self.path}/silence.mp3", fps=44100, verbose=False, logger=None)


def process_text(text: str, clean: bool = True):
    """Prepare ``text`` for the TTS engine, translating it when a post language is configured.

    Args:
        text: The raw text.
        clean: Whether to sanitize the text when no translation takes place.
            Translated text is always sanitized, regardless of this flag.

    Returns:
        The sanitized translation when ``post_lang`` is set in the config,
        otherwise the sanitized text (or ``text`` unchanged when ``clean`` is False).
    """
    lang = settings.config["reddit"]["thread"]["post_lang"]
    if lang:
        # Translate the raw text directly; sanitizing the untranslated text first
        # would be thrown away.
        print_substep("Translating Text...")
        translated_text = translators.translate_text(text, translator="google", to_language=lang)
        return sanitize_text(translated_text)
    return sanitize_text(text) if clean else text
Add tonywiththetommy's changes 2 years ago			`import os`
Add silence inbetween tts 2 years ago			`import re`
Reduced code duplication in TTS engines 3 years ago			`from pathlib import Path`
			`from typing import Tuple`
fix: Fixed Mutagen error issue style: made final_video.py cleaner 3 years ago
Add tonywiththetommy's changes 2 years ago			`import numpy as np`
Couple of fixes including translators fix 2 years ago			`import translators`
Add tonywiththetommy's changes 2 years ago			`from moviepy.audio.AudioClip import AudioClip`
			`from moviepy.audio.fx.volumex import volumex`
Add silence inbetween tts 2 years ago			`from moviepy.editor import AudioFileClip`
Reduced code duplication in TTS engines 3 years ago			`from rich.progress import track`
fixed https://github.com/elebumm/RedditVideoMakerBot/commit/71c317da23b02b4228376ebeab35e0a405a687e9 by removing match usage (3.10+ only) optimized imports 2 years ago
			`from utils import settings`
Reduced code duplication in TTS engines 3 years ago			`from utils.console import print_step, print_substep`
			`from utils.voice import sanitize_text`
refactor: refactored using black formatter. cmd: black . --line-length 101 3 years ago
Merge branch 'dev' of https://github.com/electro199/RedditVideoMakerBot into dev 2 years ago
fixup: Format Python code with Black 2 years ago			`DEFAULT_MAX_LENGTH: int = (`
			`50 # Video length variable, edit this on your own risk. It should work, but it's not supported`
			`)`
A lot of reformatting and a couple of bug fixes 2 years ago
Reduced code duplication in TTS engines 3 years ago
			`class TTSEngine:`

			`"""Calls the given TTS engine to reduce code duplication and allow multiple TTS engines.`

			`Args:`
Add silence inbetween tts 2 years ago			`tts_module : The TTS module. Your module should handle the TTS itself and saving to the given path under the run method.`
Reduced code duplication in TTS engines 3 years ago			`reddit_object : The reddit object that contains the posts to read.`
			`path (Optional) : The unix style path to save the mp3 files to. This must not have leading or trailing slashes.`
			`max_length (Optional) : The maximum length of the mp3 files in total.`

			`Notes:`
			`tts_module must take the arguments text and filepath.`
			`"""`

			`def __init__(`
			`self,`
			`tts_module,`
			`reddit_object: dict,`
Bot can run multiple instances at the same time (#1091) * Bot can run multiple instances at the same time * Delete TTS/__pycache__ directory * Delete video_creation/__pycache__ directory * Delete videos.json * Delete utils/__pycache__ directory * Create videos.json * Moved id to utils * Added cleanup in shutdown and fixed bug * Removed watermark todo and fixed it * Delete final_video.py * Update final_video.py * Delete video.py * Update video.py * Delete id.py * feat: meaningful error message for bad credentials * chore: remove comment reference to .env Co-authored-by: Callum Leslie <git@cleslie.uk> 2 years ago			`path: str = "assets/temp/",`
formatting 2 years ago			`max_length: int = DEFAULT_MAX_LENGTH,`
			`last_clip_length: int = 0,`
Reduced code duplication in TTS engines 3 years ago			`):`
			`self.tts_module = tts_module()`
			`self.reddit_object = reddit_object`
Added the stroy mode with two method and add min comment lenght 2 years ago
Bot can run multiple instances at the same time (#1091) * Bot can run multiple instances at the same time * Delete TTS/__pycache__ directory * Delete video_creation/__pycache__ directory * Delete videos.json * Delete utils/__pycache__ directory * Create videos.json * Moved id to utils * Added cleanup in shutdown and fixed bug * Removed watermark todo and fixed it * Delete final_video.py * Update final_video.py * Delete video.py * Update video.py * Delete id.py * feat: meaningful error message for bad credentials * chore: remove comment reference to .env Co-authored-by: Callum Leslie <git@cleslie.uk> 2 years ago			`self.redditid = re.sub(r"[^\w\s-]", "", reddit_object["thread_id"])`
			`self.path = path + self.redditid + "/mp3"`
Reduced code duplication in TTS engines 3 years ago			`self.max_length = max_length`
			`self.length = 0`
formatting 2 years ago			`self.last_clip_length = last_clip_length`
Reduced code duplication in TTS engines 3 years ago
Reformat 2 years ago			`def add_periods(`
			`self,`
			`): # adds periods to the end of paragraphs (where people often forget to put them) so tts doesn't blend sentences`
fix: tts blending sentences from diff. paragraphs 2 years ago			`for comment in self.reddit_object["comments"]:`
add periods fix 2 years ago			`# remove links`
			`regex_urls = r"((http\|https)\:\/\/)?[a-zA-Z0-9\.\/\?\:@\-_=#]+\.([a-zA-Z]){2,6}([a-zA-Z0-9\.\&\/\?\:@\-_=#])*"`
			`comment["comment_body"] = re.sub(regex_urls, " ", comment["comment_body"])`
Reformat 2 years ago			`comment["comment_body"] = comment["comment_body"].replace("\n", ". ")`
Reformat 2 years ago			`comment["comment_body"] = re.sub(r"\bAI\b", "A.I", comment["comment_body"])`
fixup: Format Python code with Black 2 years ago			`comment["comment_body"] = re.sub(r"\bAGI\b", "A.G.I", comment["comment_body"])`
Reformat 2 years ago			`if comment["comment_body"][-1] != ".":`
			`comment["comment_body"] += "."`
add periods fix 2 years ago			`comment["comment_body"] = comment["comment_body"].replace(". . .", ".")`
			`comment["comment_body"] = comment["comment_body"].replace(".. . ", ".")`
			`comment["comment_body"] = comment["comment_body"].replace(". . ", ".")`
			`comment["comment_body"] = re.sub(r'\."\.', '".', comment["comment_body"])`
Reduced code duplication in TTS engines 3 years ago
			`def run(self) -> Tuple[int, int]:`
A lot of reformatting and a couple of bug fixes 2 years ago			`Path(self.path).mkdir(parents=True, exist_ok=True)`
Reduced code duplication in TTS engines 3 years ago			`print_step("Saving Text to MP3 files...")`
A lot of reformatting and a couple of bug fixes 2 years ago
fix: tts blending sentences from diff. paragraphs 2 years ago			`self.add_periods()`
process text before all calls to call_tts Process_text now called before call_tts to ensure it is called minimally while allowing for verification that text is not empty 2 years ago			`self.call_tts("title", process_text(self.reddit_object["thread_title"]))`
Added the stroy mode with two method and add min comment lenght 2 years ago			`# processed_text = ##self.reddit_object["thread_post"] != ""`
better err handle and run.bat 2 years ago			`idx = 0`
Merge branch 'develop' into master 2 years ago
A lot of reformatting and a couple of bug fixes 2 years ago			`if settings.config["settings"]["storymode"]:`
edited some bug and typo 2 years ago			`if settings.config["settings"]["storymodemethod"] == 0:`
A lot of reformatting and a couple of bug fixes 2 years ago			`if len(self.reddit_object["thread_post"]) > self.tts_module.max_chars:`
Added the stroy mode with two method and add min comment lenght 2 years ago			`self.split_post(self.reddit_object["thread_post"], "postaudio")`
A lot of reformatting and a couple of bug fixes 2 years ago			`else:`
fixup: Format Python code with Black 2 years ago			`self.call_tts("postaudio", process_text(self.reddit_object["thread_post"]))`
edited some bug and typo 2 years ago			`elif settings.config["settings"]["storymodemethod"] == 1:`
A lot of reformatting and a couple of bug fixes 2 years ago			`for idx, text in track(enumerate(self.reddit_object["thread_post"])):`
			`self.call_tts(f"postaudio-{idx}", process_text(text))`

			`else:`
fixup: Format Python code with Black 2 years ago			`for idx, comment in track(enumerate(self.reddit_object["comments"]), "Saving..."):`
Added the stroy mode with two method and add min comment lenght 2 years ago			`# ! Stop creating mp3 files if the length is greater than max length.`
			`if self.length > self.max_length and idx > 1:`
			`self.length -= self.last_clip_length`
			`idx -= 1`
			`break`
			`if (`
			`len(comment["comment_body"]) > self.tts_module.max_chars`
			`): # Split the comment if it is too long`
			`self.split_post(comment["comment_body"], idx) # Split the comment`
			`else: # If the comment is not too long, just call the tts engine`
			`self.call_tts(f"{idx}", process_text(comment["comment_body"]))`
Reduced code duplication in TTS engines 3 years ago
			`print_substep("Saved Text to MP3 files successfully.", style="bold green")`
			`return self.length, idx`

Added the stroy mode with two method and add min comment lenght 2 years ago			`def split_post(self, text: str, idx):`
Reduced code duplication in TTS engines 3 years ago			`split_files = []`
			`split_text = [`
A lot of reformatting and a couple of bug fixes 2 years ago			`x.group().strip()`
			`for x in re.finditer(`
			`r" *(((.\|\n){0," + str(self.tts_module.max_chars) + "})(\.\|.$))", text`
			`)`
Reduced code duplication in TTS engines 3 years ago			`]`
Add silence inbetween tts 2 years ago			`self.create_silence_mp3()`
fix: dont use blank text splits 3 years ago
Add tonywiththetommy's changes 2 years ago			`idy = None`
Reduced code duplication in TTS engines 3 years ago			`for idy, text_cut in enumerate(split_text):`
Add tonywiththetommy's changes 2 years ago			`newtext = process_text(text_cut)`
			`# print(f"{idx}-{idy}: {newtext}\n")`
fix: close ALL clips when finished 3 years ago
Add tonywiththetommy's changes 2 years ago			`if not newtext or newtext.isspace():`
			`print("newtext was blank because sanitized split text resulted in none")`
			`continue`
			`else:`
			`self.call_tts(f"{idx}-{idy}.part", newtext)`
A lot of reformatting and a couple of bug fixes 2 years ago			`with open(f"{self.path}/list.txt", "w") as f:`
Add tonywiththetommy's changes 2 years ago			`for idz in range(0, len(split_text)):`
			`f.write("file " + f"'{idx}-{idz}.part.mp3'" + "\n")`
			`split_files.append(str(f"{self.path}/{idx}-{idy}.part.mp3"))`
			`f.write("file " + f"'silence.mp3'" + "\n")`

A lot of reformatting and a couple of bug fixes 2 years ago			`os.system(`
			`"ffmpeg -f concat -y -hide_banner -loglevel panic -safe 0 "`
			`+ "-i "`
			`+ f"{self.path}/list.txt "`
			`+ "-c copy "`
			`+ f"{self.path}/{idx}.mp3"`
			`)`
Add tonywiththetommy's changes 2 years ago			`try:`
			`for i in range(0, len(split_files)):`
			`os.unlink(split_files[i])`
Add silence inbetween tts 2 years ago			`except FileNotFoundError as e:`
			`print("File not found: " + e.filename)`
Add tonywiththetommy's changes 2 years ago			`except OSError:`
			`print("OSError")`
Reduced code duplication in TTS engines 3 years ago
			`def call_tts(self, filename: str, text: str):`
Reformat 2 years ago			`self.tts_module.run(`
			`text,`
			`filepath=f"{self.path}/{filename}.mp3",`
			`random_voice=settings.config["settings"]["tts"]["random_voice"],`
			`)`
Reformat 2 years ago			`# try:`
			`# self.length += MP3(f"{self.path}/{filename}.mp3").info.length`
			`# except (MutagenError, HeaderNotFoundError):`
			`# self.length += sox.file_info.duration(f"{self.path}/{filename}.mp3")`
added backup contingency 3 years ago			`try:`
			`clip = AudioFileClip(f"{self.path}/{filename}.mp3")`
Correct video length 2 years ago			`self.last_clip_length = clip.duration`
Fixed,added: 0.mp3 not found and only translate 2 years ago			`self.length += clip.duration`
added backup contingency 3 years ago			`clip.close()`
			`except:`
			`self.length = 0`
fix: length checker works with new duration code 3 years ago
Add silence inbetween tts 2 years ago			`def create_silence_mp3(self):`
			`silence_duration = settings.config["settings"]["tts"]["silence_duration"]`
A lot of reformatting and a couple of bug fixes 2 years ago			`silence = AudioClip(`
			`make_frame=lambda t: np.sin(440 * 2 * np.pi * t),`
			`duration=silence_duration,`
			`fps=44100,`
			`)`
Add silence inbetween tts 2 years ago			`silence = volumex(silence, 0)`
fixup: Format Python code with Black 2 years ago			`silence.write_audiofile(f"{self.path}/silence.mp3", fps=44100, verbose=False, logger=None)`
fix: length checker works with new duration code 3 years ago
style: format with python-black 3 years ago
Reformat 2 years ago			`def process_text(text: str, clean: bool = True):`
refactor: tts engines now use toml config 3 years ago			`lang = settings.config["reddit"]["thread"]["post_lang"]`
Fixed,added: 0.mp3 not found and only translate 2 years ago			`new_text = sanitize_text(text) if clean else text`
Merge branch 'develop' into feat/better-tts-changer 3 years ago			`if lang:`
			`print_substep("Translating Text...")`
Fix translators 2 years ago			`translated_text = translators.translate_text(text, translator="google", to_language=lang)`
Update engine_wrapper.py Fixed not sanitizing the text issue that occurs if POSTLANG is set 3 years ago			`new_text = sanitize_text(translated_text)`
Merge branch 'develop' into feat/better-tts-changer 3 years ago			`return new_text`