RedditVideoMakerBot/TTS/engine_wrapper.py

#!/usr/bin/env python3
from pathlib import Path
from typing import Tuple
import re

# import sox
# from mutagen import MutagenError
# from mutagen.mp3 import MP3, HeaderNotFoundError
import translators as ts
from rich.progress import track
from moviepy.editor import AudioFileClip, CompositeAudioClip, concatenate_audioclips
from utils.console import print_step, print_substep
from utils.voice import sanitize_text
from utils import settings

# Default cap on the combined duration of the generated mp3 clips.
# NOTE(review): presumably seconds, since it is compared with clip durations — confirm.
DEFAULT_MAX_LENGTH: int = 50


class TTSEngine:

    """Calls the given TTS engine to reduce code duplication and allow multiple TTS engines.

    Args:
        tts_module                 : The TTS engine class (not an instance); it is instantiated here with
                                     no arguments. The instance must provide ``run(text, filepath=...)``,
                                     which saves the audio to ``filepath``, and a ``max_chars`` attribute.
        reddit_object              : Dict with the keys ``thread_title``, ``thread_post`` and ``comments``
                                     (an iterable of dicts that each have a ``comment_body``).
        path (Optional)            : The unix style path to save the mp3 files to. This must not have
                                     leading or trailing slashes.
        max_length (Optional)      : The maximum length of the mp3 files in total.
        last_clip_length (Optional): Initial value for the duration of the most recently created clip.

    Notes:
        tts_module must take the arguments text and filepath.
    """

    def __init__(
        self,
        tts_module,
        reddit_object: dict,
        path: str = "assets/temp/mp3",
        max_length: int = DEFAULT_MAX_LENGTH,
        last_clip_length: int = 0,
    ):
        self.tts_module = tts_module()
        self.reddit_object = reddit_object
        self.path = path
        self.max_length = max_length
        # Running total of the durations of every clip created so far.
        self.length = 0
        # Duration of the most recent clip (for a split comment: all of its parts together).
        self.last_clip_length = last_clip_length

    def run(self) -> Tuple[int, int]:
        """Create the mp3 files for the title, the optional post text and the comments.

        Comments are processed in order until the accumulated duration exceeds
        ``max_length``. The overflow is detected at the start of the following
        iteration; the comment that caused it is then discounted again (its
        duration is subtracted and the index is stepped back by one).

        Returns:
            ``(length, idx)`` where ``length`` is the accumulated clip duration and
            ``idx`` is the index of the last comment visited, reduced by one when
            the loop stopped because of the length limit. ``idx`` is ``None`` when
            there are no comments.
        """
        Path(self.path).mkdir(parents=True, exist_ok=True)

        # This file needs to be removed in case this post does not use post text,
        # so that it won't appear in the final video.
        try:
            Path(f"{self.path}/posttext.mp3").unlink()
        except OSError:
            pass

        print_step("Saving Text to MP3 files...")

        self.call_tts("title", process_text(self.reddit_object["thread_title"]))
        processed_text = process_text(self.reddit_object["thread_post"])
        # Explicit comparison kept on purpose: only a config value equal to True enables story mode.
        if processed_text != "" and settings.config["settings"]["storymode"] == True:
            self.call_tts("posttext", processed_text)

        idx = None
        for idx, comment in track(
            enumerate(self.reddit_object["comments"]), "Saving..."
        ):
            # ! Stop creating mp3 files if the length is greater than max length.
            if self.length > self.max_length:
                # The previous clip pushed the total over the limit: discount it.
                self.length -= self.last_clip_length
                idx -= 1
                break

            body = comment["comment_body"]
            if len(body) > self.tts_module.max_chars:
                # Too long for a single TTS request: synthesize it in pieces.
                self.split_post(body, idx)
            else:
                self.call_tts(f"{idx}", process_text(body))

        print_substep("Saved Text to MP3 files successfully.", style="bold green")
        return self.length, idx

    def split_post(self, text: str, idx: int):
        """Synthesize an over-long comment in chunks and merge them into ``{idx}.mp3``.

        The text is cut by a regex into chunks that end at a period (or at the end
        of the text), each holding at most ``max_chars`` characters before that
        final character. Chunks that are empty after ``process_text`` are skipped.
        Every remaining chunk is written to ``{idx}-{n}.part.mp3``; the parts are
        concatenated into ``{idx}.mp3`` and the part files are removed afterwards.

        NOTE(review): a stretch of text that has no period within reach of the
        pattern (and is not close enough to the end of the text) produces no match
        and is therefore not spoken.

        Args:
            text: The raw comment body.
            idx: Index of the comment; used as the base name of the output file.
        """
        # Both fragments are raw strings so that ``\.`` reaches the regex engine
        # untouched instead of being an invalid string escape.
        pattern = r" *(((.|\n){0," + str(self.tts_module.max_chars) + r"})(\.|.$))"
        split_text = [match.group().strip() for match in re.finditer(pattern, text)]

        split_files = []
        try:
            for text_cut in split_text:
                new_text = process_text(text_cut)
                if not new_text or new_text.isspace():
                    continue

                # Parts are numbered consecutively, ignoring skipped chunks.
                part_name = f"{idx}-{len(split_files)}.part"
                self.call_tts(part_name, new_text)
                split_files.append(AudioFileClip(f"{self.path}/{part_name}.mp3"))

            # call_tts only remembers the last part; the whole comment is what has
            # to be discounted if it turns out to exceed the length limit.
            self.last_clip_length = sum(part.duration for part in split_files)

            CompositeAudioClip([concatenate_audioclips(split_files)]).write_audiofile(
                f"{self.path}/{idx}.mp3", fps=44100, verbose=False, logger=None
            )
        finally:
            # Always release the readers and delete the temporary part files,
            # even when synthesis or writing failed part-way through.
            for part in split_files:
                name = part.filename
                part.close()
                Path(name).unlink()

    def call_tts(self, filename: str, text: str):
        """Synthesize ``text`` into ``{path}/{filename}.mp3`` and track its duration.

        On success the clip duration is added to ``self.length`` and stored in
        ``self.last_clip_length``. If the duration cannot be determined, the
        running length is reset to 0 (existing fallback behaviour).

        Args:
            filename: Base name of the mp3 file, without directory or extension.
            text: The text handed to the TTS engine.
        """
        self.tts_module.run(text, filepath=f"{self.path}/{filename}.mp3")
        try:
            clip = AudioFileClip(f"{self.path}/{filename}.mp3")
            try:
                duration = clip.duration
            finally:
                clip.close()
            self.length += duration
            # Always remember the newest clip so that run() discounts the clip
            # that actually caused the overflow.
            self.last_clip_length = duration
        except Exception:
            # Backup contingency: the duration is unknown, so restart the count.
            # KeyboardInterrupt/SystemExit are intentionally not caught.
            self.length = 0


def process_text(text: str):
    """Return ``text`` prepared for the TTS engine.

    If a post language is configured under ``reddit.thread.post_lang``, the
    text is first translated to that language. The result (translated or not)
    is then passed through ``sanitize_text`` exactly once.

    Args:
        text: The raw text taken from the Reddit thread.

    Returns:
        The sanitized, optionally translated text.
    """
    lang = settings.config["reddit"]["thread"]["post_lang"]
    if lang:
        print_substep("Translating Text...")
        # Translate the raw text; sanitizing happens once, on the final text.
        text = ts.google(text, to_language=lang)
    return sanitize_text(text)
Reduced code duplication in TTS engines 3 years ago			`#!/usr/bin/env python3`
			`from pathlib import Path`
			`from typing import Tuple`
			`import re`
fix: Fixed Mutagen error issue style: made final_video.py cleaner 3 years ago
fix: length checker works with new duration code 2 years ago			`# import sox`
			`# from mutagen import MutagenError`
			`# from mutagen.mp3 import MP3, HeaderNotFoundError`
Merge branch 'develop' into feat/better-tts-changer 3 years ago			`import translators as ts`
Reduced code duplication in TTS engines 3 years ago			`from rich.progress import track`
			`from moviepy.editor import AudioFileClip, CompositeAudioClip, concatenate_audioclips`
			`from utils.console import print_step, print_substep`
			`from utils.voice import sanitize_text`
refactor: tts engines now use toml config 2 years ago			`from utils import settings`
refactor: refactored using black formatter. cmd: black . --line-length 101 3 years ago
formatting 2 years ago			`DEFAULT_MAX_LENGTH: int = 50 # video length variable`
refactor: refactored using black formatter. cmd: black . --line-length 101 3 years ago
Reduced code duplication in TTS engines 3 years ago
			`class TTSEngine:`

			`"""Calls the given TTS engine to reduce code duplication and allow multiple TTS engines.`

			`Args:`
			`tts_module : The TTS module. Your module should handle the TTS itself and saving to the given path under the run method.`
			`reddit_object : The reddit object that contains the posts to read.`
			`path (Optional) : The unix style path to save the mp3 files to. This must not have leading or trailing slashes.`
			`max_length (Optional) : The maximum length of the mp3 files in total.`

			`Notes:`
			`tts_module must take the arguments text and filepath.`
			`"""`

			`def __init__(`
			`self,`
			`tts_module,`
			`reddit_object: dict,`
Fix small bugs and path issues 3 years ago			`path: str = "assets/temp/mp3",`
formatting 2 years ago			`max_length: int = DEFAULT_MAX_LENGTH,`
			`last_clip_length: int = 0,`
Reduced code duplication in TTS engines 3 years ago			`):`
			`self.tts_module = tts_module()`
			`self.reddit_object = reddit_object`
			`self.path = path`
			`self.max_length = max_length`
			`self.length = 0`
formatting 2 years ago			`self.last_clip_length = last_clip_length`
Reduced code duplication in TTS engines 3 years ago
			`def run(self) -> Tuple[int, int]:`

			`Path(self.path).mkdir(parents=True, exist_ok=True)`

background audio implementation 2 years ago			`# This file needs to be removed in case this post does not use post text, so that it won't appear in the final video`
Reduced code duplication in TTS engines 3 years ago			`try:`
			`Path(f"{self.path}/posttext.mp3").unlink()`
			`except OSError:`
			`pass`

			`print_step("Saving Text to MP3 files...")`

process text before all calls to call_tts Process_text now called before call_tts to ensure it is called minimally while allowing for verification that text is not empty 2 years ago			`self.call_tts("title", process_text(self.reddit_object["thread_title"]))`
			`processed_text = process_text(self.reddit_object["thread_post"])`
fixed a error(self-made), added default values 2 years ago			`if processed_text != "" and settings.config["settings"]["storymode"] == True:`
process text before all calls to call_tts Process_text now called before call_tts to ensure it is called minimally while allowing for verification that text is not empty 2 years ago			`self.call_tts("posttext", processed_text)`
Reduced code duplication in TTS engines 3 years ago
			`idx = None`
formatting 2 years ago			`for idx, comment in track(`
			`enumerate(self.reddit_object["comments"]), "Saving..."`
			`):`
Reduced code duplication in TTS engines 3 years ago			`# ! Stop creating mp3 files if the length is greater than max length.`
			`if self.length > self.max_length:`
formatting 2 years ago			`self.length -= self.last_clip_length`
			`idx -= 1`
Reduced code duplication in TTS engines 3 years ago			`break`
background audio implementation 2 years ago			`if (`
			`len(comment["comment_body"]) > self.tts_module.max_chars`
			`): # Split the comment if it is too long`
			`self.split_post(comment["comment_body"], idx) # Split the comment`
			`else: # If the comment is not too long, just call the tts engine`
process text before all calls to call_tts Process_text now called before call_tts to ensure it is called minimally while allowing for verification that text is not empty 2 years ago			`self.call_tts(f"{idx}", process_text(comment["comment_body"]))`
Reduced code duplication in TTS engines 3 years ago
			`print_substep("Saved Text to MP3 files successfully.", style="bold green")`
			`return self.length, idx`

fix: stop broken typechecking 2 years ago			`def split_post(self, text: str, idx: int):`
Reduced code duplication in TTS engines 3 years ago			`split_files = []`
			`split_text = [`
			`x.group().strip()`
fix: regex splitter no longer skips newlines 2 years ago			`for x in re.finditer(`
			`r" *(((.\|\n){0," + str(self.tts_module.max_chars) + "})(\.\|.$))", text`
			`)`
Reduced code duplication in TTS engines 3 years ago			`]`
fix: dont use blank text splits 2 years ago			`offset = 0`
Reduced code duplication in TTS engines 3 years ago			`for idy, text_cut in enumerate(split_text):`
Remove debug statements 3 years ago			`# print(f"{idx}-{idy}: {text_cut}\n")`
fixed a error(self-made), added default values 2 years ago			`new_text = process_text(text_cut)`
improved efficiency of empty text check 2 years ago			`if not new_text or new_text.isspace():`
fix: dont use blank text splits 2 years ago			`offset += 1`
background audio implementation 2 years ago			`continue`

improved efficiency of empty text check 2 years ago			`self.call_tts(f"{idx}-{idy - offset}.part", new_text)`
formatting 2 years ago			`split_files.append(`
			`AudioFileClip(f"{self.path}/{idx}-{idy - offset}.part.mp3")`
			`)`
fix: dont use blank text splits 2 years ago
Reduced code duplication in TTS engines 3 years ago			`CompositeAudioClip([concatenate_audioclips(split_files)]).write_audiofile(`
			`f"{self.path}/{idx}.mp3", fps=44100, verbose=False, logger=None`
			`)`

fix: close ALL clips when finished 2 years ago			`for i in split_files:`
			`name = i.filename`
			`i.close()`
			`Path(name).unlink()`

			`# for i in range(0, idy + 1):`
style: format with python-black 2 years ago			`# print(f"Cleaning up {self.path}/{idx}-{i}.part.mp3")`
fix: close ALL clips when finished 2 years ago
style: format with python-black 2 years ago			`# Path(f"{self.path}/{idx}-{i}.part.mp3").unlink()`
Reduced code duplication in TTS engines 3 years ago
			`def call_tts(self, filename: str, text: str):`
fixed a error(self-made), added default values 2 years ago			`self.tts_module.run(text, filepath=f"{self.path}/{filename}.mp3")`
fix: mutagen error - moved to moviepy duration 2 years ago			`# try:`
			`# self.length += MP3(f"{self.path}/{filename}.mp3").info.length`
			`# except (MutagenError, HeaderNotFoundError):`
			`# self.length += sox.file_info.duration(f"{self.path}/{filename}.mp3")`
added backup contingency 2 years ago			`try:`
			`clip = AudioFileClip(f"{self.path}/{filename}.mp3")`
formatting 2 years ago			`if clip.duration + self.length < self.max_length:`
			`self.last_clip_length = clip.duration`
added backup contingency 2 years ago			`self.length += clip.duration`
			`clip.close()`
			`except:`
			`self.length = 0`
fix: length checker works with new duration code 2 years ago
style: format with python-black 2 years ago
Merge branch 'develop' into feat/better-tts-changer 3 years ago			`def process_text(text: str):`
refactor: tts engines now use toml config 2 years ago			`lang = settings.config["reddit"]["thread"]["post_lang"]`
Merge branch 'develop' into feat/better-tts-changer 3 years ago			`new_text = sanitize_text(text)`
			`if lang:`
			`print_substep("Translating Text...")`
Update engine_wrapper.py Fixed not sanitizing the text issue that occurs if POSTLANG is set 3 years ago			`translated_text = ts.google(text, to_language=lang)`
			`new_text = sanitize_text(translated_text)`
Merge branch 'develop' into feat/better-tts-changer 3 years ago			`return new_text`