RedditVideoMakerBot/TTS/engine_wrapper.py

#!/usr/bin/env python3
from pathlib import Path
from typing import Tuple
import re

# import sox
# from mutagen import MutagenError
# from mutagen.mp3 import MP3, HeaderNotFoundError
import translators as ts
from rich.progress import track
from moviepy.editor import AudioFileClip, CompositeAudioClip, concatenate_audioclips
from utils.console import print_step, print_substep
from utils.voice import sanitize_text
from utils import settings

# Default cap on the total narration length. It is compared against the running
# sum of moviepy ``clip.duration`` values (moviepy reports durations in seconds).
DEFAULT_MAX_LENGTH: int = 40


class TTSEngine:
    """Calls the given TTS engine to reduce code duplication and allow multiple TTS engines.

    Args:
        tts_module            : The TTS module class. It is instantiated with no arguments; the
                                instance must expose ``max_chars`` and a ``run`` method that
                                performs the TTS and saves the audio to the given path.
        reddit_object         : The reddit object that contains the posts to read. The keys read
                                here are ``thread_id``, ``thread_title``, ``thread_post`` and
                                ``comments`` (each comment providing ``comment_body``).
        path (Optional)       : The unix style base path to save the mp3 files to. It is
                                concatenated directly with the sanitized thread id, so it must
                                end with a slash (as the default ``"assets/temp/"`` does).
        max_length (Optional) : The maximum length of the mp3 files in total.
        last_clip_length (Optional) : Initial value for the duration of the most recent clip.

    Notes:
        tts_module.run must take the arguments text and filepath.
    """

    def __init__(
        self,
        tts_module,
        reddit_object: dict,
        path: str = "assets/temp/",
        max_length: int = DEFAULT_MAX_LENGTH,
        last_clip_length: int = 0,
    ):
        """Instantiate the TTS module and derive the per-thread output directory."""
        self.tts_module = tts_module()
        self.reddit_object = reddit_object

        # Keep only word characters, whitespace and dashes so the id is usable in a path.
        self.redditid = re.sub(r"[^\w\s-]", "", reddit_object["thread_id"])
        self.path = path + self.redditid + "/mp3"
        self.max_length = max_length
        self.length = 0
        self.last_clip_length = last_clip_length

    def run(self) -> Tuple[int, int]:
        """Synthesize the title plus either the post (story mode) or the comments.

        Returns:
            A ``(length, idx)`` tuple. ``length`` is the accumulated clip duration tracked by
            ``call_tts``. ``idx`` is the last loop index reached; it stays ``None`` when no
            indexed loop ran (story mode method 0, or nothing to iterate), and it is
            decremented by one when the comment loop stops early because ``max_length`` was
            exceeded.
        """
        Path(self.path).mkdir(parents=True, exist_ok=True)
        print_step("Saving Text to MP3 files...")

        self.call_tts("title", process_text(self.reddit_object["thread_title"]))
        idx = None
        if settings.config["settings"]["storymode"]:
            if settings.config["settings"]["storymodemethode"] == 0:
                # Method 0: the whole post becomes one "postaudio" file.
                if len(self.reddit_object["thread_post"]) > self.tts_module.max_chars:
                    self.split_post(self.reddit_object["thread_post"], "postaudio")
                else:
                    self.call_tts("postaudio", process_text(self.reddit_object["thread_post"]))
            elif settings.config["settings"]["storymodemethode"] == 1:
                # Method 1: thread_post is iterated and each item gets its own file.
                for idx, text in enumerate(self.reddit_object["thread_post"]):
                    self.call_tts(f"posttext-{idx}", process_text(text))
        else:
            for idx, comment in track(enumerate(self.reddit_object["comments"]), "Saving..."):
                # ! Stop creating mp3 files if the length is greater than max length.
                if self.length > self.max_length and idx > 1:
                    # Drop the clip that pushed the total over the limit from the count.
                    self.length -= self.last_clip_length
                    idx -= 1
                    break
                if len(comment["comment_body"]) > self.tts_module.max_chars:
                    # Too long for a single TTS call: synthesize in parts and merge.
                    self.split_post(comment["comment_body"], idx)
                else:
                    self.call_tts(f"{idx}", process_text(comment["comment_body"]))

        print_substep("Saved Text to MP3 files successfully.", style="bold green")
        return self.length, idx

    def split_post(self, text: str, idx):
        """Synthesize ``text`` in chunks of at most ``max_chars`` and merge them into one mp3.

        Each non-blank chunk is written to ``{idx}-{n}.part.mp3``; the parts are then
        concatenated into ``{idx}.mp3`` and the part files are removed.

        Args:
            text: The text that is too long for a single TTS call.
            idx: Name stem of the output file (a comment index or a label such as "postaudio").
        """
        # Each match is up to max_chars characters (newlines included) ending at a period,
        # or the final stretch of the text. Both fragments are raw strings so that ``\.``
        # reaches the regex engine unchanged instead of being an invalid string escape.
        chunk_pattern = r" *(((.|\n){0," + str(self.tts_module.max_chars) + r"})(\.|.$))"
        split_text = [match.group().strip() for match in re.finditer(chunk_pattern, text)]

        split_files = []
        try:
            offset = 0  # number of blank chunks skipped, keeps part numbering contiguous
            for idy, text_cut in enumerate(split_text):
                new_text = process_text(text_cut)
                if not new_text or new_text.isspace():
                    offset += 1
                    continue

                part_name = f"{idx}-{idy - offset}.part"
                self.call_tts(part_name, new_text)
                split_files.append(AudioFileClip(f"{self.path}/{part_name}.mp3"))

            CompositeAudioClip([concatenate_audioclips(split_files)]).write_audiofile(
                f"{self.path}/{idx}.mp3", fps=44100, verbose=False, logger=None
            )
        finally:
            # Always release the part clips and delete their files, even if synthesis or
            # the merge failed part-way through.
            for part_clip in split_files:
                part_path = part_clip.filename
                part_clip.close()
                Path(part_path).unlink()

    def call_tts(self, filename: str, text: str):
        """Run the TTS module for ``text`` and add the resulting clip's duration to the total.

        Args:
            filename: Name of the mp3 file (without extension) inside ``self.path``.
            text: The text to synthesize.
        """
        self.tts_module.run(text, filepath=f"{self.path}/{filename}.mp3")
        clip = None
        try:
            clip = AudioFileClip(f"{self.path}/{filename}.mp3")
            self.last_clip_length = clip.duration
            self.length += clip.duration
        except Exception:
            # Backup contingency kept from the original behavior: if the duration cannot be
            # read, the running total is reset instead of aborting the run.
            # NOTE(review): resetting to 0 discards the durations accumulated so far —
            # confirm this is intended rather than leaving the total unchanged.
            self.length = 0
        finally:
            if clip is not None:
                clip.close()


def process_text(text: str):
    """Sanitize ``text`` for TTS, translating it first when a post language is configured.

    The target language is read from ``settings.config["reddit"]["thread"]["post_lang"]``.
    When it is falsy the sanitized original text is returned; otherwise the original text
    is translated to that language and the sanitized translation is returned.
    """
    target_lang = settings.config["reddit"]["thread"]["post_lang"]
    sanitized = sanitize_text(text)
    if not target_lang:
        return sanitized

    print_substep("Translating Text...")
    # The raw (unsanitized) text is what gets translated; sanitizing happens afterwards.
    return sanitize_text(ts.google(text, to_language=target_lang))
Reduced code duplication in TTS engines 2 years ago			`#!/usr/bin/env python3`
			`from pathlib import Path`
			`from typing import Tuple`
			`import re`
fix: Fixed Mutagen error issue style: made final_video.py cleaner 2 years ago
fix: length checker works with new duration code 2 years ago			`# import sox`
			`# from mutagen import MutagenError`
			`# from mutagen.mp3 import MP3, HeaderNotFoundError`
Merge branch 'develop' into feat/better-tts-changer 2 years ago			`import translators as ts`
Reduced code duplication in TTS engines 2 years ago			`from rich.progress import track`
			`from moviepy.editor import AudioFileClip, CompositeAudioClip, concatenate_audioclips`
			`from utils.console import print_step, print_substep`
			`from utils.voice import sanitize_text`
refactor: tts engines now use toml config 2 years ago			`from utils import settings`
refactor: refactored using black formatter. cmd: black . --line-length 101 2 years ago
Added the stroy mode with two method and add min comment lenght 2 years ago			`DEFAULT_MAX_LENGTH: int = 40 # video length variable`
Reduced code duplication in TTS engines 2 years ago
			`class TTSEngine:`

			`"""Calls the given TTS engine to reduce code duplication and allow multiple TTS engines.`

			`Args:`
			`tts_module : The TTS module. Your module should handle the TTS itself and saving to the given path under the run method.`
			`reddit_object : The reddit object that contains the posts to read.`
			`path (Optional) : The unix style path to save the mp3 files to. This must not have leading or trailing slashes.`
			`max_length (Optional) : The maximum length of the mp3 files in total.`

			`Notes:`
			`tts_module must take the arguments text and filepath.`
			`"""`

			`def __init__(`
			`self,`
			`tts_module,`
			`reddit_object: dict,`
Bot can run multiple instances at the same time (#1091) * Bot can run multiple instances at the same time * Delete TTS/__pycache__ directory * Delete video_creation/__pycache__ directory * Delete videos.json * Delete utils/__pycache__ directory * Create videos.json * Moved id to utils * Added cleanup in shutdown and fixed bug * Removed watermark todo and fixed it * Delete final_video.py * Update final_video.py * Delete video.py * Update video.py * Delete id.py * feat: meaningful error message for bad credentials * chore: remove comment reference to .env Co-authored-by: Callum Leslie <git@cleslie.uk> 2 years ago			`path: str = "assets/temp/",`
formatting 2 years ago			`max_length: int = DEFAULT_MAX_LENGTH,`
			`last_clip_length: int = 0,`
Reduced code duplication in TTS engines 2 years ago			`):`
			`self.tts_module = tts_module()`
			`self.reddit_object = reddit_object`
Added the stroy mode with two method and add min comment lenght 2 years ago
Bot can run multiple instances at the same time (#1091) * Bot can run multiple instances at the same time * Delete TTS/__pycache__ directory * Delete video_creation/__pycache__ directory * Delete videos.json * Delete utils/__pycache__ directory * Create videos.json * Moved id to utils * Added cleanup in shutdown and fixed bug * Removed watermark todo and fixed it * Delete final_video.py * Update final_video.py * Delete video.py * Update video.py * Delete id.py * feat: meaningful error message for bad credentials * chore: remove comment reference to .env Co-authored-by: Callum Leslie <git@cleslie.uk> 2 years ago			`self.redditid = re.sub(r"[^\w\s-]", "", reddit_object["thread_id"])`
			`self.path = path + self.redditid + "/mp3"`
Reduced code duplication in TTS engines 2 years ago			`self.max_length = max_length`
			`self.length = 0`
formatting 2 years ago			`self.last_clip_length = last_clip_length`
Reduced code duplication in TTS engines 2 years ago
			`def run(self) -> Tuple[int, int]:`

Added the stroy mode with two method and add min comment lenght 2 years ago			`Path(self.path).mkdir(parents=True, exist_ok=True)`
Reduced code duplication in TTS engines 2 years ago			`print_step("Saving Text to MP3 files...")`
Added the stroy mode with two method and add min comment lenght 2 years ago
process text before all calls to call_tts Process_text now called before call_tts to ensure it is called minimally while allowing for verification that text is not empty 2 years ago			`self.call_tts("title", process_text(self.reddit_object["thread_title"]))`
Added the stroy mode with two method and add min comment lenght 2 years ago			`# processed_text = ##self.reddit_object["thread_post"] != ""`
Reduced code duplication in TTS engines 2 years ago			`idx = None`
Added the stroy mode with two method and add min comment lenght 2 years ago			`if settings.config["settings"]["storymode"] :`
			`if settings.config["settings"]["storymodemethode"] == 0:`
			`if (len(self.reddit_object["thread_post"]) > self.tts_module.max_chars):`
			`self.split_post(self.reddit_object["thread_post"], "postaudio")`
			`else :`
			`self.call_tts("postaudio",process_text(self.reddit_object["thread_post"]) )`
			`elif settings.config["settings"]["storymodemethode"] == 1:`

			`for idx,text in enumerate(self.reddit_object["thread_post"]):`
			`self.call_tts(f"posttext-{idx}",process_text(text) )`

			`else :`

			`for idx, comment in track(enumerate(self.reddit_object["comments"]), "Saving..."):`
			`# ! Stop creating mp3 files if the length is greater than max length.`
			`if self.length > self.max_length and idx > 1:`
			`self.length -= self.last_clip_length`
			`idx -= 1`
			`break`
			`if (`
			`len(comment["comment_body"]) > self.tts_module.max_chars`
			`): # Split the comment if it is too long`
			`self.split_post(comment["comment_body"], idx) # Split the comment`
			`else: # If the comment is not too long, just call the tts engine`
			`self.call_tts(f"{idx}", process_text(comment["comment_body"]))`
Reduced code duplication in TTS engines 2 years ago
			`print_substep("Saved Text to MP3 files successfully.", style="bold green")`
			`return self.length, idx`

Added the stroy mode with two method and add min comment lenght 2 years ago			`def split_post(self, text: str, idx):`
Reduced code duplication in TTS engines 2 years ago			`split_files = []`
			`split_text = [`
			`x.group().strip()`
fix: regex splitter no longer skips newlines 2 years ago			`for x in re.finditer(`
			`r" *(((.\|\n){0," + str(self.tts_module.max_chars) + "})(\.\|.$))", text`
			`)`
Reduced code duplication in TTS engines 2 years ago			`]`
fix: dont use blank text splits 2 years ago			`offset = 0`
Reduced code duplication in TTS engines 2 years ago			`for idy, text_cut in enumerate(split_text):`
Remove debug statements 2 years ago			`# print(f"{idx}-{idy}: {text_cut}\n")`
style: formatted with black 2 years ago			`new_text = process_text(text_cut)`
improved efficiency of empty text check 2 years ago			`if not new_text or new_text.isspace():`
fix: dont use blank text splits 2 years ago			`offset += 1`
background audio implementation 2 years ago			`continue`

improved efficiency of empty text check 2 years ago			`self.call_tts(f"{idx}-{idy - offset}.part", new_text)`
style: formatted with black 2 years ago			`split_files.append(AudioFileClip(f"{self.path}/{idx}-{idy - offset}.part.mp3"))`
fix: dont use blank text splits 2 years ago
Reduced code duplication in TTS engines 2 years ago			`CompositeAudioClip([concatenate_audioclips(split_files)]).write_audiofile(`
			`f"{self.path}/{idx}.mp3", fps=44100, verbose=False, logger=None`
			`)`

fix: close ALL clips when finished 2 years ago			`for i in split_files:`
			`name = i.filename`
			`i.close()`
			`Path(name).unlink()`

			`# for i in range(0, idy + 1):`
style: format with python-black 2 years ago			`# print(f"Cleaning up {self.path}/{idx}-{i}.part.mp3")`
fix: close ALL clips when finished 2 years ago
style: format with python-black 2 years ago			`# Path(f"{self.path}/{idx}-{i}.part.mp3").unlink()`
Reduced code duplication in TTS engines 2 years ago
			`def call_tts(self, filename: str, text: str):`
style: formatted with black 2 years ago			`self.tts_module.run(text, filepath=f"{self.path}/{filename}.mp3")`
fix: mutagen error - moved to moviepy duration 2 years ago			`# try:`
			`# self.length += MP3(f"{self.path}/{filename}.mp3").info.length`
			`# except (MutagenError, HeaderNotFoundError):`
			`# self.length += sox.file_info.duration(f"{self.path}/{filename}.mp3")`
added backup contingency 2 years ago			`try:`
			`clip = AudioFileClip(f"{self.path}/{filename}.mp3")`
prevent last comment being cut offin the middle 2 years ago			`self.last_clip_length = clip.duration`
added backup contingency 2 years ago			`self.length += clip.duration`
			`clip.close()`
			`except:`
			`self.length = 0`
fix: length checker works with new duration code 2 years ago
style: format with python-black 2 years ago
Merge branch 'develop' into feat/better-tts-changer 2 years ago			`def process_text(text: str):`
refactor: tts engines now use toml config 2 years ago			`lang = settings.config["reddit"]["thread"]["post_lang"]`
Merge branch 'develop' into feat/better-tts-changer 2 years ago			`new_text = sanitize_text(text)`
			`if lang:`
			`print_substep("Translating Text...")`
Update engine_wrapper.py Fixed not sanitizing the text issue that occurs if POSTLANG is set 2 years ago			`translated_text = ts.google(text, to_language=lang)`
			`new_text = sanitize_text(translated_text)`
Merge branch 'develop' into feat/better-tts-changer 2 years ago			`return new_text`