RedditVideoMakerBot/TTS/common.py

import base64
from random import choice
from typing import Union, Optional


class BaseApiTTS:
    """
    Base class for API-backed TTS engines

    This class calls ``self.make_request(text)`` but does not define it, so
    subclasses are expected to provide it, along with a value for
    ``max_chars``.
    """
    # maximum number of characters sent to the API in one request (inclusive)
    max_chars: int
    # when True, write_file base64-decodes the response before writing it
    decode_base64: bool = False

    @staticmethod
    def text_len_sanitize(
            text: str,
            max_length: int,
    ) -> list:
        """
        Splits text if it's too long to be a query

        The text is split on dots first, then on commas; the first split whose
        chunks all fit into ``max_length`` is returned. If neither fits, the
        text is cut into slices of ``max_length`` characters.

        Args:
            text: text to be sanitized
            max_length: maximum length of the query

        Returns:
            Split text as a list of non-empty, stripped chunks
            (an empty list when the text holds nothing to say)
        """
        # Split by dot or comma first (else you can lose intonations)
        for separator in ('.', ','):
            # Chunks that are empty after stripping are dropped: they carry no
            # text and used to raise IndexError when their last char was read
            chunks = [
                piece.strip()
                for piece in text.split(separator)
                if piece.strip()
            ]
            # `<=` because run() sends texts of exactly max_chars in one request
            if chunks and all(len(chunk) <= max_length for chunk in chunks):
                return chunks

        # No natural split fits, so fall back to groups of max_length chars
        sliced = []
        for start in range(0, len(text), max_length):
            chunk = text[start:start + max_length].strip()
            # Drop one trailing separator, as the splits above do implicitly
            if chunk.endswith(('.', ',')):
                chunk = chunk[:-1].rstrip()
            if chunk:
                sliced.append(chunk)
        return sliced

    def write_file(
            self,
            output_text: Union[str, bytes],
            filepath: str,
    ) -> None:
        """
        Writes and decodes TTS responses in files

        Args:
            output_text: response to be written; base64 text when
                ``decode_base64`` is set, raw bytes otherwise (the file is
                opened in binary mode)
            filepath: path/name of the file
        """
        decoded_text = base64.b64decode(output_text) if self.decode_base64 else output_text

        with open(filepath, 'wb') as out:
            out.write(decoded_text)

    def _join_responses(
            self,
            responses: list,
    ) -> Union[str, bytes]:
        """
        Merges the responses of several requests into one write_file payload

        Args:
            responses: values returned by make_request, in order

        Returns:
            A single payload of the kind write_file expects
        """
        if not responses:
            # Nothing was requested: hand write_file an empty payload it can write
            return '' if self.decode_base64 else b''
        if len(responses) == 1:
            return responses[0]
        if self.decode_base64:
            # Padded base64 strings cannot simply be concatenated: decoding
            # stops at the first '=' padding and drops every later part.
            # Decode each part on its own and re-encode the joined bytes.
            raw = b''.join(base64.b64decode(response) for response in responses)
            return base64.b64encode(raw).decode('ascii')
        # Join with an empty value of the same type (str or bytes)
        return responses[0][:0].join(responses)

    def run(
            self,
            text: str,
            filepath: str,
    ) -> None:
        """
        Calls for TTS api and writes audio file

        Texts longer than ``max_chars`` are split with text_len_sanitize and
        requested part by part; the responses are merged before writing.

        Args:
            text: text to be voice over
            filepath: path/name of the file
        """
        if len(text) > self.max_chars:
            responses = [
                self.make_request(part)
                for part in self.text_len_sanitize(text, self.max_chars)
                if part
            ]
            output_text = self._join_responses(responses)
        else:
            output_text = self.make_request(text)
        self.write_file(output_text, filepath)


def get_random_voice(
        voices: Union[list, dict],
        key: Optional[str] = None,
) -> str:
    """
    Pick one voice at random

    Args:
        voices: either a list of voices, or a dict whose values are
            collections of voices
        key: which dict entry to pick from; when omitted (or falsy) the
            first value of the dict is used

    Returns:
        the randomly chosen voice
    """
    if not isinstance(voices, list):
        # Dict input: narrow it down to a single collection of voices first
        if key:
            candidates = voices[key]
        else:
            candidates = list(voices.values())[0]
        return choice(candidates)

    return choice(voices)


def audio_length(
        path: str,
) -> Union[float, int]:
    """
    Gets the length of the audio file

    Any error raised while reading the file is written to ``.tts.log`` and
    reported to the caller as a length of 0 instead of being raised.

    Args:
        path: audio file path

    Returns:
        ``audio.info.length`` as reported by mutagen (presumably seconds as a
        float - confirm against mutagen docs), or 0 if the file could not be read
    """
    from mutagen.mp3 import MP3

    try:
        audio = MP3(path)
        return audio.info.length
    except Exception as e:
        import logging

        logger = logging.getLogger('tts_logger')
        logger.setLevel(logging.ERROR)
        # getLogger returns the same logger on every call, so attach the file
        # handler only once; otherwise each failure adds another handler and
        # every message is written (and the file opened) once more
        if not any(isinstance(handler, logging.FileHandler) for handler in logger.handlers):
            logger.addHandler(logging.FileHandler('.tts.log', mode='a+', encoding='utf-8'))
        # Extra arguments are %-merged into the message, so it needs a placeholder
        logger.error('Error occurred in audio_length: %s', e)
        return 0
cherry-picked split text from async-tts-api 2 years ago			`import base64`
			`from random import choice`
			`from typing import Union, Optional`


			`class BaseApiTTS:`
			`max_chars: int`
			`decode_base64: bool = False`

			`@staticmethod`
			`def text_len_sanitize(`
			`text: str,`
			`max_length: int,`
			`) -> list:`
self review: improved typing & logging, removed unused imports, fixes in README 2 years ago			`"""`
			`Splits text if it's too long to be a query`

			`Args:`
			`text: text to be sanitized`
			`max_length: maximum length of the query`

			`Returns:`
			`Split text as a list`
			`"""`
cherry-picked split text from async-tts-api 2 years ago			`# Split by comma or dot (else you can lose intonations), if there is non, split by groups of 299 chars`
fixes in text_len_sanitize 2 years ago			`split_text = ''`

			`split_text = list(`
			`map(lambda x: x.strip() if x.strip()[-1] != '.' else x.strip()[:-1],`
			`filter(lambda x: True if x else False, text.split('.')))`
			`)`
			`if split_text and all([chunk.__len__() < max_length for chunk in split_text]):`
			`return split_text`

			`split_text = list(`
			`map(lambda x: x.strip() if x.strip()[-1] != ',' else x.strip()[:-1],`
			`filter(lambda x: True if x else False, text.split(','))`
			`)`
			`)`
			`if split_text and all([chunk.__len__() < max_length for chunk in split_text]):`
			`return split_text`

			`return list(`
			`map(`
			`lambda x: x.strip() if x.strip()[-1] != '.' or x.strip()[-1] != ',' else x.strip()[:-1],`
			`filter(`
			`lambda x: True if x else False,`
			`[text[i:i + max_length] for i in range(0, len(text), max_length)]`
			`)`
			`)`
			`)`
cherry-picked split text from async-tts-api 2 years ago
			`def write_file(`
			`self,`
			`output_text: str,`
			`filepath: str,`
			`) -> None:`
self review: improved typing & logging, removed unused imports, fixes in README 2 years ago			`"""`
			`Writes and decodes TTS responses in files`

			`Args:`
			`output_text: text to be written`
			`filepath: path/name of the file`
			`"""`
cherry-picked split text from async-tts-api 2 years ago			`decoded_text = base64.b64decode(output_text) if self.decode_base64 else output_text`

			`with open(filepath, 'wb') as out:`
			`out.write(decoded_text)`

			`def run(`
			`self,`
			`text: str,`
			`filepath: str,`
			`) -> None:`
self review: improved typing & logging, removed unused imports, fixes in README 2 years ago			`"""`
			`Calls for TTS api and writes audio file`

			`Args:`
			`text: text to be voice over`
			`filepath: path/name of the file`

			`Returns:`

			`"""`
cherry-picked split text from async-tts-api 2 years ago			`output_text = ''`
			`if len(text) > self.max_chars:`
			`for part in self.text_len_sanitize(text, self.max_chars):`
			`if part:`
			`output_text += self.make_request(part)`
			`else:`
			`output_text = self.make_request(text)`
			`self.write_file(output_text, filepath)`


			`def get_random_voice(`
			`voices: Union[list, dict],`
			`key: Optional[str] = None,`
			`) -> str:`
self review: improved typing & logging, removed unused imports, fixes in README 2 years ago			`"""`
			`Return random voice from list or dict`

			`Args:`
			`voices: list or dict of voices`
			`key: key of a dict if you are using one`

			`Returns:`
			`random voice as a str`
			`"""`
cherry-picked split text from async-tts-api 2 years ago			`if isinstance(voices, list):`
			`return choice(voices)`
			`else:`
self review: improved typing & logging, removed unused imports, fixes in README 2 years ago			`return choice(voices[key] if key else list(voices.values())[0])`
cherry-picked split text from async-tts-api 2 years ago

added fixes 2 years ago			`def audio_length(`
			`path: str,`
more fixes 2 years ago			`) -> Union[float, int]:`
self review: improved typing & logging, removed unused imports, fixes in README 2 years ago			`"""`
			`Gets the length of the audio file`

			`Args:`
			`path: audio file path`

			`Returns:`
			`length in seconds as an int`
			`"""`
added fixes 2 years ago			`from mutagen.mp3 import MP3`

			`try:`
			`audio = MP3(path)`
			`return audio.info.length`
self review: improved typing & logging, removed unused imports, fixes in README 2 years ago			`except Exception as e:`
			`import logging`

more fixes 2 years ago			`logger = logging.getLogger('tts_logger')`
			`logger.setLevel(logging.ERROR)`
			`handler = logging.FileHandler('.tts.log', mode='a+', encoding='utf-8')`
self review: improved typing & logging, removed unused imports, fixes in README 2 years ago			`logger.addHandler(handler)`
			`logger.error('Error occurred in audio_length:', e)`
added fixes 2 years ago			`return 0`