works for me now after a lot of fixes, also working on removing old way of subtitles

1 year ago · b0d6d6e363
parent a4e5ad812e
commit b0d6d6e363
9 changed files with 69 additions and 136 deletions
--- a/TTS/engine_wrapper.py
+++ b/TTS/engine_wrapper.py
@ -72,8 +72,6 @@ class TTSEngine:
            comment["comment_body"] = re.sub(r'\."\.', '".', comment["comment_body"])
    def run(self) -> Tuple[int, int]:
        from utils.imagenarator import comment_image_maker
        Path(self.path).mkdir(parents=True, exist_ok=True)
        print_step("Saving Text to MP3 files...")
@ -94,7 +92,6 @@ class TTSEngine:
        else:
            comments = []
            os.makedirs("assets/temp/" + self.redditid + "/png", exist_ok=True)
            for idx, comment in track(enumerate(self.reddit_object["comments"]), "Saving..."):
                # TODO: Maybe move this somewhere better?
                comments.append(comment["comment_body"])
@ -111,10 +108,6 @@ class TTSEngine:
                else:  # If the comment is not too long, just call the tts engine
                    self.call_tts(f"{idx}", process_text(comment["comment_body"]))
            # TODO: Maybe move this somewhere better?
            if not settings.config["settings"]["use_capcut"]:
                comment_image_maker((0, 0, 0, 0), self.reddit_object, comments, (255, 255, 255), transparent=True)
        print_substep("Saved Text to MP3 files successfully.", style="bold green")
        return self.length, idx
--- a/main.py
+++ b/main.py
@ -28,7 +28,7 @@ from video_creation.screenshot_downloader import get_screenshots_of_reddit_posts
 from video_creation.voices import save_text_to_mp3
 from video_creation.memes import make_meme_video
-__VERSION__ = "3.2.1"
+__VERSION__ = "3.2.2"
 print(
    """
--- a/utils/.config.template.toml
+++ b/utils/.config.template.toml
@ -203,7 +203,6 @@ resolution_w = { optional = false, default = 1080, example = 1440, explantation
 resolution_h = { optional = false, default = 1920, example = 2560, explantation = "Sets the height in pixels of the final video" }
 zoom = { optional = true, default = 1, example = 1.1, explanation = "Sets the browser zoom level. Useful if you want the text larger.", type = "float", nmin = 0.1, nmax = 2, oob_error = "The text is really difficult to read at a zoom level higher than 2" }
 channel_name = { optional = true, default = "Reddit Tales", example = "Reddit Stories", explanation = "Sets the username that appaers in the fancy title screen" }
 words_on_screen = { optional = true, default = 10, example = 1, type = "int", explanation = "Sets how many words should be shown on screen" }
 [settings.background]
 background_video = { optional = true, default = "minecraft", example = "rocket-league", options = [
--- a/utils/capcut.py
+++ b/utils/capcut.py
@ -36,6 +36,7 @@ def generate_captions(file_path, title):
        page.click("//span[contains(text(),'OK')]")
        print("Logging in")
        page.goto("https://www.capcut.com/login")
        page.fill("//input[@class='lv-input lv-input-size-default lv_sign_in_panel_wide-input']", email)
@ -65,6 +66,7 @@ def generate_captions(file_path, title):
        if page.is_visible("//div[@class='guide-modal-close-icon']"):
            page.click("//div[@class='guide-modal-close-icon']")
        print("Trying to remove old video")
        if page.is_visible("//div[@data-selectable-item-id]"):
            page.hover("//div[@data-selectable-item-id]")
@ -85,6 +87,7 @@ def generate_captions(file_path, title):
        page.goto("https://www.capcut.com/editor?enter_from=create_new&current_page=landing_page&from_page=work_space&start_tab=video&__action_from=my_draft&position=my_draft&scenario=youtube_ads&scale=9%3A16")
        print("Uploading video")
        if page.is_visible("//div[@class='guide-close-icon-f8J9FZ']//*[name()='svg']"):
            page.click("//div[@class='guide-close-icon-f8J9FZ']//*[name()='svg']")
@ -106,11 +109,18 @@ def generate_captions(file_path, title):
        if page.is_visible("//div[@class='guide-close-icon-OwPlMC']"):
            page.click("//div[@class='guide-close-icon-OwPlMC']")
        while True:
            try:
                page.click("div[class^='guide-close-icon-']", timeout=1000)
            except:
                break
        page.set_input_files("(//input[@type='file'])[1]", file_path)
        time.sleep(2)
-        page.click("//div[@class='tools-dCzTyg']")
+        page.click("//div[@class='tools-97tWCU']")
        page.click("(//li[@role='option'])[5]")
        time.sleep(18)
@ -143,7 +153,7 @@ def generate_captions(file_path, title):
        time.sleep(1)
-        page.click(f"(//img[@class='image-QII91y'])[{str(settings.config['capcut']['preset_number'])}]")
+        page.click(f"(//img[@class='image-E7GTkW'])[{str(settings.config['capcut']['preset_number'])}]")
        time.sleep(2)
--- a/utils/imagenarator.py
+++ b/utils/imagenarator.py
@ -7,7 +7,6 @@ from rich.progress import track
 from TTS.engine_wrapper import process_text
 from utils.console import print_step, print_substep
 from utils.process_post import split_text
 def draw_multiple_line_text(
@ -64,7 +63,7 @@ def imagemaker(theme, reddit_obj: dict, txtclr, padding=5, transparent=False) ->
    texts = reddit_obj["thread_post"]
    id = re.sub(r"[^\w\s-]", "", reddit_obj["thread_id"])
-    texts = split_text(" ".join(texts))
+    #texts = split_text(" ".join(texts))
    if transparent:
        font = ImageFont.truetype(os.path.join("fonts", "Roboto-Bold.ttf"), 100)
@ -77,29 +76,3 @@ def imagemaker(theme, reddit_obj: dict, txtclr, padding=5, transparent=False) ->
        text = process_text(text, False)
        draw_multiple_line_text(image, text, font, txtclr, padding, wrap=30, transparent=transparent)
        image.save(f"assets/temp/{id}/png/img{idx}.png")
 def comment_image_maker(theme, reddit_obj: dict, comments, txtclr, padding=5, transparent=False) -> None:
    """
    Render Images for video
    """
    id = re.sub(r"[^\w\s-]", "", reddit_obj["thread_id"])
    if transparent:
        font = ImageFont.truetype(os.path.join("fonts", "Roboto-Bold.ttf"), 100)
    else:
        font = ImageFont.truetype(os.path.join("fonts", "Roboto-Regular.ttf"), 100)
    size = (1920, 1080)
    print_step("Rendering Images")
    i = 0
    for comment in comments:
        texts = split_text(comment)
        for text in texts:
            image = Image.new("RGBA", size, theme)
            text = process_text(text, False)
            draw_multiple_line_text(image, text, font, txtclr, padding, wrap=30, transparent=transparent)
            print_substep("Made image: " + str(i))
            image.save(f"assets/temp/{id}/png/comment_{i}.png")
            i+=1
--- a/utils/process_post.py
+++ b/utils/process_post.py
@ -1,16 +0,0 @@
 import re
 from typing import List
 from utils import settings
 # working good
 def split_text(obj) -> List[str]:
    text: str = re.sub("\n", " ", obj)
    words_on_screen = settings.config["settings"]["words_on_screen"]
    words = text.split()
    grouped_words = [' '.join(words[i: i + words_on_screen]) for i in range(0, len(words), words_on_screen)]
    return grouped_words
--- a/utils/thumbnail.py
+++ b/utils/thumbnail.py
@ -1,4 +1,9 @@
-from PIL import ImageDraw, ImageFont
+import textwrap
 import os
 from PIL import ImageDraw, ImageFont, Image
 from utils import settings
 from utils.console import print_step, print_substep
 def create_thumbnail(thumbnail, font_family, font_size, font_color, width, height, title):
@ -33,3 +38,38 @@ def create_thumbnail(thumbnail, font_family, font_size, font_color, width, heigh
        draw.text((MarginXaxis, MarginYaxis + (LineHeight * i)), arrayTitle[i], rgb, font=font)
    return thumbnail
 def create_fancy_thumbnail(image, text, text_color, padding, wrap=35):
    print_step(f"Creating fancy thumbnail for: {text}")
    font_title_size = 47
    font = ImageFont.truetype(os.path.join("fonts", "Roboto-Bold.ttf"), font_title_size)
    image_width, image_height = image.size
    lines = textwrap.wrap(text, width=wrap)
    y = (image_height / 2) - (((font.getsize(text)[1] + (len(lines) * padding) / len(lines)) * len(lines)) / 2) + 30
    draw = ImageDraw.Draw(image)
    username_font = ImageFont.truetype(os.path.join("fonts", "Roboto-Bold.ttf"), 30)
    draw.text((205, 825), settings.config["settings"]["channel_name"], font=username_font, fill=text_color, align="left")
    if len(lines) == 3:
        lines = textwrap.wrap(text, width=wrap+10)
        font_title_size = 40
        font = ImageFont.truetype(os.path.join("fonts", "Roboto-Bold.ttf"), font_title_size)
        y = (image_height / 2) - (((font.getsize(text)[1] + (len(lines) * padding) / len(lines)) * len(lines)) / 2) + 35
    elif len(lines) == 4:
        lines = textwrap.wrap(text, width=wrap+10)
        font_title_size = 35
        font = ImageFont.truetype(os.path.join("fonts", "Roboto-Bold.ttf"), font_title_size)
        y = (image_height / 2) - (((font.getsize(text)[1] + (len(lines) * padding) / len(lines)) * len(lines)) / 2) + 40
    elif len(lines) > 4:
        lines = textwrap.wrap(text, width=wrap+10)
        font_title_size = 30
        font = ImageFont.truetype(os.path.join("fonts", "Roboto-Bold.ttf"), font_title_size)
        y = (image_height / 2) - (((font.getsize(text)[1] + (len(lines) * padding) / len(lines)) * len(lines)) / 2) + 30
    for line in lines:
        _, line_height = font.getsize(line)
        draw.text((120, y), line, font=font, fill=text_color, align="left")
        y += line_height + padding
    return image
--- a/video_creation/final_video.py
+++ b/video_creation/final_video.py
@ -17,11 +17,11 @@ from rich.progress import track
 from utils import settings
 from utils import capcut
 from utils import thumbnail
 from utils.cleanup import cleanup
 from utils.console import print_step, print_substep
-from utils.thumbnail import create_thumbnail
+from utils.thumbnail import create_thumbnail, create_fancy_thumbnail
 from utils.videos import save_data
 from utils.process_post import split_text
 from pathlib import Path
@ -111,43 +111,6 @@ def prepare_background(reddit_id: str, W: int, H: int) -> str:
        exit(1)
    return output_path
 # The following function is based on code under: Copyright 2024 beingbored (aka. Tim), MIT License, permission granted to use, copy, modify, and distribute.
 def create_fancy_thumbnail(image, text, text_color, padding, wrap=35):
    print_step(f"Creating fancy thumbnail for: {text}")
    font_title_size = 47
    font = ImageFont.truetype(os.path.join("fonts", "Roboto-Bold.ttf"), font_title_size)
    image_width, image_height = image.size
    lines = textwrap.wrap(text, width=wrap)
    y = (image_height / 2) - (((font.getsize(text)[1] + (len(lines) * padding) / len(lines)) * len(lines)) / 2) + 30
    draw = ImageDraw.Draw(image)
    username_font = ImageFont.truetype(os.path.join("fonts", "Roboto-Bold.ttf"), 30)
    draw.text((205, 825), settings.config["settings"]["channel_name"], font=username_font, fill=text_color, align="left")
    if len(lines) == 3:
        lines = textwrap.wrap(text, width=wrap+10)
        font_title_size = 40
        font = ImageFont.truetype(os.path.join("fonts", "Roboto-Bold.ttf"), font_title_size)
        y = (image_height / 2) - (((font.getsize(text)[1] + (len(lines) * padding) / len(lines)) * len(lines)) / 2) + 35
    elif len(lines) == 4:
        lines = textwrap.wrap(text, width=wrap+10)
        font_title_size = 35
        font = ImageFont.truetype(os.path.join("fonts", "Roboto-Bold.ttf"), font_title_size)
        y = (image_height / 2) - (((font.getsize(text)[1] + (len(lines) * padding) / len(lines)) * len(lines)) / 2) + 40
    elif len(lines) > 4:
        lines = textwrap.wrap(text, width=wrap+10)
        font_title_size = 30
        font = ImageFont.truetype(os.path.join("fonts", "Roboto-Bold.ttf"), font_title_size)
        y = (image_height / 2) - (((font.getsize(text)[1] + (len(lines) * padding) / len(lines)) * len(lines)) / 2) + 30
    for line in lines:
        _, line_height = font.getsize(line)
        draw.text((120, y), line, font=font, fill=text_color, align="left")
        y += line_height + padding
    return image
 def merge_background_audio(audio: ffmpeg, reddit_id: str):
    """Gather an audio and merge with assets/backgrounds/background.mp3
    Args:
@ -246,8 +209,6 @@ def make_final_video(
    if not settings.config["settings"]["mememode"]:
        Path(f"assets/temp/{reddit_id}/png").mkdir(parents=True, exist_ok=True)
        # Copyright 2024 beingbored (aka. Tim), MIT License, permission granted to use, copy, modify, and distribute.
        # get the title_template image and draw a text in the middle part of it with the title of the thread
        title_template = Image.open("assets/title_template.png")
        title = reddit_obj["thread_title"]
@ -265,8 +226,6 @@ def make_final_video(
        title_img.save(f"assets/temp/{reddit_id}/png/title.png")
        # Copyright end
    image_clips.insert(
        0,
        ffmpeg.input(f"assets/temp/{reddit_id}/png/title.png")["v"].filter(
@ -307,27 +266,19 @@ def make_final_video(
                ffmpeg.probe(f"assets/temp/{reddit_id}/mp3/title.mp3")["format"]["duration"]
            )
-            text = " ".join(reddit_obj["thread_post"])
+            time_for_clip = float(ffmpeg.probe(f"assets/temp/{reddit_id}/mp3/title.mp3")["format"]["duration"])
-            number_of_clips_splitted = len(split_text(text))
+            image_clips.append(
-
+                ffmpeg.input(f"assets/temp/{reddit_id}/png/img{0}.png")["v"].filter(
-            # TODO:  Fix that it sometimes goes out of sync
+                    "scale", screenshot_width, -1
            for i in track(range(0, number_of_clips_splitted + 1), "Collecting the image files..."):
                time_for_clip = total_audio_duration/(number_of_clips_splitted+1)
                if i == 0:
                    time_for_clip = float(ffmpeg.probe(f"assets/temp/{reddit_id}/mp3/title.mp3")["format"]["duration"])
                image_clips.append(
                    ffmpeg.input(f"assets/temp/{reddit_id}/png/img{i}.png")["v"].filter(
                        "scale", screenshot_width, -1
                    )
                )
            )
-                background_clip = background_clip.overlay(
+            background_clip = background_clip.overlay(
-                    image_clips[i],
+                image_clips[0],
-                    enable=f"between(t,{current_time},{current_time + time_for_clip})",
+                enable=f"between(t,{current_time},{current_time + time_for_clip})",
-                    x="(main_w-overlay_w)/2",
+                x="(main_w-overlay_w)/2",
-                    y="(main_h-overlay_h)/2",
+                y="(main_h-overlay_h)/2",
-                )
+            )
                current_time += time_for_clip
    else:
        total_audio_duration = float(
            ffmpeg.probe(f"assets/temp/{reddit_id}/audio.mp3")["format"]["duration"]
@ -343,13 +294,6 @@ def make_final_video(
            )
        for i in range(0, num_files):
            time_for_clip = total_audio_duration/(num_files)
            image_clips.append(
                ffmpeg.input(f"assets/temp/{reddit_id}/png/comment_{i}.png")["v"].filter(
                    "scale", screenshot_width, -1
                )
            )
            if i == 0:
                time_for_clip = float(ffmpeg.probe(f"assets/temp/{reddit_id}/mp3/title.mp3")["format"]["duration"])
--- a/video_creation/screenshot_downloader.py
+++ b/video_creation/screenshot_downloader.py
@ -11,7 +11,6 @@ from rich.progress import track
 from utils import settings
 from utils.console import print_step, print_substep
 from utils.imagenarator import imagemaker
 from utils.playwright import clear_cookie_by_name
 from utils.videos import save_data
@ -61,15 +60,6 @@ def get_screenshots_of_reddit_posts(reddit_object: dict, screenshot_num: int):
        bgcolor = (255, 255, 255, 255)
        txtcolor = (0, 0, 0)
        transparent = False
    if storymode and settings.config["settings"]["storymodemethod"] == 1:
        # for idx,item in enumerate(reddit_object["thread_post"]):
        print_substep("Generating images...")
        return imagemaker(
            theme=bgcolor,
            reddit_obj=reddit_object,
            txtclr=txtcolor,
            transparent=transparent,
        )
    if settings.config["settings"]["storymodemethod"] == 1:
        return