|
|
|
@ -55,9 +55,20 @@ class TTSEngine:
|
|
|
|
|
self,
|
|
|
|
|
): # adds periods to the end of paragraphs (where people often forget to put them) so tts doesn't blend sentences
|
|
|
|
|
for comment in self.reddit_object["comments"]:
|
|
|
|
|
# remove links
|
|
|
|
|
regex_urls = r"((http|https)\:\/\/)?[a-zA-Z0-9\.\/\?\:@\-_=#]+\.([a-zA-Z]){2,6}([a-zA-Z0-9\.\&\/\?\:@\-_=#])*"
|
|
|
|
|
comment["comment_body"] = re.sub(regex_urls, " ", comment["comment_body"])
|
|
|
|
|
comment["comment_body"] = comment["comment_body"].replace("\n", ". ")
|
|
|
|
|
comment["comment_body"] = re.sub(r'\bAI\b', 'A.I', comment["comment_body"])
|
|
|
|
|
comment["comment_body"] = re.sub(r'\bAGI\b', 'A.G.I', comment["comment_body"])
|
|
|
|
|
if comment["comment_body"][-1] != ".":
|
|
|
|
|
comment["comment_body"] += "."
|
|
|
|
|
comment["comment_body"] = comment["comment_body"].replace(". . .", ".")
|
|
|
|
|
comment["comment_body"] = comment["comment_body"].replace(".. . ", ".")
|
|
|
|
|
comment["comment_body"] = comment["comment_body"].replace(". . ", ".")
|
|
|
|
|
comment["comment_body"] = re.sub(r'\."\.', '".', comment["comment_body"])
|
|
|
|
|
print(comment["comment_body"])
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def run(self) -> Tuple[int, int]:
|
|
|
|
|
Path(self.path).mkdir(parents=True, exist_ok=True)
|
|
|
|
|