# generators/thumbnail.py

import random
import os

from PIL import Image
from PIL import Image, ImageDraw, ImageFont

from utils.openaicaller import openai
from utils.misc import open_explorer_here
'''
The purpose of this file is to generate a miniature (thumbnail) of the video.
It has a function that takes a path, title, and description and generates a miniature.
It uses pillow to generate the image, and openai to generate text1 and text2.

text 1 is a short text max 2 words to put on the top of the image.
text 2 is a 3 word text to put in the middle of the image.

The function returns the path of the image.

First open bcg.png. Then create a new image and add a random gradient to it from top to bottom.
then put the png on top of the gradient.
Then add text1 and text2 to the image.
'''

# Prompt template sent to the chat model by generate_thumbnail().
# The placeholders [TITLE] and [DESCRIPTION] are substituted with str.replace
# before the request is made. The reply is parsed line by line: the first
# line is used as text1 and the second line as text2.
prompt = '''Generate 2 short textes OF MAX 2-4 WORDS each to put on the top of the miniature of the video. Here are some examples:
For the title "Python Exception Handling" the text1 could be "No more crashes!" and the text2 could be "Easy!"
The second text is often shorter than the first one.
Answer without anything else, just with the 2 textes. Answer with text1 on the first line and text2 on the second line. Nothing else.
Here is the title of the video: [TITLE]
Here is the description of the video: [DESCRIPTION]'''


async def rand_gradient(image):
    """Fill *image* in place with a random colour gradient.

    Three random divisors in ``1..20`` are drawn (one per RGB channel). The
    pixel at ``(x, y)`` is set to ``(x // div_r, y // div_g, x // div_b)``,
    with every channel clamped to 255 so the values written and returned are
    always valid 8-bit channel values.

    The function is declared ``async`` so callers ``await`` it, but it
    contains no ``await`` itself and therefore runs synchronously.

    Args:
        image: Object exposing ``size`` as ``(width, height)`` and a
            ``putpixel((x, y), (r, g, b))`` method (e.g. a Pillow image).

    Returns:
        A tuple ``(image, textcolor1, textcolor2)`` where ``image`` is the
        same object that was passed in, ``textcolor1`` is the ``[r, g, b]``
        gradient colour at ``(width // 5, height // 5)`` and ``textcolor2``
        the colour at ``(width // 5, height // 2)``. Both colours are
        ``[0, 0, 0]`` when the image has no pixels.
    """
    rng = random.SystemRandom()
    div_r = rng.randint(1, 20)
    div_g = rng.randint(1, 20)
    div_b = rng.randint(1, 20)
    width, height = image.size

    def color_at(x, y):
        # Clamp: x // 1 can reach width - 1, far above the 8-bit maximum.
        return [min(255, x // div_r), min(255, y // div_g), min(255, x // div_b)]

    textcolor1 = [0, 0, 0]
    textcolor2 = [0, 0, 0]
    if width > 0 and height > 0:
        # The sample points always lie inside a non-empty image, so they can
        # be computed directly instead of being searched for in the pixel loop.
        textcolor1 = color_at(width // 5, height // 5)
        textcolor2 = color_at(width // 5, height // 2)

    for x in range(width):
        # Red and blue depend only on the column; compute them once per column.
        red = min(255, x // div_r)
        blue = min(255, x // div_b)
        for y in range(height):
            image.putpixel((x, y), (red, min(255, y // div_g), blue))
    return image, textcolor1, textcolor2

async def generate_thumbnail(path, title, description):
    """Ask the chat model for two short captions and render the thumbnail.

    The module-level ``prompt`` template is filled with *title* and
    *description*, sent to ``openai.generate_response`` and the reply is
    split into lines: the first non-empty line becomes ``text1`` and the
    second non-empty line becomes ``text2``. A missing line falls back to an
    empty string instead of raising ``IndexError``.

    Args:
        path: Directory in which ``generate_image`` saves ``thumbnail.jpg``.
        title: Video title substituted for ``[TITLE]`` in the prompt.
        description: Video description substituted for ``[DESCRIPTION]``.

    Returns:
        The value returned by ``generate_image`` (the absolute path of the
        saved thumbnail).
    """
    prmpt = prompt.replace("[TITLE]", title).replace("[DESCRIPTION]", description)
    response = await openai.generate_response(
        model="gpt-4",
        messages=[
            {"role": "user", "content": prmpt},
        ],
    )
    content = response['choices'][0]['message']['content']  # type: ignore
    # Ignore blank lines and surrounding whitespace: the model sometimes
    # separates the two texts with an empty line or answers on a single line.
    lines = [line.strip() for line in content.splitlines() if line.strip()]
    text1 = lines[0] if lines else ""
    text2 = lines[1] if len(lines) > 1 else ""
    return await generate_image(path, text1, text2)

def _wrap_words(text, max_chars=7):
    """Greedily wrap *text* on spaces, aiming for *max_chars* per line.

    A word starts a new line when the current line (which already carries one
    trailing space per word) plus the word would exceed *max_chars*. Words
    longer than *max_chars* are never split. Every word is followed by a
    space, so the result has trailing spaces; callers strip it afterwards.
    """
    wrapped = ""
    for word in text.split(" "):
        if len(wrapped.split("\n")[-1]) + len(word) > max_chars:
            wrapped += "\n"
        wrapped += word + " "
    return wrapped


def _font_size_for(longest_line, max_chars=7, base_size=200, step=10, min_size=10):
    """Return the font size for a text whose longest line has *longest_line* chars.

    The size shrinks by *step* for every character beyond *max_chars* and is
    floored at *min_size* so it can never reach zero or go negative.
    """
    overflow = max(0, longest_line - max_chars)
    return max(min_size, base_size - overflow * step)


def _inverted_color(color):
    """Return the RGB complement of *color* with each channel clamped to 0-255."""
    return tuple(max(0, min(255, 255 - channel)) for channel in color)


async def generate_image(path, text1, text2):
    """Compose the thumbnail and save it as ``thumbnail.jpg`` inside *path*.

    Steps:
      1. Locate ``bcg.png`` in ``os.path.dirname(os.path.dirname(path))``. If
         it is missing the user is prompted on the console (blocking
         ``input`` calls) and a file explorer is opened on that folder.
      2. Create a 1920x1080 canvas filled by ``rand_gradient``.
      3. Wrap, upper-case and draw *text1* and *text2* on separate transparent
         layers, rotated by -5 and +5 degrees, coloured with the complement
         of the gradient colour sampled by ``rand_gradient``.
      4. Paste ``bcg.png`` (resized to the canvas) and both text layers onto
         the gradient and save as JPEG, lowering the quality until the file
         is smaller than 2,000,000 bytes.

    Args:
        path: Directory that receives ``thumbnail.jpg``.
        text1: Caption drawn near the top of the image.
        text2: Caption drawn near the middle of the image.

    Returns:
        Absolute path of the saved ``thumbnail.jpg``.

    Raises:
        FileNotFoundError: If ``bcg.png`` is still missing after the user was
            asked to provide it.
    """
    path_to_bcg = os.path.dirname(os.path.dirname(path))
    print(path_to_bcg)
    bcg_file = os.path.join(path_to_bcg, "bcg.png")
    if not os.path.exists(bcg_file):
        input("bcg.png not found. Please put bcg.png in the folder that will open. Press enter to open the folder.")
        open_explorer_here(path_to_bcg)
        input("Press enter when you have put bcg.png in the folder.")
        if not os.path.exists(bcg_file):
            input("bcg.png still not found. Exiting.")
            raise FileNotFoundError("bcg.png not found")

    # Load, convert and resize inside a context manager so the underlying
    # file handle is released as soon as the pixel data has been copied.
    # Converting to RGBA also gives non-RGBA PNGs an alpha band, which is
    # needed because the image is used as its own paste mask below.
    with Image.open(bcg_file) as bcg_source:
        bcg = bcg_source.convert('RGBA').resize((1920, 1080))

    img = Image.new('RGBA', (1920, 1080))
    img, textcolor1, textcolor2 = await rand_gradient(img)

    # Target is 7 characters per line; words longer than that are kept whole,
    # and several short words share a line when they fit.
    text1def = _wrap_words(text1)
    text2def = _wrap_words(text2)

    # Line lengths are measured before stripping, i.e. including the trailing
    # space that follows every word. Longer lines get a smaller font.
    maxlen1 = max(len(line) for line in text1def.split("\n"))
    maxlen2 = max(len(line) for line in text2def.split("\n"))
    font1 = ImageFont.truetype("./Sigmar-Regular.ttf", _font_size_for(maxlen1))
    font2 = ImageFont.truetype("./Sigmar-Regular.ttf", _font_size_for(maxlen2))

    text1def = text1def.upper().strip()
    text2def = text2def.upper().strip()

    # Use the complement of the gradient colour under each text.
    fill1 = _inverted_color(textcolor1)
    fill2 = _inverted_color(textcolor2)

    # Each text is drawn on its own transparent layer so it can be rotated
    # independently before being composited onto the canvas.
    imgtext1 = Image.new('RGBA', (1920, 1080))
    imgtext2 = Image.new('RGBA', (1920, 1080))
    drawtext1 = ImageDraw.Draw(imgtext1)
    drawtext1.text((imgtext1.size[0]//8*2, 0), text1def, font=font1, fill=fill1)
    imgtext1 = imgtext1.rotate(-5, expand=True)
    drawtext2 = ImageDraw.Draw(imgtext2)
    drawtext2.text((imgtext2.size[0]//8*2.5, imgtext2.size[1]//5*2), text2def, font=font2, fill=fill2)
    imgtext2 = imgtext2.rotate(5, expand=True)

    # Composite: background picture first, then the two text layers, each
    # using its own alpha channel as the paste mask.
    img.paste(bcg, (0, 0), bcg)
    img.paste(imgtext1, (0, 0-img.size[1]//8), imgtext1)
    if len(text1def.split("\n")) > 2:
        # text1 occupies three or more lines: push text2 further down.
        img.paste(imgtext2, (0, img.size[1]//8), imgtext2)
    else:
        img.paste(imgtext2, (0, 0), imgtext2)

    # JPEG has no alpha channel.
    img = img.convert('RGB')
    img_path = os.path.abspath(os.path.join(path, "thumbnail.jpg"))
    # Re-save with decreasing quality until the file is below 2,000,000 bytes
    # (presumably an upload size limit - confirm against the uploader).
    for quality in range(100, 0, -1):
        img.save(img_path, quality=quality)
        if os.path.getsize(img_path) < 2000000:
            break
    return img_path
I mean its the biggest commit I ever did (did git add * cause I didn't want to explain all of this It's already so complicated) 2023-06-25 16:12:23 +02:00			`import random`
Initial commit 2023-05-15 10:11:04 +02:00			`import os`

			`from PIL import Image`
I mean its the biggest commit I ever did (did git add * cause I didn't want to explain all of this It's already so complicated) 2023-06-25 16:12:23 +02:00			`from PIL import Image, ImageDraw, ImageFont`
Initial commit 2023-05-15 10:11:04 +02:00
I mean its the biggest commit I ever did (did git add * cause I didn't want to explain all of this It's already so complicated) 2023-06-25 16:12:23 +02:00			`from utils.openaicaller import openai`
refactor(video.py): remove unnecessary print statement refactor(montage.py): use os.path.join instead of string concatenation refactor(thumbnail.py): use os.path.join instead of string concatenation refactor(uploader.py): use os.path.join instead of string concatenation refactor(uploader.py): add support for client_secret.json file with different names in credentials folder docs(readme.md): update instructions for openai and unsplash keys docs(readme.md): update instructions for google oauth client id json files docs(readme.md): add information about channel.yaml file in each channel's folder 2023-06-25 17:40:01 +02:00			`from utils.misc import open_explorer_here`
Initial commit 2023-05-15 10:11:04 +02:00			`'''`
			`Putpose of this file is to generate a miniature of the video.`
			`It has a function that takes a path, title, and description and generates a miniature.`
			`It uses pillow to generate the image, and openai to generate text1 and text2.`

			`text 1 is a short text max 2 words to put on the top of the image.`
			`text 2 is a 3 word text to put in the middle of the image.`

			`The function returns the path of the image.`

			`First open bcg.png. Then create a new image and add a random gradient to it from top to bottom.`
			`then put the png on top of the gradient.`
			`Then add text1 and text2 to the image.`
			`'''`

			`prompt = '''Generate 2 short textes OF MAX 2-4 WORDS each to put on the top of the miniature of the video. Here are some examples:`
			`For the title "Python Exception Handling" the text1 could be "No more crashes!" and the text2 could be "Easy!"`
			`The second text is often shorter than the first one.`
			`Answer without anything else, just with the 2 textes. Answer with text1 on the first line and text2 on the second line. Nothing else.`
			`Here is the title of the video: [TITLE]`
			`Here is the description of the video: [DESCRIPTION]'''`

feat(audio_prompts): add default audio prompts for narrator feat(audio_prompts): add en_narrator_deep audio prompt for narrator feat(audio_prompts): add en_narrator_light_bg audio prompt for narrator fix(video.py): fix indentation and add prompt for generating thumbnail fix(montage.py): fix indentation and add prompt for generating thumbnail fix(montage.py): fix image download for wikimage slides fix(speak.py): remove unused import statement fix(speak.py): remove unused variable 'fakenames' feat(speak.py): add function 'remove_blank_moments' to remove silent parts from audio file feat(speak.py): add function 'optimize_string_groups' to optimize string groups for audio generation fix(speak.py): fix comment indentation in 'generate_voice' function fix(speak.py): remove unused imports in 'generate_voice' function fix(speak.py): remove unused variable 'reduced_noise' in 'generate_voice' function fix(speak.py): remove unused import statements in 'generate_voice' function fix(speak.py): remove unused import statement for 'logging' module fix(speak.py): remove unused print statements in 'main' function fix(speak.py): remove unused import statement for 'logging' module fix(speak.py): remove unused print statements in 'main' function fix(speak.py): fix(wiki_downloader.py): fix Google search URL to include correct query parameter fix(wiki_downloader.py): reduce sleep time after page load to 1 second fix(wiki_downloader.py): increase sleep time after image click to 5 seconds 2023-07-02 11:17:10 +02:00



I mean its the biggest commit I ever did (did git add * cause I didn't want to explain all of this It's already so complicated) 2023-06-25 16:12:23 +02:00			`async def rand_gradient(image):`
Initial commit 2023-05-15 10:11:04 +02:00			`randr = random.SystemRandom().randint(1, 20)`
			`randg = random.SystemRandom().randint(1, 20)`
			`randb = random.SystemRandom().randint(1, 20)`
I mean its the biggest commit I ever did (did git add * cause I didn't want to explain all of this It's already so complicated) 2023-06-25 16:12:23 +02:00			`textcolor1 = [0, 0, 0]`
			`textcolor2 = [0, 0, 0]`
Initial commit 2023-05-15 10:11:04 +02:00			`for i in range(image.size[0]):`
			`for j in range(image.size[1]):`
			`colors = [i//randr, j//randg, i//randb]`
			`position1 = [image.size[0]//5, image.size[1]//5]`
			`position2 = [image.size[0]//5, image.size[1]//2]`
			`if i == position1[0] and j == position1[1]:`
			`textcolor1 = colors`
			`if i == position2[0] and j == position2[1]:`
			`textcolor2 = colors`
			`image.putpixel((i,j), (colors[0], colors[1], colors[2]))`
			`return image, textcolor1, textcolor2`

I mean its the biggest commit I ever did (did git add * cause I didn't want to explain all of this It's already so complicated) 2023-06-25 16:12:23 +02:00			`async def generate_thumbnail(path, title, description):`
Initial commit 2023-05-15 10:11:04 +02:00			`prmpt = prompt.replace("[TITLE]", title).replace("[DESCRIPTION]", description)`
refactor(video.py): remove unnecessary print statement refactor(montage.py): use os.path.join instead of string concatenation refactor(thumbnail.py): use os.path.join instead of string concatenation refactor(uploader.py): use os.path.join instead of string concatenation refactor(uploader.py): add support for client_secret.json file with different names in credentials folder docs(readme.md): update instructions for openai and unsplash keys docs(readme.md): update instructions for google oauth client id json files docs(readme.md): add information about channel.yaml file in each channel's folder 2023-06-25 17:40:01 +02:00			`response = await openai.generate_response(`
Initial commit 2023-05-15 10:11:04 +02:00			`model="gpt-4",`
			`messages=[`
			`{"role":"user","content":prmpt},`
			`],`
			`)`
I mean its the biggest commit I ever did (did git add * cause I didn't want to explain all of this It's already so complicated) 2023-06-25 16:12:23 +02:00			`text1 = response['choices'][0]['message']['content'].split("\n")[0] # type: ignore`
			`text2 = response['choices'][0]['message']['content'].split("\n")[1] # type: ignore`
			`await generate_image(path, text1, text2)`
Initial commit 2023-05-15 10:11:04 +02:00
I mean its the biggest commit I ever did (did git add * cause I didn't want to explain all of this It's already so complicated) 2023-06-25 16:12:23 +02:00			`async def generate_image(path, text1, text2):`
refactor(video.py): remove unnecessary print statement refactor(montage.py): use os.path.join instead of string concatenation refactor(thumbnail.py): use os.path.join instead of string concatenation refactor(uploader.py): use os.path.join instead of string concatenation refactor(uploader.py): add support for client_secret.json file with different names in credentials folder docs(readme.md): update instructions for openai and unsplash keys docs(readme.md): update instructions for google oauth client id json files docs(readme.md): add information about channel.yaml file in each channel's folder 2023-06-25 17:40:01 +02:00			`# path_to_bcg = path.split("/")[:-1]`
			`# path_to_bcg = "/".join(path_to_bcg)`
			`#use os instead`
			`path_to_bcg = os.path.dirname(os.path.dirname(path))`
Added and fixed a whole bunch of things 2023-05-15 15:35:08 +02:00			`print(path_to_bcg)`
			`if not os.path.exists(f"{path_to_bcg}/bcg.png"):`
refactor(video.py): remove unnecessary print statement refactor(montage.py): use os.path.join instead of string concatenation refactor(thumbnail.py): use os.path.join instead of string concatenation refactor(uploader.py): use os.path.join instead of string concatenation refactor(uploader.py): add support for client_secret.json file with different names in credentials folder docs(readme.md): update instructions for openai and unsplash keys docs(readme.md): update instructions for google oauth client id json files docs(readme.md): add information about channel.yaml file in each channel's folder 2023-06-25 17:40:01 +02:00			`input("bcg.png not found. Please put bcg.png in the folder that will open. Press enter to open the folder.")`
			`open_explorer_here(path_to_bcg)`
			`input("Press enter when you have put bcg.png in the folder.")`
Added and fixed a whole bunch of things 2023-05-15 15:35:08 +02:00			`if not os.path.exists(f"{path_to_bcg}/bcg.png"):`
			`input("bcg.png still not found. Exiting.")`
refactor(video.py): remove unnecessary print statement refactor(montage.py): use os.path.join instead of string concatenation refactor(thumbnail.py): use os.path.join instead of string concatenation refactor(uploader.py): use os.path.join instead of string concatenation refactor(uploader.py): add support for client_secret.json file with different names in credentials folder docs(readme.md): update instructions for openai and unsplash keys docs(readme.md): update instructions for google oauth client id json files docs(readme.md): add information about channel.yaml file in each channel's folder 2023-06-25 17:40:01 +02:00			`raise FileNotFoundError("bcg.png not found")`
Added and fixed a whole bunch of things 2023-05-15 15:35:08 +02:00			`bcg = Image.open(f"{path_to_bcg}/bcg.png")`
Initial commit 2023-05-15 10:11:04 +02:00			`img = Image.new('RGBA', (1920, 1080))`
I mean its the biggest commit I ever did (did git add * cause I didn't want to explain all of this It's already so complicated) 2023-06-25 16:12:23 +02:00			`img, textcolor1, textcolor2 = await rand_gradient(img)`
Initial commit 2023-05-15 10:11:04 +02:00			`draw = ImageDraw.Draw(img)`
			`font1 = ImageFont.truetype("./Sigmar-Regular.ttf", 200)`
			`font2 = ImageFont.truetype("./Sigmar-Regular.ttf", 200)`
			`text1words = text1.split(" ")`
			`text2words = text2.split(" ")`
			`text1def = ""`
			`text2def = ""`
			`#max charachters per line is 7, but if a word is longer than 7 charachters, do not split it. Howerver if 2 or more words can fit on the same line, put them on the same line.`
			`for word in text1words:`
			`if len(text1def.split("\n")[-1]) + len(word) > 7:`
			`text1def += "\n"`
			`text1def += word + " "`
			`for word in text2words:`
			`if len(text2def.split("\n")[-1]) + len(word) > 7:`
			`text2def += "\n"`
			`text2def += word + " "`
			`maxlen1 = max([len(line) for line in text1def.split("\n")])`
			`maxlen2 = max([len(line) for line in text2def.split("\n")])`
			`#if the text is too long, reduce the font size proportionally`
			`if maxlen1 > 7:`
			`font1 = ImageFont.truetype("./Sigmar-Regular.ttf", 200 - (maxlen1 - 7)*10)`
			`if maxlen2 > 7:`
			`font2 = ImageFont.truetype("./Sigmar-Regular.ttf", 200 - (maxlen2 - 7)*10)`
			`text1def = text1def.upper().strip()`
			`text2def = text2def.upper().strip()`
			`textcolor1 = [255 - textcolor1[0], 255 - textcolor1[1], 255 - textcolor1[2]]`
			`textcolor2 = [255 - textcolor2[0], 255 - textcolor2[1], 255 - textcolor2[2]]`
			`imgtext1 = Image.new('RGBA', (1920, 1080))`
			`imgtext2 = Image.new('RGBA', (1920, 1080))`
			`drawtext1 = ImageDraw.Draw(imgtext1)`
			`drawtext1.text((imgtext1.size[0]//8*2, 0), text1def, font=font1, fill=(textcolor1[0], textcolor1[1], textcolor1[2]))`
			`imgtext1 = imgtext1.rotate(-5, expand=True)`
			`drawtext2 = ImageDraw.Draw(imgtext2)`
			`drawtext2.text((imgtext2.size[0]//8*2.5, imgtext2.size[1]//5*2), text2def, font=font2, fill=(textcolor2[0], textcolor2[1], textcolor2[2]))`
			`imgtext2 = imgtext2.rotate(5, expand=True)`
			`#paste the textes on the image`
feat(audio_prompts): add default audio prompts for narrator feat(audio_prompts): add en_narrator_deep audio prompt for narrator feat(audio_prompts): add en_narrator_light_bg audio prompt for narrator fix(video.py): fix indentation and add prompt for generating thumbnail fix(montage.py): fix indentation and add prompt for generating thumbnail fix(montage.py): fix image download for wikimage slides fix(speak.py): remove unused import statement fix(speak.py): remove unused variable 'fakenames' feat(speak.py): add function 'remove_blank_moments' to remove silent parts from audio file feat(speak.py): add function 'optimize_string_groups' to optimize string groups for audio generation fix(speak.py): fix comment indentation in 'generate_voice' function fix(speak.py): remove unused imports in 'generate_voice' function fix(speak.py): remove unused variable 'reduced_noise' in 'generate_voice' function fix(speak.py): remove unused import statements in 'generate_voice' function fix(speak.py): remove unused import statement for 'logging' module fix(speak.py): remove unused print statements in 'main' function fix(speak.py): remove unused import statement for 'logging' module fix(speak.py): remove unused print statements in 'main' function fix(speak.py): fix(wiki_downloader.py): fix Google search URL to include correct query parameter fix(wiki_downloader.py): reduce sleep time after page load to 1 second fix(wiki_downloader.py): increase sleep time after image click to 5 seconds 2023-07-02 11:17:10 +02:00			`bcg = bcg.convert('RGBA')`
			`#also set the bcg size to the image size`
			`bcg = bcg.resize((1920, 1080))`
			`img.paste(bcg, (0, 0), bcg) # TODO: make it work with standard pngs (non rgba)`
Initial commit 2023-05-15 10:11:04 +02:00			`img.paste(imgtext1, (0, 0-img.size[1]//8), imgtext1)`
			`if len(text1def.split("\n")) > 2: #if the text is too long, put the second text on the third line`
			`img.paste(imgtext2, (0, img.size[1]//8), imgtext2)`
			`else:`
			`img.paste(imgtext2, (0, 0), imgtext2)`
feat(audio_prompts): add default audio prompts for narrator feat(audio_prompts): add en_narrator_deep audio prompt for narrator feat(audio_prompts): add en_narrator_light_bg audio prompt for narrator fix(video.py): fix indentation and add prompt for generating thumbnail fix(montage.py): fix indentation and add prompt for generating thumbnail fix(montage.py): fix image download for wikimage slides fix(speak.py): remove unused import statement fix(speak.py): remove unused variable 'fakenames' feat(speak.py): add function 'remove_blank_moments' to remove silent parts from audio file feat(speak.py): add function 'optimize_string_groups' to optimize string groups for audio generation fix(speak.py): fix comment indentation in 'generate_voice' function fix(speak.py): remove unused imports in 'generate_voice' function fix(speak.py): remove unused variable 'reduced_noise' in 'generate_voice' function fix(speak.py): remove unused import statements in 'generate_voice' function fix(speak.py): remove unused import statement for 'logging' module fix(speak.py): remove unused print statements in 'main' function fix(speak.py): remove unused import statement for 'logging' module fix(speak.py): remove unused print statements in 'main' function fix(speak.py): fix(wiki_downloader.py): fix Google search URL to include correct query parameter fix(wiki_downloader.py): reduce sleep time after page load to 1 second fix(wiki_downloader.py): increase sleep time after image click to 5 seconds 2023-07-02 11:17:10 +02:00			`#disable the alpha channel`
			`img = img.convert('RGB')`
			`img_path = os.path.abspath(os.path.join(path, "thumbnail.jpg"))`
			`for quality in range(100, 0, -1):`
			`img.save(img_path, quality=quality)`
			`if os.path.getsize(img_path) < 2000000:`
			`break`
			`return img_path`