# main.py

from g4f.client import Client
import requests
import assemblyai as aai
import json
from pydub import AudioSegment
import random
from moviepy.editor import *
from math import ceil
from os import path, mkdir, system
from shutil import rmtree
import json
from sys import platform
import seewav
import requests
import tempfile
from pathlib import Path
from time import *


# Load the API credentials from api_keys.json (a JSON object holding the keys read below).
# The file is opened in a context manager so the handle is always closed.
with open('api_keys.json', 'r', encoding='utf-8') as key_file:
    f_dat = key_file.read()
# Parse with json.loads rather than eval: the file is pure data, and eval would
# execute any Python expression that happened to be placed in it.
data = json.loads(f_dat)
#assmebly_ai_api = data["AssemblyAI_API"]
urs_api = data["UnrealSpeech_API"]


def pfp_wave(buzz, bg_m=1, fg=(1, 0.78, 0)):
    """Build the waveform clip with a character picture overlaid on it.

    Renders 'tmp/output.mp3' as a 480x480 waveform video ('tmp/waves.mp4')
    with seewav, then composites the chosen picture on top of it.

    Args:
        buzz: 1-based index of the character picture.
        bg_m: 1-based index of the waveform background colour.
        fg: RGB colour of the waveform bars, handed to seewav as a list.

    Returns:
        A CompositeVideoClip of the waveform video and the picture, both
        set to the duration of the waveform video.

    Raises:
        ValueError: if ``buzz`` or ``bg_m`` is outside the available options.
    """
    buzz_list = [
        'pictures/Denn.png',
        'pictures/Jed.jpeg',
        'pictures/Jess.jpg',
        'pictures/K-11.jpeg',
        'pictures/Kee.png',
        'pictures/Kell.jpeg',
        'pictures/Ron.jpeg',
    ]
    bg_list = [
        [0.21, 0.22, 0.24],
        [0.9058, 0.4352, 0.3176],
        [0.3960, 0.5058, 0.2784],
        [0.4549, 0.3176, 0.1764],
        [0.6745, 0.8823, 0.6862],
        [0.4549, 0.4117, 0.7137],
    ]

    # Validate explicitly: with plain indexing, 0 or a negative option would
    # silently wrap around to an entry at the end of the list.
    if not 1 <= buzz <= len(buzz_list):
        raise ValueError(
            f"Unknown character option {buzz!r}; expected 1-{len(buzz_list)}"
        )
    if not 1 <= bg_m <= len(bg_list):
        raise ValueError(
            f"Unknown background colour option {bg_m!r}; expected 1-{len(bg_list)}"
        )

    video_p = buzz_list[buzz - 1]
    bg = bg_list[bg_m - 1]

    #use seewav to generate waveform video
    #The 'seewav' module in the given codebase is a modded version of a pull request by @Phoenix616 in the github page of the base seewav module

    with tempfile.TemporaryDirectory() as tmp:
        seewav.visualize(
            audio=Path('tmp/output.mp3'),
            tmp=Path(tmp),
            out=Path("tmp/waves.mp4"),
            fg_color=list(fg),
            bg_color=bg,
            size=(480, 480),
            bars=70,
        )

    video = VideoFileClip("tmp/waves.mp4")
    video_duration = video.duration
    x_pos = 20
    y_pos = 'center'

    # Picture sits 20 px from the left edge, vertically centred, 150 px tall.
    title = (
        ImageClip(video_p)
        .set_pos((x_pos, y_pos))
        .resize(height=150)
    )
    final = CompositeVideoClip(
        [video.set_duration(video_duration), title.set_duration(video_duration)]
    )
    return final

def v_merger(clip1, clip2):
    """Return a split-screen clip with clip1 stacked above clip2."""
    # One clip per row gives a vertical (top/bottom) split screen.
    stacked_rows = [[clip1], [clip2]]
    return clips_array(stacked_rows)


def _srt_timestamp(seconds):
    """Format a time in seconds as an SRT timestamp (HH:MM:SS,mmm)."""
    # Work in whole milliseconds so rounding can never produce "60,000" seconds.
    total_ms = max(0, round(seconds * 1000))
    hours, remainder = divmod(total_ms, 3_600_000)
    minutes, remainder = divmod(remainder, 60_000)
    secs, millis = divmod(remainder, 1000)
    return f"{hours:02d}:{minutes:02d}:{secs:02d},{millis:03d}"


def json_to_srt(json_file_path, srt_file_path):
    """Convert a JSON list of timestamped entries into an SRT subtitle file.

    Args:
        json_file_path: path to a JSON array whose items carry 'start' and
            'end' times in seconds plus the caption under 'word'.
        srt_file_path: path of the SRT file to write (UTF-8).

    Raises:
        KeyError: if an entry lacks 'start', 'end' or the caption text.
    """
    with open(json_file_path, 'r', encoding='utf-8') as json_file:
        data = json.load(json_file)

    # Build every cue before opening the output, so a malformed entry does not
    # leave a half-written subtitle file behind.
    cues = []
    for index, subtitle in enumerate(data, start=1):
        start_time = subtitle['start']
        # -0.03 to ensure that the subtitles don't overlap; never end before the start.
        end_time = max(start_time, subtitle['end'] - 0.03)
        # NOTE(review): sentence-level timestamp entries appear to carry the
        # caption under 'text' instead of 'word' - confirm against the API.
        text = subtitle['word'] if 'word' in subtitle else subtitle['text']
        cues.append(
            f"{index}\n"
            f"{_srt_timestamp(start_time)} --> {_srt_timestamp(end_time)}\n"
            f"{text}\n\n"
        )

    with open(srt_file_path, 'w', encoding='utf-8') as srt_file:
        srt_file.writelines(cues)


def a_mixer(num):
    """Mix the voice-over with a background music track.

    Overlays 'music/<track>.mp3' onto 'tmp/output.mp3' starting at position 0
    and exports the result to 'tmp/F_output.mp3'.

    Args:
        num: music option (1 = Minecraft, 2 = Subwoofer Lullaby, 3 = Moog City 2).

    Returns:
        An AudioFileClip opened on 'tmp/F_output.mp3'.

    Raises:
        ValueError: if ``num`` is not one of the known music options.
    """
    tracks = {
        1: "Minecraft",
        2: "Subwoofer_Lullaby",
        3: "Moog_City_2",
    }
    # Fail with a clear message instead of hitting an unbound local variable.
    if num not in tracks:
        raise ValueError(
            f"Unknown music option {num!r}; expected one of {sorted(tracks)}"
        )
    au_path = tracks[num]

    sound1 = AudioSegment.from_file(f"music/{au_path}.mp3", format="mp3")
    sound2 = AudioSegment.from_file("tmp/output.mp3", format="mp3")

    # The voice-over is the base segment; the music is laid over it from the start.
    overlay = sound2.overlay(sound1, position=0)
    overlay.export("tmp/F_output.mp3", format="mp3")
    return AudioFileClip("tmp/F_output.mp3")


def backdrop(buzz):
    """Cut a random stretch of gameplay footage matching the voice-over length.

    Args:
        buzz: gameplay option (1 = Minecraft, 2 = Forza Horizon 5, 3 = GTA V,
            4 = Trackmania).

    Returns:
        A subclip of the chosen video whose length is the duration of
        'tmp/output.mp3' rounded up to a whole second.

    Raises:
        ValueError: if ``buzz`` is not a known option, or the gameplay video
            is shorter than the voice-over.
    """
    backdrops = {
        1: 'backdrop/minecraft.mp4',
        2: 'backdrop/fh5.mp4',
        3: 'backdrop/gtav.mp4',
        4: 'backdrop/trackmania.mp4',
    }
    # Fail with a clear message instead of hitting an unbound local variable.
    if buzz not in backdrops:
        raise ValueError(
            f"Unknown backdrop option {buzz!r}; expected one of {sorted(backdrops)}"
        )
    video_path = backdrops[buzz]

    audio_duration = AudioSegment.from_file('tmp/output.mp3').duration_seconds

    # Open the video once and reuse it for both the duration and the subclip,
    # rather than opening a second reader that is never closed.
    clip = VideoFileClip(video_path)
    video_duration = clip.duration

    clip_length = ceil(audio_duration)
    if clip_length > video_duration:
        clip.close()
        raise ValueError(
            f"Backdrop video {video_path!r} ({video_duration:.1f}s) is shorter "
            f"than the voice-over ({audio_duration:.1f}s)"
        )

    # Keep a 5 s margin before the end when the video is long enough; clamp to
    # 0 so a barely-long-enough video does not give randint an empty range.
    latest_start = max(0, ceil(video_duration - (audio_duration + 5)))
    s_time = random.randint(0, latest_start)
    e_time = s_time + clip_length
    return clip.subclip(s_time, e_time)


def sub_append(font_no, weight=16, color="&H0099ff"):
    """Burn the generated subtitles into the temporary video with ffmpeg.

    Converts 'tmp/subs.srt' to 'tmp/subtitle.ass', replaces every 'Style:'
    line with one built from the chosen font, size and colour, then renders
    'tmp/temporary.mp4' with the subtitles into '<timestamp>.mp4' in the
    current directory.

    Args:
        font_no: font option (1-5).
        weight: value placed in the font-size field of the style line;
            forced to 20 for font option 5 (VT323).
        color: primary colour of the style, as an ASS colour string.

    Raises:
        ValueError: if ``font_no`` is not a known font option.
        subprocess.CalledProcessError: if an ffmpeg invocation fails.
    """
    # Imported locally so this function does not depend on a file-level import.
    import subprocess

    fonts = {
        1: "Permanent Marker",  # was misspelled "Permanant", which no installed font matches
        2: "Archivo Black",
        3: "Bebas Neue",
        4: "Jersey 10",
        5: "VT323",
    }
    # Fail with a clear message instead of hitting an unbound local variable.
    if font_no not in fonts:
        raise ValueError(
            f"Unknown font option {font_no!r}; expected one of {sorted(fonts)}"
        )
    font = fonts[font_no]
    if font_no == 5:
        weight = 20

    time_string = strftime("%d_%m_%Y__%H%M%S", localtime())
    ass_file_path = 'tmp/subtitle.ass'
    ffmpeg_base = ["ffmpeg", "-hide_banner", "-loglevel", "error"]

    # Argument lists (no shell) plus check=True: a failed conversion stops here
    # instead of surfacing later as a missing or stale file.
    subprocess.run(
        ffmpeg_base + ["-i", "tmp/subs.srt", ass_file_path],
        check=True,
    )

    new_style_definition = f'Style: Default,{font},{weight},{color},&Hffffff,&H0,&H0,1,0,0,0,100,100,0,0,1,1,2,5,50,50,50,1\n'

    with open(ass_file_path, 'r', encoding='utf-8') as file:
        lines = file.readlines()

    # Swap every style line in a single pass.
    lines = [
        new_style_definition if line.strip().startswith('Style:') else line
        for line in lines
    ]

    # Write back with the same encoding the file was read with.
    with open(ass_file_path, 'w', encoding='utf-8') as file:
        file.writelines(lines)

    subprocess.run(
        ffmpeg_base + [
            "-i", "tmp/temporary.mp4",
            "-vf", "ass=tmp/subtitle.ass",
            "-c:a", "copy",
            "-c:v", "libx264",
            "-crf", "23",
            "-preset", "veryfast",
            f"{time_string}.mp4",
        ],
        check=True,
    )


def add_aud(videoclip, audioclip):
    """Attach audioclip to videoclip and render it to 'tmp/temporary.mp4'.

    The audio is wrapped in a CompositeAudioClip and assigned to the
    ``audio`` attribute of the clip that was passed in.
    """
    soundtrack = CompositeAudioClip([audioclip])
    videoclip.audio = soundtrack
    videoclip.write_videofile(
        "tmp/temporary.mp4",
        codec='libx264',
        audio_codec='aac',
    )


#def subs():
#    #to remove
#    #generates subtitles using AssemblyAI API
#    #this function is called only when "Timestamp captions" are set to "Sentence"
#
#    aai.settings.api_key = assmebly_ai_api
#    transcriber = aai.Transcriber()
#    transcript = transcriber.transcribe('tmp/output.mp3')
#    with open('tmp/subs.srt', 'a+') as handler:
    #        handler.write(transcript.export_subtitles_srt())


def model(buzz):
    """Generate the video transcript for the prompt ``buzz``.

    Sends one user message (fixed instructions followed by the prompt) to the
    "gpt-3.5-turbo" model through the g4f client and returns the content of
    the first choice.
    """
    instructions = "Just answer the given question under 100 words in English, DO NOT include any titles, bullet points, Citations, or any special charecters, just the transcript. Now here is the Prompt :  "
    user_message = {"role": "user", "content": instructions + buzz}

    completion = Client().chat.completions.create(
        model="gpt-3.5-turbo",
        messages=[user_message],
    )
    return completion.choices[0].message.content


def voice_charecter(chr, trs, caps):
    """Generate the voice-over and its timestamps through the UnrealSpeech API.

    Posts the transcript to the speech endpoint, then downloads the audio to
    'tmp/output.mp3' and the timestamps to 'tmp/subs.json'.

    Args:
        chr: voice option (1 = Dan, 2 = Will, 3 = Scarlett, 4 = Liv, 5 = Amy).
        trs: transcript text to synthesise.
        caps: value sent as the request's "TimestampType".

    Raises:
        ValueError: if ``chr`` is not a known voice option.
        requests.HTTPError: if the API or a download answers with an error status.
        KeyError: if the API response lacks "OutputUri" or "TimestampsUri".
    """
    voices = {1: "Dan", 2: "Will", 3: "Scarlett", 4: "Liv", 5: "Amy"}
    # Fail with a clear message instead of hitting an unbound local variable.
    if chr not in voices:
        raise ValueError(
            f"Unknown voice option {chr!r}; expected one of {sorted(voices)}"
        )
    charecter = voices[chr]

    # Without a timeout a stalled connection would block the script forever.
    request_timeout = 120

    url = "https://api.v6.unrealspeech.com/speech"

    payload = {
        "Text": trs,
        "VoiceId": charecter,
        "Bitrate": "192k",
        "Speed": "0",
        "Pitch": "1",
        "TimestampType": caps
    }
    headers = {
        "accept": "application/json",
        "content-type": "application/json",
        "Authorization": f"Bearer {urs_api}"
    }

    response = requests.post(url, json=payload, headers=headers, timeout=request_timeout)
    # Surface API failures here, not as a confusing KeyError further down.
    response.raise_for_status()
    # NOTE(review): presumably gives the service time to publish the output
    # files before they are fetched - confirm whether this pause is needed.
    sleep(5)

    res = response.json()

    voiceover = requests.get(res["OutputUri"], timeout=request_timeout)
    voiceover.raise_for_status()
    with open("tmp/output.mp3", 'wb') as f:
        f.write(voiceover.content)

    subs = requests.get(res["TimestampsUri"], timeout=request_timeout)
    subs.raise_for_status()
    with open("tmp/subs.json", 'wb') as f:
        f.write(subs.content)


def clear():
    """Wipe the terminal and print the banner in blue."""
    # "cls" on Windows, "clear" on every other platform.
    wipe_command = "cls" if platform.startswith('win') else "clear"
    system(wipe_command)

    banner = '''
░░      ░░░░      ░░░░      ░░░░      ░░░        ░░        ░░        ░░        ░
▒  ▒▒▒▒  ▒▒  ▒▒▒▒  ▒▒  ▒▒▒▒▒▒▒▒  ▒▒▒▒▒▒▒▒  ▒▒▒▒▒▒▒▒▒▒▒  ▒▒▒▒▒▒▒▒  ▒▒▒▒▒  ▒▒▒▒▒▒▒
▓  ▓▓▓▓▓▓▓▓  ▓▓▓▓  ▓▓▓      ▓▓▓▓      ▓▓▓      ▓▓▓▓▓▓▓  ▓▓▓▓▓▓▓▓  ▓▓▓▓▓      ▓▓▓
█  ████  ██        ████████  ████████  ██  ███████████  ████████  █████  ███████
██      ███  ████  ███      ████      ███        █████  ████████  █████        █

'''
    # \033[94m switches the terminal foreground colour before the banner.
    print('\033[94m' + banner)


def _ask_choice(prompt, option_count, default=None):
    """Ask until the user enters a whole number between 1 and option_count.

    A blank answer returns ``default`` when one is given.
    """
    while True:
        raw = input(prompt).strip()
        if not raw and default is not None:
            return default
        try:
            choice = int(raw)
        except ValueError:
            choice = None
        if choice is not None and 1 <= choice <= option_count:
            return choice
        print(f"Please enter a number between 1 and {option_count}.")


def main():
    """Run the interactive workflow from prompt to finished video.

    Resets the 'tmp' working directory, collects the user's choices,
    generates the script, voice-over and subtitles, builds the split-screen
    video, mixes in the music, burns the captions and finally offers to
    delete the working directory.
    """
    clear()
    # Start every run from an empty working directory.
    if path.exists("tmp"):
        rmtree("tmp")
    mkdir("tmp")

    #Choice-form

    QueryList = {}
    QueryList["script"] = input('\033[94m'+'''1. Transcript Prompt :

>>>  ''')
    clear()
    QueryList["music"] = _ask_choice('''\n2. Use Background music?
2.1 : Minecraft (press 1)
2.2 : Subwoofer Lullaby (press 2)
2.3 : Moog City 2 (press 3)

>>> ''', 3)

    clear()
    QueryList["voices"] = _ask_choice('''\n3. Coose a voice :
3.1 : Dan: Young Male (press 1)
3.2 : Will: Mature Male (press 2)
3.3 : Scarlett: Young Female (press 3)
3.4 : Liv: Young Female (press 4)
3.5 : Amy: Mature Female (press 5)

>>> ''', 5)

    clear()
    QueryList["backdrop"] = _ask_choice('''4. Choose a background gameplay :
4.1 : Minecraft (press 1)
4.2 : Forza Horizon 5 (press 2)
4.3 : GTAV (press 3)
4.4 : trackmania (press 4)


>>> ''', 4)

    clear()
    QueryList["charecter"] = _ask_choice('''5. Choose a charecter image.
5.1 : Denn (press 1)
5.2 : Jed (press 2)
5.3 : Jess (press 3)
5.4 : K-11 (press 4)
5.5 : Kee (press 5)
5.6 : Kell (press 6)
5.7 : Ron (press 7)

>>> ''', 7)

    clear()
    QueryList["SubType"] = _ask_choice('''\n6. Subtitles or Timestamps type :
6.1 : Word (press 1)
6.2 : Sentence (press 2)

>>> ''', 2)

    clear()
    QueryList["Font"] = _ask_choice('''\n7. Choose a Font :
7.1 : Permanant Marker (press 1)
7.2 : Archivo Black (press 2)
7.3 : Bebas Neue (press 3)
7.4 : Jersey 10 (press 4)
7.5 : VT323 (press 5)

>>> ''', 5)

    clear()
    # A blank answer selects the default the prompt advertises (Discord Black).
    QueryList["colour"] = _ask_choice('''\n8. Choose a BackGround Colour :
8.1 : Discord Black (press 1)
8.2 : Vermillion (press 2)
8.3 : Sap Green (press 3)
8.4 : Brown (press 4)
8.5 : Glass Green (press 5)
8.6 : Ultramarine Blue (press 6)

[default - Discord Black]

>>> ''', 6, default=1)

    clear()
    #main-code
    script = model(QueryList['script'])
    print(script)
    print('\n'+'[*] Script Generated\n')

    # The timestamp type was previously sent misspelled as "sentance".
    timestamp_type = "word" if QueryList["SubType"] == 1 else "sentence"
    voice_charecter(QueryList['voices'], script, timestamp_type)

    print('\n'+'[*] Voice and Subtitles Generated\n')

    json_to_srt('tmp/subs.json', 'tmp/subs.srt')

    bckdrp = backdrop(QueryList["backdrop"])
    pwave = pfp_wave(QueryList['charecter'], QueryList["colour"])
    print('\n'+'[*] Background Video Generated\n')

    a_mixed = a_mixer(QueryList['music'])
    merg = v_merger(pwave, bckdrp)

    print('\n'+'[*] Mixing Audio\n')
    add_aud(merg, a_mixed)

    print('\n'+'[*] Burning Captions\n')
    sub_append(QueryList["Font"])

    #--

    print("\n[*] Job Finished")

    # Only an explicit "y" deletes the working directory.
    delr = input("delete all non essential files? (y/n) : ")
    if delr.strip().lower() == "y":
        rmtree("tmp/")

# Run the interactive workflow only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == "__main__":
    _is_main = True  # module-level flag; not read anywhere in the visible source
    main()