vid2voiceover

Running

App Files Files Community

tsi-org committed on Apr 1

Commit

b240f73

•

1 Parent(s): af9a186

Update app.py

Browse files

Files changed (1) hide show

app.py +103 -1

app.py CHANGED Viewed

@@ -9,7 +9,109 @@ import os
 import requests
 import tempfile
-# Assuming other function definitions remain the same...
 def main():
     st.set_page_config(page_title="AI Voiceover", page_icon="🔮")

 import requests
 import tempfile
+# Load environment variables from .env.local; check_password() reads PASSWORD from the environment via os.getenv.
+load_dotenv('.env.local')
+def check_password():
+    """Gate the app behind the password configured in the environment.
+
+    Reads the expected password from the ``PASSWORD`` environment variable and
+    compares it with the value typed into a Streamlit password field.
+
+    Returns:
+        True when the entered password matches the configured one; False when
+        no usable password is configured or the entry does not match.
+    """
+    # Local import so this block does not depend on the file's import header.
+    import hmac
+    correct_password = os.getenv('PASSWORD')
+    # Treat an empty PASSWORD like a missing one: the text input is empty by
+    # default, so an empty configured password would admit every visitor.
+    if not correct_password:
+        st.error("Password is not set in .env.local")
+        return False
+    user_password = st.text_input("Enter the password to proceed", type="password")
+    # Constant-time comparison on bytes (compare_digest rejects non-ASCII str).
+    if hmac.compare_digest(user_password.encode("utf-8"), correct_password.encode("utf-8")):
+        return True
+    # The error is reported only when the "Check Password" button is pressed.
+    if st.button("Check Password"):
+        st.error("Incorrect password")
+    return False
+def video_to_frames(video_file, frame_sampling_rate=1):
+    """Sample frames from a video and return them as base64-encoded JPEGs.
+
+    Args:
+        video_file: Readable binary file-like object holding the video; its
+            contents are copied to a temporary ``.mp4`` file.
+        frame_sampling_rate: Seconds of video between two sampled frames.
+
+    Returns:
+        A tuple ``(base64_frames, video_filename, video_duration)``: the list
+        of base64-encoded JPEG strings, the path of the temporary video file
+        (it is not deleted here), and the duration reported by VideoFileClip.
+    """
+    with tempfile.NamedTemporaryFile(delete=False, suffix='.mp4') as tmpfile:
+        tmpfile.write(video_file.read())
+        video_filename = tmpfile.name
+    # The clip is only needed for its metadata, so close it straight away
+    # instead of leaving it open for the lifetime of the process.
+    video_clip = VideoFileClip(video_filename)
+    try:
+        video_duration = video_clip.duration
+        fps = video_clip.fps
+    finally:
+        video_clip.close()
+    # Clamp to 1: a product below one frame would truncate to 0 and make the
+    # modulo below raise ZeroDivisionError.
+    frames_to_skip = max(1, int(fps * frame_sampling_rate))
+    video = cv2.VideoCapture(video_filename)
+    base64Frame = []
+    current_frame = 0
+    try:
+        while video.isOpened():
+            success, frame = video.read()
+            if not success:
+                break
+            # Keep one frame out of every ``frames_to_skip``.
+            if current_frame % frames_to_skip == 0:
+                _, buffer = cv2.imencode('.jpg', frame)
+                base64Frame.append(base64.b64encode(buffer).decode("utf-8"))
+            current_frame += 1
+    finally:
+        # Release the capture handle even if decoding or encoding fails.
+        video.release()
+    print(f"{len(base64Frame)} frames read at a sampling rate of {frame_sampling_rate} second(s) per frame.")
+    return base64Frame, video_filename, video_duration
+def frames_to_story(base64Frames, prompt, api_key):
+    """Send the prompt and a sample of the frames to the chat model.
+
+    Args:
+        base64Frames: Sequence of base64-encoded frame strings; every 50th
+            entry, starting with the first, is included in the request.
+        prompt: Instruction placed ahead of the images in the user message.
+        api_key: API key forwarded to ``openai.ChatCompletion.create``.
+
+    Returns:
+        The content of the first choice's message, which is also printed.
+    """
+    # Each sampled frame is wrapped with a resize value of 768.
+    sampled_images = [
+        {"image": encoded, "resize": 768} for encoded in base64Frames[::50]
+    ]
+    user_message = {"role": "user", "content": [prompt, *sampled_images]}
+    completion = openai.ChatCompletion.create(
+        model="gpt-4-vision-preview",
+        messages=[user_message],
+        api_key=api_key,
+        headers={"Openai-Version": "2020-11-07"},
+        max_tokens=1000,
+    )
+    story = completion.choices[0].message.content
+    print(story)
+    return story
+def text_to_audio(text, api_key, voice):
+    """Turn text into speech through the OpenAI ``/v1/audio/speech`` endpoint.
+
+    Args:
+        text: Text sent as the ``input`` field of the request.
+        api_key: Key sent as the bearer token in the Authorization header.
+        voice: Value sent as the ``voice`` field of the request.
+
+    Returns:
+        A tuple ``(audio_filename, audio_bytes_io)``: the path of a temporary
+        file holding the response body (it is not deleted here) and a
+        ``BytesIO`` with the same bytes, positioned at the start.
+
+    Raises:
+        Exception: If the endpoint answers with a status other than 200.
+    """
+    response = requests.post(
+        "https://api.openai.com/v1/audio/speech",
+        headers={
+            "Authorization": f"Bearer {api_key}",
+        },
+        json={
+            "model": "tts-1",
+            "input": text,
+            "voice": voice,
+        },
+    )
+    if response.status_code != 200:
+        # Report the actual status and body so the failure can be diagnosed.
+        raise Exception(
+            f"Request failed with status code {response.status_code}: {response.text}"
+        )
+    # The request is not streamed, so the whole body is already in memory;
+    # read it once and reuse it for both outputs.
+    audio_data = response.content
+    audio_bytes_io = io.BytesIO(audio_data)
+    # NOTE(review): the file gets a .wav suffix although the request does not
+    # ask for a response format - confirm the endpoint's default matches.
+    with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as tmpfile:
+        tmpfile.write(audio_data)
+        audio_filename = tmpfile.name
+    return audio_filename, audio_bytes_io
+def merge_audio_video(video_filename, audio_filename, output_filename):
+    """Write a copy of the video with its audio track replaced.
+
+    Args:
+        video_filename: Path of the source video file.
+        audio_filename: Path of the audio file to attach.
+        output_filename: Path the merged video is written to.
+
+    Returns:
+        ``output_filename``, unchanged.
+    """
+    print("Merging audio and video ...")
+    video_clip = VideoFileClip(video_filename)
+    try:
+        audio_clip = AudioFileClip(audio_filename)
+        try:
+            final_clip = video_clip.set_audio(audio_clip)
+            final_clip.write_videofile(output_filename, codec='libx264', audio_codec="aac")
+        finally:
+            # Close the audio clip even when encoding fails.
+            audio_clip.close()
+    finally:
+        # Close the video clip even when opening the audio or encoding fails.
+        video_clip.close()
+    return output_filename
 def main():
     st.set_page_config(page_title="AI Voiceover", page_icon="🔮")