Spaces:
Runtime error
Martin Tomov committed • Commit 663e3d1 • 1 Parent(s): e3b186c
Update app.py
app.py CHANGED
@@ -1,4 +1,3 @@
-from dotenv import load_dotenv
 from IPython.display import display, Image, Audio
 from moviepy.editor import VideoFileClip, AudioFileClip
 from moviepy.audio.io.AudioFileClip import AudioFileClip
@@ -12,9 +11,6 @@ import requests
 import streamlit as st
 import tempfile

-# Load environment variables from .env.local
-load_dotenv('.env.local')
-
 ## 1. Turn video into frames
 def video_to_frames(video_file):
     # Save the uploaded video file to a temporary file
@@ -73,20 +69,14 @@ def text_to_audio(text, api_key, voice):
         },
     )

-    # Check if the request was successful
     if response.status_code != 200:
         raise Exception("Request failed with status code")

-    # Create an in-memory bytes buffer
     audio_bytes_io = io.BytesIO()
-    # Write audio data to the in-memory bytes buffer
     for chunk in response.iter_content(chunk_size=1024*1024):
         audio_bytes_io.write(chunk)
-
-    # Important: Seek to the start of the BytesIO buffer before returning
     audio_bytes_io.seek(0)

-    # Save audio to a temporary file
     with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as tmpfile:
         for chunk in response.iter_content(chunk_size=1024*1024):
             tmpfile.write(chunk)
@@ -97,73 +87,51 @@ def text_to_audio(text, api_key, voice):
 ## 4. Merge videos & audio
 def merge_audio_video(video_filename, audio_filename, output_filename):
     print("Merging audio and video ...")
-    # Load the video file
     video_clip = VideoFileClip(video_filename)
-    # Load the audio file
     audio_clip = AudioFileClip(audio_filename)
-    # Set the audio of the video clip as the audio file
     final_clip = video_clip.set_audio(audio_clip)
-    # Write the result to a file (without audio)
     final_clip.write_videofile(output_filename, codec='libx264', audio_codec="aac")
-    # Close the clips
     video_clip.close()
     audio_clip.close()

-    # Return the path to the new video file
     return output_filename

 ## 5. Streamlit UI
 def main():
     st.set_page_config(page_title="AI Voiceover", page_icon="🔮")
     st.title("GPT4V AI Voiceover 🎥🔮")
-    st.
+    openai_key = st.text_input("Enter your OpenAI API key")

-    # Retrieve the OpenAI API key from environment
-    openai_key = os.getenv('OPENAI_API_KEY')
     if not openai_key:
-        st.error("OpenAI API key
-        return
-
+        st.error("Please enter your OpenAI API key.")
+        return
+
     uploaded_file = st.file_uploader("Select a video file", type=["mp4", "avi"])

     option = st.selectbox(
         'Choose the voice you want',
         ('Female Voice', 'Male Voice'))
-    classify = ''
-    if option == 'Male Voice':
-        classify = 'alloy'
-    elif option == 'Female Voice':
-        classify = 'nova'
+    classify = 'alloy' if option == 'Male Voice' else 'nova'

     if uploaded_file is not None:
         st.video(uploaded_file)
         p = 'Generate a short voiceover script for the video, matching the content with the video scenes. The style should be...'
-
-        prompt = st.text_area(
-            "Prompt", value=p
-        )
+        prompt = st.text_area("Prompt", value=p)

     if st.button("START PROCESSING", type="primary") and uploaded_file is not None:
         with st.spinner("Video is being processed..."):
             base64Frame, video_filename, video_duration = video_to_frames(uploaded_file)
             est_word_count = video_duration * 4
-            final_prompt =
+            final_prompt = f"{prompt}(This video is ONLY {video_duration} seconds long. So make sure the voiceover MUST be able to be explained in less than {est_word_count} words. Ignore and don't generate anything else than the script that you'll use to voice over the video.)"
             text = frames_to_story(base64Frame, final_prompt, openai_key)
             st.write(text)
-            # Generate audio from text
             audio_filename, audio_bytes_io = text_to_audio(text, openai_key, classify)
-            # Merge audio and video
             output_video_filename = os.path.splitext(video_filename)[0] + "_output.mp4"
-
             final_video_filename = merge_audio_video(video_filename, audio_filename, output_video_filename)
-
-            # Display the result
             st.video(final_video_filename)
-
-            # Clean up the temporary files
             os.unlink(video_filename)
             os.unlink(audio_filename)
             os.unlink(final_video_filename)

 if __name__ == "__main__":
-    main()
+    main()
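With the .env.local loading removed, nothing has to be configured before launch: the key is pasted into the new text input at runtime. Assuming the Space's existing dependencies are installed (its requirements file is not part of this diff), a local run uses the standard Streamlit command:

streamlit run app.py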
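For reference, the voiceover length budget kept by this commit assumes roughly four spoken words per second of video (est_word_count = video_duration * 4), so a 30-second upload gets a 120-word ceiling baked into final_prompt. A minimal standalone sketch of that construction; build_final_prompt is a hypothetical helper name, not a function in app.py:

def build_final_prompt(prompt: str, video_duration: float) -> str:
    # Same heuristic as app.py: budget about 4 spoken words per second of video.
    est_word_count = video_duration * 4
    return (
        f"{prompt}(This video is ONLY {video_duration} seconds long. "
        f"So make sure the voiceover MUST be able to be explained in less than "
        f"{est_word_count} words. Ignore and don't generate anything else than "
        f"the script that you'll use to voice over the video.)"
    )

# Example: a 30-second clip yields a 120-word budget (30 * 4 = 120).
print(build_final_prompt("Generate a short voiceover script for the video...", 30))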