Spaces:

product2204
/

Image_audio_2_Video

Runtime error

App Files Files Community

product2204 committed on Apr 7

Commit

bb6011e

•

1 Parent(s): eba5601

Update app.py

Browse files

Files changed (1) hide show

app.py +121 -51

app.py CHANGED Viewed

@@ -1,66 +1,136 @@
-import gradio as gr
 import cv2
 import numpy as np
-import tempfile
-import soundfile as sf
-from moviepy.editor import VideoFileClip, concatenate_videoclips,AudioFileClip
-def image_to_video(image, audio, fps=30):
     """
-    Converts an image (NumPy array) and audio (tuple of sample rate and audio data)
-    into a video file.
     Parameters:
-    - image: Input image as a NumPy array.
-    - audio: Input audio as a tuple of (sample rate, audio data as a NumPy array).
     - fps: Frames per second of the output video.
-    Returns:
-    - Path to the generated video file.
     """
-    # Create a temporary video file
-    video_path = tempfile.mktemp('.mp4')
-    # Save the image to a temporary file
-    image_path = tempfile.mktemp('.png')
-    cv2.imwrite(image_path, image)
-    # Create VideoWriter to write frames
-    height, width, _ = image.shape
-    fourcc = cv2.VideoWriter_fourcc(*'mp4v')
     video = cv2.VideoWriter(video_path, fourcc, fps, (width, height))
-    # Determine the duration from the audio sample count and sample rate
-    sample_rate, audio_data = audio
-    duration_sec = len(audio_data) / sample_rate
-    # Write the image to the video file for the required number of frames
-    num_frames = int(duration_sec * fps)
-    for _ in range(num_frames):
-        video.write(cv2.imread(image_path))
     video.release()
-    # Save the audio to a temporary file
-    audio_path = tempfile.mktemp('.wav')
-    sf.write(audio_path, audio_data.T, sample_rate)  # Transpose if necessary for multi-channel audio
-    # Combine the video and audio
     video_clip = VideoFileClip(video_path)
     audio_clip = AudioFileClip(audio_path)
     final_clip = video_clip.set_audio(audio_clip)
-    final_clip.write_videofile(video_path, codec="libx264", audio_codec="aac")
     return video_path
-# Gradio interface
-iface = gr.Interface(
-    fn=image_to_video,
-    inputs=[
-        gr.Image(type="numpy"),
-        gr.Audio(type="numpy", label="Audio (Sample Rate, Audio Data)")
-    ],
-    outputs=gr.Video("video"),
-    title="Image and Audio to Video Converter",
-    description="Upload an image and audio to convert them into a video."
-)
-iface.launch(debug=True,share=True)

 import cv2
 import numpy as np
+from pydub import AudioSegment
+from moviepy.editor import VideoFileClip, AudioFileClip
+def image_to_video(image_path, video_path,audio_path,  fps=30):
     """
+    Render a still image as a video whose length matches an audio track.
+
+    The image is repeated for as many frames as the audio lasts, then the
+    audio is muxed into the result with moviepy.
+
     Parameters:
+    - image_path: Path to the input image.
+    - video_path: Path where the output video will be saved.
+    - audio_path: Path to the audio file; its length sets the video duration.
     - fps: Frames per second of the output video.
+
+    Returns:
+    - video_path, after the file with both picture and sound has been written.
+
+    Raises:
+    - ValueError: if the image cannot be loaded from image_path.
     """
+    import os
+    # Load the image
+    print("image_path",image_path)
+    img = cv2.imread(image_path)
+    if img is None:
+        raise ValueError("Image could not be loaded. Please check the path.")
+    # Get image dimensions
+    height, width, _ = img.shape
+    # Define the codec and create VideoWriter object
+    fourcc = cv2.VideoWriter_fourcc(*'mp4v')  # Use 'XVID' if you prefer AVI format
     video = cv2.VideoWriter(video_path, fourcc, fps, (width, height))
+    audio = AudioSegment.from_file(audio_path)
+    duration_sec = len(audio) / 1000.0  # Duration in milliseconds to seconds
+    # Always emit at least one frame so very short audio still yields a video
+    num_frames = max(1, round(duration_sec * fps))
+    # Write the image to video file for the required number of frames
+    for _ in range(num_frames):
+        video.write(img)
+    # Release the video writer
     video.release()
+    # The clip below keeps video_path open for reading, so the muxed result
+    # is written to a sibling file and moved into place afterwards instead
+    # of overwriting the file while it is still being read.
+    root, ext = os.path.splitext(video_path)
+    muxed_path = f"{root}_muxed{ext}"
     video_clip = VideoFileClip(video_path)
     audio_clip = AudioFileClip(audio_path)
     final_clip = video_clip.set_audio(audio_clip)
+    try:
+        final_clip.write_videofile(muxed_path, codec="libx264", audio_codec="aac")
+    finally:
+        # Release the underlying readers before the file is replaced
+        audio_clip.close()
+        video_clip.close()
+    os.replace(muxed_path, video_path)
     return video_path
+def rename():
+    """
+    Rename the first .jpg and .wav files in the working directory.
+
+    The first .jpg found becomes 'logo.jpg' and the first .wav found becomes
+    'audio.wav', both inside the current working directory. A file type
+    that is not present is reported on stdout and nothing is moved for it.
+
+    Returns:
+    - (image_path_new, audio_path_new): the target paths. They are returned
+      whether or not a matching file was actually found and moved.
+    """
+    import os
+    import shutil
+    # Define the directory to search in
+    directory = os.getcwd()
+    # New paths with desired names (defined before anything refers to them)
+    image_path_new = os.path.join(directory, 'logo.jpg')
+    audio_path_new = os.path.join(directory, 'audio.wav')
+    # Initialize variables for the first .jpg and .wav files found
+    first_jpg_file = None
+    first_wav_file = None
+    # os.listdir returns entries in arbitrary order; sort so that "first"
+    # means the same file on every run
+    for filename in sorted(os.listdir(directory)):
+        if filename.endswith('.jpg') and first_jpg_file is None:
+            first_jpg_file = os.path.join(directory, filename)
+        elif filename.endswith('.wav') and first_wav_file is None:
+            first_wav_file = os.path.join(directory, filename)
+        if first_jpg_file and first_wav_file:
+            break
+    # Rename (or move) the image file if found
+    if first_jpg_file:
+        shutil.move(first_jpg_file, image_path_new)
+        print(f"Image file renamed to {image_path_new}")
+    else:
+        print("No .jpg file found.")
+    # Rename (or move) the audio file if found
+    if first_wav_file:
+        shutil.move(first_wav_file, audio_path_new)
+        print(f"Audio file renamed to {audio_path_new}")
+    else:
+        print("No .wav file found.")
+    return  image_path_new,audio_path_new
+# UI callback: picks the output location and delegates to image_to_video
+def image_audio_to_video(image_path, audio_path):
+    """
+    Create 'video.mp4' in the working directory from an image and an audio file.
+
+    Parameters:
+    - image_path: Path to the input image.
+    - audio_path: Path to the input audio file.
+
+    Returns:
+    - Path of the generated video file.
+
+    Raises:
+    - ValueError: if either path is missing (None or empty).
+    """
+    import os
+    if not image_path or not audio_path:
+        raise ValueError("Both an image and an audio file are required.")
+    work_dir = os.getcwd()
+    print("dir",work_dir)
+    # os.getcwd() is already absolute; join it rather than prefixing another "/"
+    video_path = os.path.join(work_dir, "video.mp4")
+    print("video_path",video_path)
+    image_to_video(image_path, video_path,audio_path)
+    return video_path
+import gradio as gr
+def setup_interface():
+    """
+    Setup and launch the Gradio interface.
+
+    Builds a two-column layout (image and audio inputs on one side, the
+    output video on the other) plus a "Create Video" button that calls
+    image_audio_to_video with both inputs, then launches the app.
+    """
+    with gr.Blocks() as demo:
+        gr.Markdown("## Create a Video from an Image and Audio")
+        with gr.Row():
+            with gr.Column():
+                image_upload = gr.Image(label="Upload Image",type="filepath")
+                audio_upload = gr.Audio(label="Upload Audio",type="filepath")
+            with gr.Column():
+                output_video = gr.Video(label="Output Video")
+        # The button is created unconditionally: image_upload and audio_upload
+        # are the components built above, not the uploaded files, so testing
+        # them here says nothing about whether the user has provided inputs.
+        submit_btn = gr.Button("Create Video")
+        # Function call on button press with both image and audio as inputs
+        submit_btn.click(fn=image_audio_to_video,
+                         inputs=[image_upload, audio_upload],
+                         outputs=output_video)
+    demo.launch(debug=True)
+# Build and launch the UI only when this file is run as a script.
+if __name__ == "__main__":
+    setup_interface()