mrcuddle committed
Commit 2a768ff · verified · 1 Parent(s): 0d3b369

Update app.py

Files changed (1)
  1. app.py +42 -49
app.py CHANGED
@@ -1,55 +1,48 @@
-import gradio as gr
-from diffusers import StableVideoDiffusionPipeline, EulerDiscreteScheduler
 import torch
+import gradio as gr
+from diffusers import StableVideoDiffusionPipeline
 from PIL import Image
-import tempfile
-import imageio
-import spaces
-
-# Load the Stable Video Diffusion model
-model_id = "stabilityai/stable-video-diffusion-img2vid-xt"
-try:
-    pipe = StableVideoDiffusionPipeline.from_pretrained(model_id, torch_dtype=torch.float16, revision="main")
-    pipe.scheduler = EulerDiscreteScheduler.from_config(pipe.scheduler.config)
-    pipe.to("cuda")
-except Exception as e:
-    raise RuntimeError(f"Failed to load the model: {e}")
-
-@spaces.GPU
-def generate_video(image, num_frames=25, height=576, width=1024):
-    try:
-        # Convert the image to a format suitable for the pipeline
-        image = Image.open(image)
-        # Generate the video
-        video_frames = pipe(image=image, num_frames=num_frames, height=height, width=width).frames
-        # Save the video frames to a temporary file
-        with tempfile.NamedTemporaryFile(delete=False, suffix=".mp4") as temp_video:
-            video_path = temp_video.name
-        # Save the frames as a video using imageio
-        imageio.mimsave(video_path, video_frames, fps=30)
-        return video_path
-    except Exception as e:
-        raise RuntimeError(f"Failed to generate the video: {e}")
+import numpy as np
+from moviepy.editor import ImageSequenceClip
+
+# Load the pipeline
+pipeline = StableVideoDiffusionPipeline.from_pretrained(
+    "stabilityai/stable-video-diffusion-img2vid-xt", torch_dtype=torch.float16, variant="fp16"
+)
+pipeline.enable_model_cpu_offload()
+
+def generate_video(image, seed):
+    # Preprocess the image
+    image = Image.open(image)
+    image = image.resize((1024, 576))
+
+    # Set the generator seed
+    generator = torch.manual_seed(seed)
+
+    # Generate the video frames
+    frames = pipeline(image, decode_chunk_size=8, generator=generator).frames[0]
+
+    # The pipeline returns PIL images by default; convert them to uint8 arrays for export
+    frames = [np.array(frame) for frame in frames]
+
+    # Export the frames to a video file
+    clip = ImageSequenceClip(frames, fps=7)
+    output_video_path = "generated.mp4"
+    clip.write_videofile(output_video_path, codec="libx264")
+
+    return output_video_path
 
 # Create the Gradio interface
-with gr.Blocks() as demo:
-    gr.Markdown("## Image to Video with Stable Diffusion XT")
-    with gr.Row():
-        with gr.Column():
-            image_input = gr.Image(type="filepath", label="Upload Image")
-            num_frames_input = gr.Slider(1, 50, step=1, value=25, label="Number of Frames")
-            height_input = gr.Number(label="Resolution Height", value=576)
-            width_input = gr.Number(label="Resolution Width", value=1024)
-            run_button = gr.Button("Generate Video")
-        with gr.Column():
-            video_output = gr.Video(label="Generated Video")
-
-    run_button.click(
-        generate_video,
-        inputs=[image_input, num_frames_input, height_input, width_input],
-        outputs=video_output
-    )
+iface = gr.Interface(
+    fn=generate_video,
+    inputs=[
+        gr.Image(type="filepath", label="Upload Image"),
+        gr.Number(label="Seed", value=42)
+    ],
+    outputs=gr.Video(label="Generated Video"),
+    title="Stable Video Diffusion",
+    description="Generate a video from an uploaded image using Stable Video Diffusion."
+)
 
 # Launch the interface
-if __name__ == "__main__":
-    demo.launch()
+iface.launch()
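
The new moviepy export path can be smoke-tested without a GPU. A minimal sketch, assuming moviepy 1.x (the moviepy.editor module was removed in MoviePy 2.0); the synthetic black frames and the smoke_test.mp4 filename are placeholders, not part of this commit:

    import numpy as np
    from moviepy.editor import ImageSequenceClip

    # Stand-in for pipeline output: 7 black 1024x576 frames as uint8 arrays
    frames = [np.zeros((576, 1024, 3), dtype=np.uint8) for _ in range(7)]

    # Same export call as generate_video(): one second of video at 7 fps
    clip = ImageSequenceClip(frames, fps=7)
    clip.write_videofile("smoke_test.mp4", codec="libx264")

Note that pipeline.enable_model_cpu_offload() additionally requires the accelerate package at runtime.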