Update app.py
app.py (CHANGED)

--- a/app.py
+++ b/app.py
@@ -162,11 +162,16 @@ preset_options = [
     {"label": "1056x640, 57 frames", "width": 1056, "height": 640, "num_frames": 57},
     {"label": "448x448, 100 frames", "width": 448, "height": 448, "num_frames": 100},
     {"label": "448x448, 200 frames", "width": 448, "height": 448, "num_frames": 200},
+    {"label": "448x448, 300 frames", "width": 448, "height": 448, "num_frames": 300},
     {"label": "640x640, 80 frames", "width": 640, "height": 640, "num_frames": 80},
+    {"label": "640x640, 120 frames", "width": 640, "height": 640, "num_frames": 120},
     {"label": "768x768, 64 frames", "width": 768, "height": 768, "num_frames": 64},
+    {"label": "768x768, 90 frames", "width": 768, "height": 768, "num_frames": 90},
     {"label": "720x720, 64 frames", "width": 768, "height": 768, "num_frames": 64},
+    {"label": "720x720, 100 frames", "width": 768, "height": 768, "num_frames": 100},
     {"label": "768x512, 97 frames", "width": 768, "height": 512, "num_frames": 97},
     {"label": "512x512, 160 frames", "width": 512, "height": 512, "num_frames": 160},
+    {"label": "512x512, 200 frames", "width": 512, "height": 512, "num_frames": 200},
     {"label": "736x480, 113 frames", "width": 736, "height": 480, "num_frames": 113},
     {"label": "704x480, 121 frames", "width": 704, "height": 480, "num_frames": 121},
     {"label": "704x448, 129 frames", "width": 704, "height": 448, "num_frames": 129},
@@ -223,22 +228,10 @@ pipeline = XoraVideoPipeline(
     tokenizer=tokenizer,
     scheduler=scheduler,
     vae=vae,
-).to(
-
-
-GPU_DURATION_OPTIONS = {
-    "Short (60s)": 60,
-    "Medium (80s)": 80,
-    "Medium (100s)": 100,
-    "Long (120s)": 120,
-    "Long (140s)": 140,
-}
-
-def set_gpu_duration(duration_choice):
-    os.environ["GPU_DURATION"] = str(GPU_DURATION_OPTIONS[duration_choice])
-
-@spaces.GPU(duration=int(os.getenv("GPU_DURATION", "80")))  # Dynamic duration
-def generate_video_from_text(
+).to(device)
+
+@spaces.GPU(duration=90)  # Dynamic duration
+def generate_video_from_text_90(
     prompt="",
     enhance_prompt_toggle=False,
     txt2vid_analytics_toggle=True,
@@ -274,7 +267,7 @@ def generate_video_from_text(
         progress((step + 1) / num_inference_steps)
 
     try:
-
+        # with torch.no_grad():
         images = pipeline(
             num_inference_steps=num_inference_steps,
             num_images_per_prompt=1,
@@ -316,8 +309,8 @@ def generate_video_from_text(
     torch.cuda.empty_cache()
     return output_path
 
-@spaces.GPU(duration=int(os.getenv("GPU_DURATION", "80")))  # Dynamic duration
-def generate_video_from_image(
+@spaces.GPU(duration=90)  # Dynamic duration
+def generate_video_from_image_90(
     image_path,
     prompt="",
     enhance_prompt_toggle=False,
@@ -414,14 +407,6 @@ def create_advanced_options():
     inference_steps = gr.Slider(label="4.2 Inference Steps", minimum=5, maximum=150, step=5, value=40)
     guidance_scale = gr.Slider(label="4.3 Guidance Scale", minimum=1.0, maximum=10.0, step=0.1, value=3.2)
 
-    gpu_duration = gr.Dropdown(
-        label="GPU Duration",
-        choices=list(GPU_DURATION_OPTIONS.keys()),
-        value="Medium (80s)"  # Default value
-    )
-
-    gpu_duration.change(fn=set_gpu_duration, inputs=gpu_duration, outputs=[])
-
     height_slider = gr.Slider(
         label="4.4 Height",
         minimum=256,
@@ -679,7 +664,7 @@ with gr.Blocks(theme=gr.themes.Soft()) as iface:
     txt2vid_preset.change(fn=preset_changed, inputs=[txt2vid_preset], outputs=txt2vid_advanced[3:])
 
     txt2vid_generate.click(
-        fn=generate_video_from_text,
+        fn=generate_video_from_text_90,
         inputs=[
             txt2vid_prompt,
             txt2vid_enhance_toggle,
@@ -697,7 +682,7 @@ with gr.Blocks(theme=gr.themes.Soft()) as iface:
     img2vid_preset.change(fn=preset_changed, inputs=[img2vid_preset], outputs=img2vid_advanced[3:])
 
     img2vid_generate.click(
-        fn=generate_video_from_image,
+        fn=generate_video_from_image_90,
         inputs=[
             img2vid_image,
             img2vid_prompt,