Spaces:

ford442
/

LTX-Video

Running on Zero

App Files Community

ford442 committed 8 days ago

Commit

ce99327

•

1 Parent(s): 4c1a182

Update app.py

Browse files

Files changed (1) hide show

app.py +12 -10

app.py CHANGED Viewed

@@ -25,7 +25,6 @@ import gc
 import csv
 from datetime import datetime
 from openai import OpenAI
-#from gradio import themes
 torch.backends.cuda.matmul.allow_tf32 = False
 torch.backends.cuda.matmul.allow_bf16_reduced_precision_reduction = False
@@ -34,7 +33,7 @@ torch.backends.cudnn.allow_tf32 = False
 torch.backends.cudnn.deterministic = False
 #torch.backends.cudnn.benchmark = False
 torch.backends.cuda.preferred_blas_library="cublas"
-torch.backends.cuda.preferred_linalg_library="cusolver"
 torch.set_float32_matmul_precision("highest")
@@ -67,9 +66,10 @@ device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 request_log = []
-clip_model = CLIPModel.from_pretrained("openai/clip-vit-base-patch32", cache_dir=model_path).to(torch.device("cuda:0"))
 clip_processor = CLIPProcessor.from_pretrained("openai/clip-vit-base-patch32", cache_dir=model_path)
 def compute_clip_embedding(text=None, image=None):
     """
     Compute CLIP embedding for a given text or image.
@@ -218,7 +218,7 @@ vae = load_vae(vae_dir)
 unet = load_unet(unet_dir)
 scheduler = load_scheduler(scheduler_dir)
 patchifier = SymmetricPatchifier(patch_size=1)
-text_encoder = T5EncoderModel.from_pretrained("PixArt-alpha/PixArt-XL-2-1024-MS", subfolder="text_encoder").to(torch.device("cuda:0"))
 tokenizer = T5Tokenizer.from_pretrained("PixArt-alpha/PixArt-XL-2-1024-MS", subfolder="tokenizer")
 pipeline = XoraVideoPipeline(
@@ -228,7 +228,7 @@ pipeline = XoraVideoPipeline(
     tokenizer=tokenizer,
     scheduler=scheduler,
     vae=vae,
-).to(torch.device("cuda:0"))
 @spaces.GPU(duration=90)  # Dynamic duration
 def generate_video_from_text_90(
@@ -319,7 +319,7 @@ def generate_video_from_image_90(
     frame_rate=20,
     seed=random.randint(0, MAX_SEED),
     num_inference_steps=35,
-    guidance_scale=4.2,
     height=768,
     width=768,
     num_frames=60,
@@ -356,7 +356,7 @@ def generate_video_from_image_90(
         "media_items": media_items,
     }
-    generator = torch.Generator(device="cuda").manual_seed(seed)
     def gradio_progress_callback(self, step, timestep, kwargs):
         progress((step + 1) / num_inference_steps)
@@ -394,16 +394,18 @@ def generate_video_from_image_90(
             f"An error occurred while generating the video. Please try again. Error: {e}",
             duration=5,
         )
     finally:
         torch.cuda.empty_cache()
         gc.collect()
     return output_path
 def create_advanced_options():
     with gr.Accordion("Step 4: Advanced Options (Optional)", open=False):
         seed = gr.Slider(label="4.1 Seed", minimum=0, maximum=1000000, step=1, value=646373)
         inference_steps = gr.Slider(label="4.2 Inference Steps", minimum=5, maximum=150, step=5, value=40)
-        guidance_scale = gr.Slider(label="4.3 Guidance Scale", minimum=1.0, maximum=10.0, step=0.1, value=4.2)
         height_slider = gr.Slider(
             label="4.4 Height",
@@ -440,7 +442,7 @@ def create_advanced_options():
         ]
 # Define the Gradio interface with tabs
-with gr.Blocks(theme=gr.themes.Glass()) as iface:
     with gr.Row(elem_id="title-row"):
         gr.Markdown(
             """
@@ -697,4 +699,4 @@ with gr.Blocks(theme=gr.themes.Glass()) as iface:
     )
 if __name__ == "__main__":
-    iface.queue(max_size=64, default_concurrency_limit=1, api_open=False).launch(share=True, show_api=False)

 import csv
 from datetime import datetime
 from openai import OpenAI
 torch.backends.cuda.matmul.allow_tf32 = False
 torch.backends.cuda.matmul.allow_bf16_reduced_precision_reduction = False
 torch.backends.cudnn.deterministic = False
 #torch.backends.cudnn.benchmark = False
 torch.backends.cuda.preferred_blas_library="cublas"
+#torch.backends.cuda.preferred_linalg_library="cusolver"
 torch.set_float32_matmul_precision("highest")
 request_log = []
+clip_model = CLIPModel.from_pretrained("openai/clip-vit-base-patch32", cache_dir=model_path).to(device)
 clip_processor = CLIPProcessor.from_pretrained("openai/clip-vit-base-patch32", cache_dir=model_path)
 def compute_clip_embedding(text=None, image=None):
     """
     Compute CLIP embedding for a given text or image.
 unet = load_unet(unet_dir)
 scheduler = load_scheduler(scheduler_dir)
 patchifier = SymmetricPatchifier(patch_size=1)
+text_encoder = T5EncoderModel.from_pretrained("PixArt-alpha/PixArt-XL-2-1024-MS", subfolder="text_encoder").to(device)
 tokenizer = T5Tokenizer.from_pretrained("PixArt-alpha/PixArt-XL-2-1024-MS", subfolder="tokenizer")
 pipeline = XoraVideoPipeline(
     tokenizer=tokenizer,
     scheduler=scheduler,
     vae=vae,
+).to(device)
 @spaces.GPU(duration=90)  # Dynamic duration
 def generate_video_from_text_90(
     frame_rate=20,
     seed=random.randint(0, MAX_SEED),
     num_inference_steps=35,
+    guidance_scale=3.2,
     height=768,
     width=768,
     num_frames=60,
         "media_items": media_items,
     }
+    generator = torch.Generator(device="cpu").manual_seed(seed)
     def gradio_progress_callback(self, step, timestep, kwargs):
         progress((step + 1) / num_inference_steps)
             f"An error occurred while generating the video. Please try again. Error: {e}",
             duration=5,
         )
     finally:
         torch.cuda.empty_cache()
         gc.collect()
     return output_path
 def create_advanced_options():
     with gr.Accordion("Step 4: Advanced Options (Optional)", open=False):
         seed = gr.Slider(label="4.1 Seed", minimum=0, maximum=1000000, step=1, value=646373)
         inference_steps = gr.Slider(label="4.2 Inference Steps", minimum=5, maximum=150, step=5, value=40)
+        guidance_scale = gr.Slider(label="4.3 Guidance Scale", minimum=1.0, maximum=10.0, step=0.1, value=3.2)
         height_slider = gr.Slider(
             label="4.4 Height",
         ]
 # Define the Gradio interface with tabs
+with gr.Blocks(theme=gr.themes.Soft()) as iface:
     with gr.Row(elem_id="title-row"):
         gr.Markdown(
             """
     )
 if __name__ == "__main__":
+    iface.queue(max_size=64, default_concurrency_limit=1, api_open=False).launch(share=True, show_api=False)