Spaces:

MohamedRashad
/

Infinity

Running on Zero

App Files Community

MohamedRashad committed 25 days ago

Commit

f7f1ca1

1 Parent(s): 041b736

Refactor app.py to improve UI layout and rename weight download function; update import path for AutoEncoder in vae.py

Browse files

Files changed (2) hide show

app.py +29 -12
models/bsq_vae/vae.py +1 -1

app.py CHANGED Viewed

@@ -16,13 +16,12 @@ from typing import List
 import cv2
 import numpy as np
-import pandas as pd
 import torch
 import torch.nn.functional as F
 from PIL import Image, ImageEnhance
 import PIL.Image as PImage
 from torchvision.transforms.functional import to_tensor
-from transformers import AutoTokenizer, T5EncoderModel, T5TokenizerFast, T5Tokenizer, T5ForConditionalGeneration
 from huggingface_hub import hf_hub_download
 import gradio as gr
 import spaces
@@ -34,7 +33,7 @@ from utils.dynamic_resolution import dynamic_resolution_h_w, h_div_w_templates
 torch._dynamo.config.cache_size_limit = 64
 # Define a function to download weights if not present
-def download_weights(weights_path):
     try:
         model_file = weights_path / 'infinity_2b_reg.pth'
         if not model_file.exists():
@@ -361,7 +360,7 @@ def load_transformer(vae, args):
 # Set up paths
 weights_path = Path(__file__).parent / 'weights'
 weights_path.mkdir(exist_ok=True)
-download_weights(weights_path)
 # Device setup
 device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
@@ -451,16 +450,34 @@ with gr.Blocks() as demo:
     gr.Markdown("<h1><center>Infinity Image Generator</center></h1>")
     with gr.Row():
-        prompt = gr.Textbox(label="Prompt", value="alien spaceship enterprise")
-        cfg = gr.Slider(label="CFG", minimum=1, maximum=10, step=0.5, value=3)
-        tau = gr.Slider(label="Tau", minimum=0.1, maximum=1.0, step=0.1, value=0.5)
-        h_div_w = gr.Slider(label="Aspect Ratio (Height/Width)", minimum=0.5, maximum=2.0, step=0.1, value=1.0)
-        seed = gr.Number(label="Seed", value=random.randint(0, 10000))
-        enable_positive_prompt = gr.Checkbox(label="Enable Positive Prompt", value=False)
-    generate_button = gr.Button("Generate Image")
-    output_image = gr.Image(label="Generated Image", type="pil")
     generate_button.click(
         generate_image,
         inputs=[prompt, cfg, tau, h_div_w, seed, enable_positive_prompt],

 import cv2
 import numpy as np
 import torch
 import torch.nn.functional as F
 from PIL import Image, ImageEnhance
 import PIL.Image as PImage
 from torchvision.transforms.functional import to_tensor
+from transformers import AutoTokenizer, T5EncoderModel, T5TokenizerFast
 from huggingface_hub import hf_hub_download
 import gradio as gr
 import spaces
 torch._dynamo.config.cache_size_limit = 64
 # Define a function to download weights if not present
+def download_infinity_weights(weights_path):
     try:
         model_file = weights_path / 'infinity_2b_reg.pth'
         if not model_file.exists():
 # Set up paths
 weights_path = Path(__file__).parent / 'weights'
 weights_path.mkdir(exist_ok=True)
+download_infinity_weights(weights_path)
 # Device setup
 device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
     gr.Markdown("<h1><center>Infinity Image Generator</center></h1>")
     with gr.Row():
+        with gr.Column():
+            # Prompt Settings
+            gr.Markdown("### Prompt Settings")
+            prompt = gr.Textbox(label="Prompt", value="alien spaceship enterprise", placeholder="Enter your prompt here...")
+            enable_positive_prompt = gr.Checkbox(label="Enable Positive Prompt", value=False, info="Enhance prompts with positive attributes for faces.")
+            # Image Settings
+            gr.Markdown("### Image Settings")
+            with gr.Row():
+                cfg = gr.Slider(label="CFG (Classifier-Free Guidance)", minimum=1, maximum=10, step=0.5, value=3, info="Controls the strength of the prompt.")
+                tau = gr.Slider(label="Tau (Temperature)", minimum=0.1, maximum=1.0, step=0.1, value=0.5, info="Controls the randomness of the output.")
+            with gr.Row():
+                h_div_w = gr.Slider(label="Aspect Ratio (Height/Width)", minimum=0.5, maximum=2.0, step=0.1, value=1.0, info="Set the aspect ratio of the generated image.")
+                seed = gr.Number(label="Seed", value=random.randint(0, 10000), info="Set a seed for reproducibility.")
+            # Generate Button
+            generate_button = gr.Button("Generate Image", variant="primary")
+        with gr.Column():
+            # Output Section
+            gr.Markdown("### Generated Image")
+            output_image = gr.Image(label="Generated Image", type="pil")
+            gr.Markdown("**Tip:** Right-click the image to save it.")
+    # Error Handling
+    error_message = gr.Textbox(label="Error Message", visible=False)
+    # Link the generate button to the image generation function
     generate_button.click(
         generate_image,
         inputs=[prompt, cfg, tau, h_div_w, seed, enable_positive_prompt],

models/bsq_vae/vae.py CHANGED Viewed

@@ -1,7 +1,7 @@
 import argparse
 import torch
-from infinity.models.bsq_vae.flux_vqgan import AutoEncoder
 def load_cnn(model, state_dict, prefix, expand=False, use_linear=False):
     delete_keys = []

 import argparse
 import torch
+from models.bsq_vae.flux_vqgan import AutoEncoder
 def load_cnn(model, state_dict, prefix, expand=False, use_linear=False):
     delete_keys = []