Spaces:

jasperai
/

inversion-instantstyle

Running on Zero

App Files Files Community

baubin committed on Oct 2

Commit

dded383

•

1 Parent(s): b40fefa

examples, pin version

Browse files

Files changed (6) hide show

.gitignore +1 -0
app.py +34 -21
images/6.png +3 -0
images/7.png +3 -0
images/8.png +3 -0
requirements.txt +7 -5

.gitignore ADDED Viewed

	@@ -0,0 +1 @@


1	+ envs

app.py CHANGED Viewed

@@ -1,3 +1,4 @@
 import os
 import random
@@ -6,8 +7,12 @@ import numpy as np
 import PIL.Image
 import spaces
 import torch
-from diffusers import (AutoencoderKL, DDIMInverseScheduler, DDIMScheduler,
-                       StableDiffusionXLPipeline)
 from torchvision.transforms import ToTensor
 # pyright: reportPrivateImportUsage=false
@@ -15,7 +20,8 @@ from torchvision.transforms import ToTensor
 DESCRIPTION = f"""
     # 🎨 Inversion-InstantStyle 🎨
-    This is an interactive demo of noisy DDIM inversion capabilities on top of Instant-Style styling method. This was developed in the context of a style benchmark : [style-rank](https://gojasper.github.io/style-rank-project) by *Eyal Benaroche, Clément Chadebec, Onur Tasar, and Benjamin Aubin* from [Jasper Research](https://www.jasper.ai/) in the context of Eyal's internship with Ecole Polytechnique.
     """
 OPEN_SOURCE_PROMO = f"""
@@ -57,6 +63,8 @@ if gr.NO_RELOAD:
             "stabilityai/stable-diffusion-xl-base-1.0", subfolder="scheduler"
         )
         invert_scheduler = DDIMInverseScheduler(**forward_scheduler.config)
 css = """
     h1 {
@@ -175,15 +183,20 @@ def generate(
 examples_prompts = [
     "Astronaut in a jungle, detailed, 8k",
-    "A Bird",
-    "A Tiger",
-    "A Cat",
-    "cactus",
-    "A Panda",
 ]
-examples_images = [f"./images/{i}.png" for i in range(6)]
 examples = [[prompt, image] for prompt, image in zip(examples_prompts, examples_images)]
 with gr.Blocks(css=css) as demo:
@@ -197,7 +210,17 @@ with gr.Blocks(css=css) as demo:
             with gr.Column():
-                style_image = gr.Image()
                 noise_scale = gr.Slider(
                     label="Noise Scale",
@@ -210,16 +233,6 @@ with gr.Blocks(css=css) as demo:
         with gr.Blocks():
             with gr.Column():
-                with gr.Row():
-                    prompt = gr.Text(
-                        label="Prompt",
-                        show_label=False,
-                        max_lines=1,
-                        placeholder="Enter your prompt",
-                        container=False,
-                    )
-                    run_button = gr.Button("Run", scale=0)
                 result = gr.Image(label="Result", show_label=False)
     with gr.Accordion("Advanced options", open=False):

+import glob
 import os
 import random
 import PIL.Image
 import spaces
 import torch
+from diffusers import (
+    AutoencoderKL,
+    DDIMInverseScheduler,
+    DDIMScheduler,
+    StableDiffusionXLPipeline,
+)
 from torchvision.transforms import ToTensor
 # pyright: reportPrivateImportUsage=false
 DESCRIPTION = f"""
     # 🎨 Inversion-InstantStyle 🎨
+    This is an interactive demo of [Inversion-InstantStyle](https://gojasper.github.io/style-rank-project/#inversion_instantstyle), which combines DDIM inversion and renoising with the [Instant-Style](https://instantstyle.github.io/) styling method.
+    It was proposed in the context of our [Style-Rank](https://gojasper.github.io/style-rank-project) benchmark which evaluates training-free styling methods, by *Eyal Benaroche, Clément Chadebec, Onur Tasar, and Benjamin Aubin* from [Jasper Research](https://www.jasper.ai/) and [Ecole Polytechnique](https://www.polytechnique.edu/).
     """
 OPEN_SOURCE_PROMO = f"""
             "stabilityai/stable-diffusion-xl-base-1.0", subfolder="scheduler"
         )
         invert_scheduler = DDIMInverseScheduler(**forward_scheduler.config)
+    else:
+        raise ValueError("This demo does not work on CPU.")
 css = """
     h1 {
 examples_prompts = [
     "Astronaut in a jungle, detailed, 8k",
+    "A bird",
+    "A tiger",
+    "A cat",
+    "A cactus",
+    "A panda",
+    "A duck",
+    "An elephant",
+    "A dragon head",
 ]
+examples_images = glob.glob("./images/*.png")
+assert len(examples_images) == len(
+    examples_prompts
+), "Number of example images and prompts should match"
 examples = [[prompt, image] for prompt, image in zip(examples_prompts, examples_images)]
 with gr.Blocks(css=css) as demo:
             with gr.Column():
+                with gr.Row():
+                    prompt = gr.Text(
+                        label="Target prompt",
+                        show_label=False,
+                        max_lines=1,
+                        placeholder="Enter your prompt to generate new content",
+                        container=False,
+                    )
+                    run_button = gr.Button("Run", scale=0)
+                style_image = gr.Image(label="Style reference image")
                 noise_scale = gr.Slider(
                     label="Noise Scale",
         with gr.Blocks():
             with gr.Column():
                 result = gr.Image(label="Result", show_label=False)
     with gr.Accordion("Advanced options", open=False):

images/6.png ADDED Viewed

Git LFS Details

SHA256: 1cb23bbf5d35aad2bdad146b9f8623d237255baf3dfba38cffa5f613364e1c2a
Pointer size: 131 Bytes
Size of remote file: 254 kB

images/7.png ADDED Viewed

Git LFS Details

SHA256: ac6a2c9e41ebdac0f2bffdfe8adc87380afbe54196b8ac2326a6d7f05e2f3ef8
Pointer size: 131 Bytes
Size of remote file: 203 kB

images/8.png ADDED Viewed

Git LFS Details

SHA256: 04037fa01871e2c9f30f5b0dcdf21159299f94c94dd87ecf48a6de50e8f1a5d0
Pointer size: 131 Bytes
Size of remote file: 122 kB

requirements.txt CHANGED Viewed

@@ -1,12 +1,14 @@
 accelerate
 diffusers
 gradio==4.37.2
 numpy==1.26.4
 spaces
-torch==2.0.1
 torchvision
 transformers >= 4.34.0
-xformers
-ftfy
-peft==0.6.0
-optimum

 accelerate
 diffusers
+fastapi==0.112.2
+ftfy
 gradio==4.37.2
 numpy==1.26.4
+optimum
+peft==0.6.0
+pydantic
 spaces
+torch>=2.0.1
 torchvision
 transformers >= 4.34.0
+xformers