|
from typing import Optional |
|
|
|
import numpy as np |
|
import cv2 |
|
import streamlit as st |
|
from PIL import Image |
|
import os |
|
import tempfile |
|
|
|
from sdfile import PIPELINES, generate |
|
|
|
# Text pre-filled in the "Prompt" text area.
DEFAULT_PROMPT = "belted shirt black belted portrait-collar wrap blouse with black prints"

# Default image dimensions (presumably pixels; not referenced in the visible
# part of this file).
DEFAULT_WIDTH, DEFAULT_HEIGHT = 512, 512
# Backward-compatible alias: the width constant was originally defined under
# this misspelled name, so keep it for any code that still imports it.
DEAFULT_WIDTH = DEFAULT_WIDTH

# st.session_state keys used by get_image() / set_image().
OUTPUT_IMAGE_KEY = "output_img"
LOADED_IMAGE_KEY = "loaded_img"
|
|
|
def get_image(key: str) -> Optional[Image.Image]:
    """Return the value stored in ``st.session_state`` under *key*.

    Args:
        key: Session-state key to look up.

    Returns:
        The stored value, or ``None`` when *key* is not present.
    """
    return st.session_state.get(key)
|
|
|
def set_image(key: str, img: Image.Image) -> None:
    """Store *img* in ``st.session_state`` under *key*.

    Args:
        key: Session-state key to write.
        img: Image to remember; any previous value under *key* is replaced.
    """
    st.session_state[key] = img
|
|
|
def prompt_and_generate_button(prefix, pipeline_name: PIPELINES, **kwargs):
    """Render the prompt controls and a button that triggers generation.

    Args:
        prefix: String prepended to every widget key created here.
        pipeline_name: Passed to ``generate`` as its second positional
            argument.
        **kwargs: Extra keyword arguments forwarded unchanged to
            ``generate``.

    When the button is pressed, ``generate`` is called with the current
    widget values, a copy of the result is stored in session state under
    ``OUTPUT_IMAGE_KEY``, and the result is displayed.
    """
    prompt = st.text_area("Prompt", value=DEFAULT_PROMPT, key=f"{prefix}-prompt")
    negative_prompt = st.text_area(
        "Negative prompt",
        value="",
        key=f"{prefix}-negative_prompt",
    )

    steps_col, guidance_col = st.columns(2)
    with steps_col:
        steps = st.slider(
            "Number of inference steps",
            min_value=1,
            max_value=200,
            value=30,
            key=f"{prefix}-inference-steps",
        )
    with guidance_col:
        guidance_scale = st.slider(
            "Guidance scale",
            min_value=0.0,
            max_value=20.0,
            value=7.5,
            step=0.5,
            key=f"{prefix}-guidance-scale",
        )
    enable_cpu_offload = st.checkbox(
        "Enable CPU offload if you run out of memory",
        key=f"{prefix}-cpu-offload",
        value=False,
    )

    # Nothing more to do until the user asks for an image.
    if not st.button("Generate Image", key=f"{prefix}-btn"):
        return

    generation_options = {
        "negative_prompt": negative_prompt,
        "num_inference_steps": steps,
        "guidance_scale": guidance_scale,
        "enable_cpu_offload": enable_cpu_offload,
    }
    with st.spinner("Generating image ..."):
        image = generate(prompt, pipeline_name, **generation_options, **kwargs)
        # Store a copy so the remembered output is independent of `image`.
        set_image(OUTPUT_IMAGE_KEY, image.copy())
    st.image(image)
|
def width_and_height_sliders(prefix):
    """Render side-by-side "Width" and "Height" sliders.

    Args:
        prefix: String prepended to both widget keys.

    Returns:
        A ``(width, height)`` tuple with the current slider values.
    """
    # Both sliders share the same range, step and initial value.
    size_options = {"min_value": 64, "max_value": 1600, "step": 16, "value": 512}

    width_col, height_col = st.columns(2)
    with width_col:
        width = st.slider("Width", key=f"{prefix}-width", **size_options)
    with height_col:
        height = st.slider("Height", key=f"{prefix}-height", **size_options)
    return width, height
|
|
|
def image_uploader(prefix):
    """Show a JPG/PNG file uploader and return the selected image.

    Args:
        prefix: String prepended to the uploader's widget key.

    Returns:
        The uploaded file opened with ``Image.open``; when nothing has been
        uploaded, whatever ``get_image(LOADED_IMAGE_KEY)`` returns.
    """
    uploaded_file = st.file_uploader(
        "Image", ["jpg", "png"], key=f"{prefix}-uploader"
    )
    if not uploaded_file:
        # No upload: fall back to the image remembered in session state.
        return get_image(LOADED_IMAGE_KEY)

    image = Image.open(uploaded_file)
    print(f"loaded input image of size ({image.width}, {image.height})")
    return image
|
|
|
def sketching():
    """Turn the uploaded image into a black-and-white sketch.

    Renders the "sketch2img" uploader, then converts the chosen image to
    grayscale, blurs it with a 5x5 Gaussian kernel and applies a mean
    adaptive threshold (block size 11, constant 2).

    Returns:
        A PIL image built from the thresholded array, or ``None`` when no
        input image is available.
    """
    image = image_uploader("sketch2img")
    # Return a single None: a (None, None) tuple is truthy and would make
    # callers that test the result believe a sketch exists.
    if image is None:
        return None

    # Convert in memory instead of round-tripping through a temporary JPEG:
    # saving as JPEG raises for images with an alpha channel or a palette
    # (common for PNG uploads) and adds compression artifacts.
    rgb = np.array(image.convert("RGB"))
    gray = cv2.cvtColor(rgb, cv2.COLOR_RGB2GRAY)
    blurred = cv2.GaussianBlur(gray, (5, 5), 0)
    sketch = cv2.adaptiveThreshold(
        blurred,
        255,
        cv2.ADAPTIVE_THRESH_MEAN_C,
        cv2.THRESH_BINARY,  # the constant is THRESH_BINARY, not THRES_BINARY
        11,
        2,
    )
    return Image.fromarray(sketch)
|
|
|
def txt2img_tab():
    """Lay out the text-to-image tab: size sliders, then prompt controls.

    The chosen width and height are forwarded to the generation call as
    keyword arguments.
    """
    tab_key = "txt2img"
    width, height = width_and_height_sliders(tab_key)
    prompt_and_generate_button(tab_key, "txt2img", width=width, height=height)
|
|
|
def sketching_tab():
    """Lay out the sketch-to-image tab.

    The left column holds the uploader that produces the sketch. The right
    column shows the conditioning-strength slider and the prompt controls,
    but only once a sketch image actually exists.
    """
    prefix = "sketch2img"
    upload_col, controls_col = st.columns(2)
    with upload_col:
        sketch_pil = sketching()
    with controls_col:
        # Check the type rather than truthiness: a non-image placeholder
        # such as (None, None) is truthy and would otherwise be passed on
        # to the generation call as if it were a sketch.
        if isinstance(sketch_pil, Image.Image):
            controlnet_conditioning_scale = st.slider(
                "Strength or dependence on the input sketch",
                min_value=0.0,
                max_value=1.0,
                value=0.5,
                step=0.05,
                key=f"{prefix}-controlnet_conditioning_scale",
            )
            prompt_and_generate_button(
                prefix,
                "sketch2img",
                sketch_pil=sketch_pil,
                controlnet_conditioning_scale=controlnet_conditioning_scale,
            )
|
|
|
def main():
    """Build the page: title, the two feature tabs, and the sidebar.

    The sidebar shows the image stored under ``OUTPUT_IMAGE_KEY`` in session
    state, or a placeholder message when there is none.
    """
    st.set_page_config(layout="wide")
    st.title("Fashion-SDX: Playground")

    text_tab, sketch_tab = st.tabs(["Text to image", "Sketch to image"])
    with text_tab:
        txt2img_tab()
    with sketch_tab:
        sketching_tab()

    with st.sidebar:
        st.header("Most Recent Output Image")
        latest_output = get_image(OUTPUT_IMAGE_KEY)
        if not latest_output:
            st.markdown("no output generated yet")
        else:
            st.image(latest_output)
|
# Run the app only when this file is executed as the entry script.
if __name__ == "__main__":
    main()