File size: 20,552 Bytes
7cbf24f |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 |
import os
import cv2
import gradio as gr
import numpy as np
import random
import base64
import requests
import json
import time
def portrait_gen(person_img, template_img, prompt, seed, randomize_seed):
post_start_time = time.time()
if person_img is None:
gr.Warning("Empty Person image")
return None, None, "Empty image"
if randomize_seed:
seed = random.randint(0, MAX_SEED)
encoded_person_img = cv2.imencode('.jpg', cv2.cvtColor(person_img, cv2.COLOR_RGB2BGR))[1].tobytes()
encoded_person_img = base64.b64encode(encoded_person_img).decode('utf-8')
encoded_template_img = None
if template_img is not None:
# style image with fixed hidden prompt
prompt_temp = imgpath_to_prompt(template_img)
if prompt_temp is not None:
prompt = prompt_temp
encoded_template_img = cv2.imencode('.jpg', cv2.imread(template_img))[1].tobytes()
encoded_template_img = base64.b64encode(encoded_template_img).decode('utf-8')
url = "http://" + os.environ['avatar_url'] + "Submit"
token = os.environ['token']
referer = os.environ['referer']
headers = {'Content-Type': 'application/json', 'token': token, 'referer': referer}
data = {
"templateImage": encoded_template_img,
"humanImage": encoded_person_img,
"seed": seed,
"prompt": prompt
}
try:
response = requests.post(url, headers=headers, data=json.dumps(data), timeout=50)
# print("post response code", response.status_code)
if response.status_code == 200:
result = response.json()['result']
status = result['status']
if status == "success":
uuid = result['result']
# print(uuid)
except Exception as err:
print(f"Post Exception Error: {err}")
raise gr.Error("Too many users, please try again later")
post_end_time = time.time()
print(f"post time used: {post_end_time-post_start_time}")
get_start_time =time.time()
time.sleep(9)
Max_Retry = 12
result_img = None
info = ""
err_log = ""
for i in range(Max_Retry):
try:
url = "http://" + os.environ['avatar_url'] + "Query?taskId=" + uuid
response = requests.get(url, headers=headers, timeout=20)
# print("get response code", response.status_code)
if response.status_code == 200:
result = response.json()['result']
status = result['status']
if status == "success":
result = base64.b64decode(result['result'])
result_np = np.frombuffer(result, np.uint8)
result_img = cv2.imdecode(result_np, cv2.IMREAD_UNCHANGED)
result_img = cv2.cvtColor(result_img, cv2.COLOR_RGB2BGR)
info = "Success"
break
elif status == "error":
err_log = f"Status is Error"
info = "Error"
break
else:
# print(response.text)
err_log = "URL error, pleace contact the admin"
info = "URL error, pleace contact the admin"
break
except requests.exceptions.ReadTimeout:
err_log = "Http Timeout"
info = "Http Timeout, please try again later"
except Exception as err:
err_log = f"Get Exception Error: {err}"
time.sleep(1)
get_end_time = time.time()
print(f"get time used: {get_end_time-get_start_time}")
print(f"all time used: {get_end_time-get_start_time+post_end_time-post_start_time}")
if info == "":
err_log = f"No image after {Max_Retry} retries"
info = "Too many users, please try again later"
if info != "Success":
print(f"Error Log: {err_log}")
gr.Warning("Too many users, please try again later")
return result_img, seed, info
MAX_SEED = 999999
example_path = os.path.join(os.path.dirname(__file__), 'assets')
refer_list = sorted(os.listdir(os.path.join(example_path,"refer_imgs")))
refer_list_path = [os.path.join(example_path,"refer_imgs",garm) for garm in refer_list]
human_list = sorted(os.listdir(os.path.join(example_path,"id_imgs")))
human_list_path = [os.path.join(example_path,"id_imgs",human) for human in human_list]
prompt_list = [
"Half-length close-up of a beautiful girl, dressed in the Hogwarts uniform from the Harry Potter series, wearing a blue cloak with a crest that appears to be the Gryffindor house emblem, along with a white shirt and a red-and-gold striped tie. She is holding a majic wand, the hair is long and wavy, and the background consists of a wooden wall with several books and a framed picture placed on a wooden desk. This setting evokes an atmosphere similar to a cozy study room or a magical classroom.",
"WM,Anime Magic,an anime girl holding glowing blue poker cards in her hands,poker cards flying in the sky,glowing magic effects,dynamic poses,highly detailed,ultra-high resolutions,32K UHD,best quality,masterpiece..The background features a full majic moon casting a soft glow, accentuating the ethereal majic ambiance.",
"A serene beauty stands in a studio awash with soft, golden light. Her wavy brunette hair cascades over her shoulders, while her piercing blue eyes gaze into the distance, filled with quiet contemplation. She wears a delicate, flowing white dress that seems to shimmer in the gentle glow, exuding an aura of pure elegance and grace , the classic film filter applied to the image imparts a nostalgic and gritty texture,highlighting the enduring allure of youth culture and fashion. the background provide a rich,textured setting,further emphasizing the unique style and attitude of the subject. Shot with a Fujifilm X-Pro3 camera,HDR,UHD,8K,best quality,best quality,masterpiece,realistic,cute face,smug,naughty face,light blush,giggling,backlighting,rim_light,moody lighting,",
"A man wear an Argentina shirt with No. 7, holds up the World Cup, surrounded by golden rain. The man is laughing with a gold medal around their neck. The background showcases a large stadium filled with spectators, illuminated by bright lights and surrounded by a celebratory shower of confetti. The overall atmosphere is one of triumph and celebration",
"anime epic cinematic shot of dynamic, The transatlantic slave trade, dramatic lighting, Technicolor, in motion, main subject of high budget action movie, raw photo, motion blur, best quality, high resolution, aidmaMJ6.1, an angel with wings and armor holding a spear in front of him flies at a demon, the demon, spreading his arms, yells at the angel,",
"Sci-fi style digital art image showing a knight in futuristic armor riding a motorcycle on a city street. The protagonist is located in the center right position, wearing a black, metallic tight armor. The surface of the armor is covered with raindrops and water stains, indicating that it has just experienced a heavy rain. His posture is leaning forward, holding the handlebars tightly with both hands, which makes him look very focused and full of power. The design of the motorcycle is very futuristic, with smooth body lines, bright red light from the headlights, and the right side mirror also reflects the ambient light. The tires of the motorcycle are wide and the tread pattern is clearly visible, which echoes the slippery road surface. The background is a city street scene with tall buildings, and the buildings are covered with colorful neon billboards. Various words and patterns are blurred against the sky in the distance. Some larger billboards with red and blue words can be seen on the left; on the right, there are more small billboards with various colors but not very clear. There are other pedestrians on the street. Although they are far away, their figures can be distinguished. Most of them have their backs to the camera and walk towards the distant buildings. The rain-soaked ground in the entire scene reflects the surrounding lights, adding depth and three-dimensionality to the picture. The details of the buildings in the background are slightly blurred, presenting a hazy feeling, highlighting the protagonist and his motorcycle in the foreground. The overall tone of the picture is cold, mainly black and gray, supplemented by red and blue light, forming a strong contrast effect. The high color saturation, moderate brightness, and uniform exposure give the picture a strong visual impact and a sense of futuristic technology. This image successfully creates a futuristic urban scene full of dynamic and technological atmosphere through delicate detail depiction and vivid color use.",
# "a person wearing a light brown coat, a white shirt, a dark pleated short skirt, and a striped tie, showing off the long legs. The outfit is completed with knee-high white socks and black leather shoes. The individual is standing on a pathway that is covered with yellow fallen leaves, surrounded by trees that have yellow leaves still attached. The trees are planted along both sides of the pathway, creating a picturesque autumn scene. The trunks of the trees are painted white at the base. The overall setting appears to be a serene autumnal day, with bright and warm lighting",
"Chinese pretty girl, with long, dark, wavy hair cascading over the shoulders, a sleeveless, knitted blue top with a high neck. The background is a gradient of various shades of blue, with a subtle texture that gives it a studio portrait appearance. The lighting is soft, illuminating the individual from the front, creating a calm and serene ambiance.",
"A person dressed in a sleek, black turtleneck sweater and a matching black suit jacket. The outfit conveys a sophisticated and formal style. The background is a solid olive green color, which contrasts subtly with the dark clothing. The hair appears to be dark and styled in a slightly tousled manner, adding a casual touch to the otherwise formal attire.",
"The upper body of a person wearing a plain, vibrant red, long-sleeved sweater. The sweater has a round neckline with a ribbed texture. The person has black hair that appears to be slightly tousled. The background of the image is plain and neutral, likely a light gray or white color, providing a clean and simple backdrop that contrasts with the rich color of the sweater. The image conveys a sense of casual yet stylish attire.",
]
prompt_list_examples = [
'hold a sign writing "Kolors Portrait with Flux"',
'The millionaire flung wads of cash in the air like confetti at the crowded nightclub, making it rain on the ecstatic revellers below.',
'Wearing Iron Man costume, in fantastic space, with stars twinkling, ultra-high resolutions,32K UHD,best quality,masterpiece',
'a person sitting on the ground in a forest or park during autumn. The ground is covered with fallen leaves in shades of yellow and brown. They are wearing a cozy cream-colored knit sweater and jeans. Their hair is long and brown, reaching past their shoulders. In one hand, they hold up a yellow maple leaf, while the other hand rests on their lap, also holding a leaf. The background features trees with yellow leaves, indicating the fall season, and the sunlight filters through the foliage, casting a warm, golden light on the scene. The atmosphere is serene and picturesque, capturing the essence of autumn.',
'A masterpiece of dreamy photography. The girl holds a glowing glass jar in her hands, which emits a soft yellow light, illuminating her face and the surrounding environment. She wears a white lace dress with blue and pink decorations and a light blue bow tied around her waist. The girl wears a white headdress dotted with blue and pink flowers and carries twinkling blue wings on her back. Behind the girl, you can see a vast sea of flowers, which sparkle with pink and gold light and are scattered on the green grass. The sky is full of sparkling stars, from the upper left corner to the lower right corner, as if the Milky Way is scattered in the night sky. The overall light is soft and full of magical colors, making the whole picture look like a fairy tale world.',
]
prompt_list_single = [
'hold a sign writing "Kolors Portrait with Flux"',
"A beautiful girl reading book, high quality.",
"Full body shot of young Asian face woman in sun hat and white dress standing on sunny beach with sea and mountains in background, high quality, sharp focus,",
]
css="""
#col-left {
margin: 0 auto;
max-width: 270px;
}
#col-mid {
margin: 0 auto;
max-width: 270px;
}
#col-right {
margin: 0 auto;
max-width: 550px;
}
#col-showcase {
margin: 0 auto;
max-width: 1100px;
}
#col-left-left {
margin: 0 auto;
max-width: 400px;
}
#col-left-right {
margin: 0 auto;
max-width: 120px;
}
#button {
color: blue;
}
"""
def img_to_prompt(img_path,prompt):
if img_path is None:
# return prompt,prompt_final
return prompt
else:
return None
def imgpath_to_prompt(img_path):
img_name = img_path.split("/")[-1]
if img_name in refer_list:
prompt_id = refer_list.index(img_name)
prompt_final = prompt_list[prompt_id]
else:
prompt_final = None
return prompt_final
def text_to_text(text1, text2):
if text1 is not None:
return text1
else:
return text2
def load_description(fp):
with open(fp, 'r', encoding='utf-8') as f:
content = f.read()
return content
def img_close():
return None
def change_mode(mode: str):
if mode == "Input prompt":
return gr.update(visible=True), gr.update(visible=False, value=None)
elif mode == "Ref. image":
return gr.update(visible=False, value=""), gr.update(visible=True)
else:
raise gr.Error("no such mode!")
change_mode_js = """
function change_mode_js(...args){
mode = args[0];
console.log("change_mode");
text_examples = document.querySelector("#text_examples");
image_examples = document.querySelector("#image_examples");
ref_examples = document.querySelector("#ref_examples");
prompt_examples = document.querySelector("#prompt_examples");
if (mode === "Input prompt"){
text_examples.hidden = false;
prompt_examples.hidden = false;
image_examples.hidden = true;
ref_examples.hidden = true;
}else {
text_examples.hidden = true;
prompt_examples.hidden = true;
image_examples.hidden = false;
ref_examples.hidden = false;
}
return args
}
"""
with gr.Blocks(css=css) as Portrait:
gr.HTML(load_description("title.md"))
with gr.Row():
with gr.Column(elem_id = "col-left"):
gr.HTML("""
<div style="display: flex; justify-content: center; align-items: center; text-align: center; font-size: 20px;">
<div>
Step 1. Upload a portrait image ⬇️
</div>
</div>
""")
with gr.Column(elem_id = "col-mid"):
gr.HTML("""
<div style="display: flex; justify-content: center; align-items: center; text-align: center; font-size: 20px;">
<div>
Step 2. Set a style reference ⬇️
</div>
</div>
""")
with gr.Column(elem_id = "col-right"):
gr.HTML("""
<div style="display: flex; justify-content: center; align-items: center; text-align: center; font-size: 20px;">
<div>
Step 3. Press “Run” to get results ⬇️
</div>
</div>
""")
with gr.Row():
with gr.Column(elem_id = "col-left"):
imgs = gr.Image(label="Person Images", sources='upload', type="numpy",width=400)
example = gr.Examples(
inputs=imgs,
examples_per_page=10,
examples=human_list_path,
label="Person Images"
)
with gr.Column(elem_id = "col-mid"):
# gr.HTML("""
# <div style="display: flex; justify-content: center; align-items: center; text-align: center; font-size: 15px;">
# <div>
# Use image <strong>OR!!!</strong> text as reference style.
# </div>
# </div>
# """)
mode = gr.Radio(label="Set a reference image or input prompt", choices=["Ref. image", "Input prompt"], value="text")
refer_img = gr.Image(label="Reference images", sources='upload', type="filepath")
example = gr.Examples(
inputs=refer_img,
examples_per_page=9,
examples=refer_list_path,
label = 'Reference images',
elem_id="ref_examples"
)
prompt = gr.Text(
label="Input prompts",
show_label=False,
max_lines=1,
placeholder="Enter your prompt",
container=False,
)
examples_prompt = gr.Examples(
inputs=prompt,
examples=prompt_list_single,
label = 'Input prompts',
elem_id="prompt_examples"
)
Portrait.load(
fn=lambda: gr.update(value="Ref. image"),
outputs=[mode],
show_progress=False
)
mode.change(
js=change_mode_js,
fn=change_mode,
inputs=[mode],
outputs=[prompt, refer_img],
show_progress=False
)
with gr.Column(elem_id = "col-right"):
image_out = gr.Image(label="Results", show_share_button=False)
with gr.Row():
seed = gr.Slider(
label="Seed",
minimum=0,
maximum=MAX_SEED,
step=1,
value=0,
)
randomize_seed = gr.Checkbox(label="Random seed", value=True)
with gr.Row():
seed_used = gr.Number(label="Seed used")
result_info = gr.Text(label="Response")
test_button = gr.Button(value="Run", elem_id="button")
test_button.click(fn=portrait_gen, inputs=[imgs, refer_img, prompt, seed, randomize_seed], outputs=[image_out, seed_used, result_info], api_name=False)
with gr.Column(elem_id = "col-showcase"):
gr.HTML("""
<div style="display: flex; justify-content: center; align-items: center; text-align: center; font-size: 20px;">
<div> </div>
<br>
<br>
<div>
Portrait examples in pairs of person images and style.
</div>
</div>
""")
image_show_case = gr.Examples(
examples=[
[human_list_path[5], refer_list_path[0], os.path.join(example_path, 'outputs/190815.jpg')],
[human_list_path[6], refer_list_path[1], os.path.join(example_path, 'outputs/190811.jpg')],
[human_list_path[2], refer_list_path[3], os.path.join(example_path, 'outputs/190813.jpg')],
[human_list_path[0], refer_list_path[4], os.path.join(example_path, 'outputs/190814.jpg')],
],
inputs=[imgs, refer_img, image_out],
label=None,
elem_id="image_examples"
)
text_show_case = gr.Examples(
examples=[
[human_list_path[6], prompt_list_examples[0], os.path.join(example_path, 'outputs/190820.jpg')],
[human_list_path[4], prompt_list_examples[1], os.path.join(example_path, 'outputs/190812.jpg')],
[human_list_path[3], prompt_list_examples[2], os.path.join(example_path, 'outputs/190816.jpg')],
[human_list_path[7], prompt_list_examples[3], os.path.join(example_path, 'outputs/190818.jpg')],
[human_list_path[8], prompt_list_examples[4], os.path.join(example_path, 'outputs/190819.jpg')],
],
inputs=[imgs, prompt, image_out],
label=None,
elem_id="text_examples"
)
Portrait.queue(api_open=False).launch(show_api=False)
|