Spaces:
Paused
Paused
init
Browse files- llava/conversation.py +11 -11
- llava/serve/gradio_web_server.py +20 -15
llava/conversation.py
CHANGED
@@ -133,17 +133,17 @@ class Conversation:
|
|
133 |
image = image.resize((336, 336))
|
134 |
else:
|
135 |
raise ValueError(f"Invalid image_process_mode: {image_process_mode}")
|
136 |
-
if max(image.size) > max_len:
|
137 |
-
|
138 |
-
|
139 |
-
|
140 |
-
|
141 |
-
|
142 |
-
|
143 |
-
|
144 |
-
|
145 |
-
|
146 |
-
|
147 |
if return_pil:
|
148 |
return image
|
149 |
else:
|
|
|
133 |
image = image.resize((336, 336))
|
134 |
else:
|
135 |
raise ValueError(f"Invalid image_process_mode: {image_process_mode}")
|
136 |
+
# if max(image.size) > max_len:
|
137 |
+
# max_hw, min_hw = max(image.size), min(image.size)
|
138 |
+
# aspect_ratio = max_hw / min_hw
|
139 |
+
# shortest_edge = int(min(max_len / aspect_ratio, min_len, min_hw))
|
140 |
+
# longest_edge = int(shortest_edge * aspect_ratio)
|
141 |
+
# W, H = image.size
|
142 |
+
# if H > W:
|
143 |
+
# H, W = longest_edge, shortest_edge
|
144 |
+
# else:
|
145 |
+
# H, W = shortest_edge, longest_edge
|
146 |
+
# image = image.resize((W, H))
|
147 |
if return_pil:
|
148 |
return image
|
149 |
else:
|
llava/serve/gradio_web_server.py
CHANGED
@@ -61,7 +61,7 @@ def resize_image(image, default_width=(1344, 896), request_width=None):
|
|
61 |
from PIL import Image, ImageDraw
|
62 |
|
63 |
|
64 |
-
def draw_circle_on_image(image, x, y, radius=
|
65 |
"""
|
66 |
在给定的图片上绘制一个红色圆圈,并返回新的图片。如果 x, y 坐标不在图片范围内,
|
67 |
并且 y 超出了图片高度,则尝试将 y 减去 224;如果调整后的 y 仍然超出范围,则返回原图。
|
@@ -382,6 +382,7 @@ def http_bot(state, model_selector, temperature, top_p, max_new_tokens, request:
|
|
382 |
|
383 |
if len(all_images) > 0:
|
384 |
# 假设我们对第一张图片进行 resize 并展示
|
|
|
385 |
resized_image = draw_circle_on_image(resize_image(all_images[0]),original_coord[0],original_coord[1])
|
386 |
# state.append_message(state.roles[1], ("", resized_image,"Default"))
|
387 |
yield (state, state.to_gradio_chatbot(resized_image)) + (enable_btn,) * 5
|
@@ -425,8 +426,8 @@ block_css = """
|
|
425 |
}
|
426 |
|
427 |
#chatbot img {
|
428 |
-
max-width:
|
429 |
-
max-height:
|
430 |
width: auto; /* 保持宽度自适应 */
|
431 |
height: auto; /* 保持高度自适应 */
|
432 |
object-fit: contain; /* 保持图片宽高比,不失真 */
|
@@ -444,13 +445,14 @@ def build_demo(embed_mode, cur_dir=None, concurrency_count=1):
|
|
444 |
|
445 |
with gr.Row():
|
446 |
with gr.Column(scale=3):
|
447 |
-
with gr.Row(elem_id="model_selector_row"):
|
448 |
-
|
449 |
-
|
450 |
-
|
451 |
-
|
452 |
-
|
453 |
-
|
|
|
454 |
|
455 |
imagebox = gr.Image(type="pil")
|
456 |
image_process_mode = gr.Radio(
|
@@ -464,11 +466,14 @@ def build_demo(embed_mode, cur_dir=None, concurrency_count=1):
|
|
464 |
[f"{cur_dir}/amazon.jpg",f"Search bar at the top of the page"],
|
465 |
# [f"{cur_dir}/examples/waterview.jpg", "What are the things I should be cautious about when I visit here?"],
|
466 |
], inputs=[imagebox, textbox])
|
467 |
-
|
468 |
-
|
469 |
-
|
470 |
-
|
471 |
-
|
|
|
|
|
|
|
472 |
|
473 |
with gr.Column(scale=8):
|
474 |
chatbot = gr.Chatbot(
|
|
|
61 |
from PIL import Image, ImageDraw
|
62 |
|
63 |
|
64 |
+
def draw_circle_on_image(image, x, y, radius=20, color=(255, 0, 0)):
|
65 |
"""
|
66 |
在给定的图片上绘制一个红色圆圈,并返回新的图片。如果 x, y 坐标不在图片范围内,
|
67 |
并且 y 超出了图片高度,则尝试将 y 减去 224;如果调整后的 y 仍然超出范围,则返回原图。
|
|
|
382 |
|
383 |
if len(all_images) > 0:
|
384 |
# 假设我们对第一张图片进行 resize 并展示
|
385 |
+
|
386 |
resized_image = draw_circle_on_image(resize_image(all_images[0]),original_coord[0],original_coord[1])
|
387 |
# state.append_message(state.roles[1], ("", resized_image,"Default"))
|
388 |
yield (state, state.to_gradio_chatbot(resized_image)) + (enable_btn,) * 5
|
|
|
426 |
}
|
427 |
|
428 |
#chatbot img {
|
429 |
+
max-width: 80%; /* 宽图片根据宽度调整 */
|
430 |
+
max-height: 80vh; /* 高图片根据视口高度调整 */
|
431 |
width: auto; /* 保持宽度自适应 */
|
432 |
height: auto; /* 保持高度自适应 */
|
433 |
object-fit: contain; /* 保持图片宽高比,不失真 */
|
|
|
445 |
|
446 |
with gr.Row():
|
447 |
with gr.Column(scale=3):
|
448 |
+
# with gr.Row(elem_id="model_selector_row"):
|
449 |
+
# model_selector = gr.Dropdown(
|
450 |
+
# choices=models,
|
451 |
+
# value=models[0] if len(models) > 0 else "",
|
452 |
+
# interactive=True,
|
453 |
+
# show_label=False,
|
454 |
+
# container=False)
|
455 |
+
model_selector="llava-v1.5-UGround_v1"
|
456 |
|
457 |
imagebox = gr.Image(type="pil")
|
458 |
image_process_mode = gr.Radio(
|
|
|
466 |
[f"{cur_dir}/amazon.jpg",f"Search bar at the top of the page"],
|
467 |
# [f"{cur_dir}/examples/waterview.jpg", "What are the things I should be cautious about when I visit here?"],
|
468 |
], inputs=[imagebox, textbox])
|
469 |
+
temperature=0
|
470 |
+
top_p=0.7
|
471 |
+
max_output_tokens=16384
|
472 |
+
#
|
473 |
+
# with gr.Accordion("Parameters", open=False) as parameter_row:
|
474 |
+
# temperature = gr.Slider(minimum=0.0, maximum=1.0, value=0.2, step=0.1, interactive=True, label="Temperature",)
|
475 |
+
# top_p = gr.Slider(minimum=0.0, maximum=1.0, value=0.7, step=0.1, interactive=True, label="Top P",)
|
476 |
+
# max_output_tokens = gr.Slider(minimum=0, maximum=1024, value=512, step=64, interactive=True, label="Max output tokens",)
|
477 |
|
478 |
with gr.Column(scale=8):
|
479 |
chatbot = gr.Chatbot(
|