CogVLM

Running

App Files Files Community

lykeven committed on Sep 27, 2023

Commit

8d00201

1 Parent(s): d3049aa

add app

Browse files

Files changed (9) hide show

app.py +195 -0
examples/1.jpeg +0 -0
examples/1.png +0 -0
examples/2.jpeg +0 -0
examples/2.jpg +0 -0
examples/3.jpeg +0 -0
examples/3.jpg +0 -0
examples/example_inputs.jsonl +3 -0
style.css +7 -0

app.py ADDED Viewed

	@@ -0,0 +1,195 @@

+#!/usr/bin/env python
+import gradio as gr
+import os
+import re
+from PIL import Image
+import base64
+import time
+# Page heading (Markdown with inline HTML). The link text names CogVLM so it
+# agrees with the link target and with NOTES; it previously read "VisualGLM".
+# NOTE(review): not referenced by any code visible in this file.
+DESCRIPTION = '''# <a href="https://github.com/THUDM/CogVLM">CogVLM</a>'''
+# Troubleshooting hints, rendered with gr.Markdown in main().
+MAINTENANCE_NOTICE1 = 'Hint 1: If the app report "Something went wrong, connection error out", please turn off your proxy and retry.\nHint 2: If you upload a large size of image like 10MB, it may take some time to upload and process. Please be patient and wait.'
+# Attribution text, rendered with gr.Markdown at the bottom of the page in main().
+NOTES = 'This app is adapted from <a href="https://github.com/THUDM/CogVLM">https://github.com/THUDM/CogVLM</a>. It would be recommended to check out the repo if you want to see the detail of our model.'
+import json
+import requests
+import base64
+import hashlib
+# Initial chat history: a single greeting turn whose user message is empty.
+default_chatbox = [
+    ("", "Hi, What do you want to know about this image?"),
+]
+# Endpoint that post() sends requests to; None when the URL environment
+# variable is not set.
+URL = os.getenv("URL")
+def _encode_image(image, file_ext):
+    """Re-encode a PIL image and return ``(base64_text, sha256_hex)``.
+
+    The image is saved to a uniquely named temporary file whose suffix is
+    ``file_ext``, so the output format is chosen from the extension exactly
+    as before. The SHA-256 digest is computed over the base64-encoded bytes,
+    not over the raw file bytes.
+    """
+    import tempfile
+    # mkstemp gives every call its own path, so requests arriving within the
+    # same second can no longer overwrite or delete each other's file.
+    fd, filename = tempfile.mkstemp(suffix=file_ext)
+    os.close(fd)
+    try:
+        image.save(filename)
+        print(f"temporal filename {filename}")
+        with open(filename, "rb") as image_file:
+            encoded_bytes = base64.b64encode(image_file.read())
+    finally:
+        # Runs after the read handle is closed, and also when save() fails,
+        # so the temporary file is never left behind.
+        os.remove(filename)
+    encoded_img = str(encoded_bytes, encoding='utf-8')
+    image_hash = hashlib.sha256(encoded_bytes).hexdigest()
+    return encoded_img, image_hash
+def process_image(image_prompt):
+    """Resize the image at path ``image_prompt`` to 224x224 and encode it.
+
+    Returns:
+        ``(encoded_img, image_hash)``: the base64 text of the re-saved image
+        and the SHA-256 hex digest of that base64 data.
+    """
+    with Image.open(image_prompt) as image:
+        print(f"height:{image.height}, width:{image.width}")
+        resized_image = image.resize((224, 224))
+    file_ext = os.path.splitext(image_prompt)[1]
+    return _encode_image(resized_image, file_ext)
+def process_image_without_resize(image_prompt):
+    """Encode the image at path ``image_prompt`` at its original size.
+
+    The image is still re-saved through PIL before encoding, as it was
+    originally, so the result is not necessarily the uploaded file's bytes.
+
+    Returns:
+        ``(encoded_img, image_hash)``: the base64 text of the re-saved image
+        and the SHA-256 hex digest of that base64 data.
+    """
+    file_ext = os.path.splitext(image_prompt)[1]
+    with Image.open(image_prompt) as image:
+        print(f"height:{image.height}, width:{image.width}")
+        return _encode_image(image, file_ext)
+# Compiled once at import time; matches a run of characters in U+4E00-U+9FA5.
+_ZH_PATTERN = re.compile('[\u4e00-\u9fa5]+')
+def is_chinese(text):
+    """Return True if ``text`` contains a character in U+4E00-U+9FA5.
+
+    A plain bool is returned instead of the ``re.Match``/None the function
+    used to hand back; callers that only test truthiness are unaffected.
+    """
+    return _ZH_PATTERN.search(text) is not None
+def post(
+        input_text,
+        temperature,
+        top_p,
+        image_prompt,
+        result_previous,
+        hidden_image
+        ):
+    """Send one chat turn to the endpoint at URL and return the updated UI state.
+
+    Args:
+        input_text: Text prompt entered by the user.
+        temperature: Forwarded unchanged under the 'temperature' key.
+        top_p: Forwarded unchanged under the 'top_p' key.
+        image_prompt: Path of the current image, or None if there is none.
+        result_previous: Chat history as (user, bot) pairs; None is treated
+            as an empty history.
+        hidden_image: Hash of the image used on the previous call.
+
+    Returns:
+        ``(textbox_value, history, image_hash)``, matching the three outputs
+        this handler is wired to in main().
+    """
+    # Keep only turns with a non-empty user message; this drops the greeting
+    # placeholder and earlier "Text empty" notices from the history.
+    result_text = [(ele[0], ele[1]) for ele in (result_previous or []) if ele[0] != ""]
+    print(f"history {result_text}")
+    is_zh = is_chinese(input_text)
+    if image_prompt is None:
+        print("Image empty")
+        if is_zh:
+            result_text.append((input_text, '图片为空！请上传图片并重试。'))
+        else:
+            result_text.append((input_text, 'Image empty! Please upload a image and retry.'))
+        # The typed text is handed back so the user does not have to retype it.
+        return input_text, result_text, hidden_image
+    if input_text == "":
+        print("Text empty")
+        result_text.append((input_text, 'Text empty! Please enter text and retry.'))
+        return "", result_text, hidden_image
+    headers = {
+            "Content-Type": "application/json; charset=UTF-8",
+            "User-Agent": "Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/67.0.3396.87 Safari/537.36",
+        }
+    if image_prompt:
+        encoded_img, image_hash = process_image_without_resize(image_prompt)
+        print(f"image_hash:{image_hash}, hidden_image_hash:{hidden_image}")
+        # A different hash means a different image: start a fresh history.
+        if hidden_image is not None and image_hash != hidden_image:
+            print("image has been update")
+            result_text = []
+        hidden_image = image_hash
+    else:
+        encoded_img = None
+    print('开始请求...')
+    data = json.dumps({
+        'text': input_text,
+        'image': encoded_img,
+        'temperature': temperature,
+        'top_p': top_p,
+        'history': result_text
+    })
+    try:
+        response = requests.request("POST", URL, headers=headers, data=data, timeout=(60, 100)).json()
+        print('请求完毕...')
+        # Read the answer inside the try: a reply without a 'result' key (or
+        # one that is not a JSON object) now produces the retry message below
+        # instead of raising out of the handler.
+        answer = str(response['result'])
+    except Exception as e:
+        # Broad on purpose: this is the UI boundary, and every failure is
+        # reported to the user with the same retry message.
+        print("error message", e)
+        if is_zh:
+            result_text.append((input_text, '超时！请稍等几分钟再重试。'))
+        else:
+            result_text.append((input_text, 'Timeout! Please wait a few minutes and retry.'))
+        return "", result_text, hidden_image
+    result_text.append((input_text, answer))
+    print(result_text)
+    print('finished')
+    return "", result_text, hidden_image
+def clear_fn(value):
+    """Return the reset state for the Clear button; ``value`` is ignored.
+
+    Returns:
+        An empty string, the default greeting history and None, in that order.
+    """
+    cleared_text, cleared_image = "", None
+    return cleared_text, default_chatbox, cleared_image
+def clear_fn2(value):
+    """Return the default greeting history; ``value`` is ignored."""
+    greeting_history = default_chatbox
+    return greeting_history
+def main():
+    """Build the Gradio Blocks UI, wire up its event handlers and launch it."""
+    gr.close_all()
+    # One JSON object per line with "text" and "image" keys. Blank lines
+    # (e.g. a trailing empty line) are skipped instead of crashing json.loads,
+    # and the encoding is explicit so loading does not depend on the locale.
+    with open("./examples/example_inputs.jsonl", encoding="utf-8") as f:
+        examples = [json.loads(line) for line in f if line.strip()]
+    with gr.Blocks(css='style.css') as demo:
+        with gr.Row():
+            # Left column: prompt, buttons, image upload, sliders and hints.
+            with gr.Column(scale=4.5):
+                with gr.Group():
+                    input_text = gr.Textbox(label='Input Text', placeholder='Please enter text prompt below and press ENTER.')
+                    with gr.Row():
+                        run_button = gr.Button('Generate')
+                        clear_button = gr.Button('Clear')
+                    image_prompt = gr.Image(type="filepath", label="Image Prompt", value=None)
+                with gr.Row():
+                    temperature = gr.Slider(maximum=1, value=0.8, minimum=0, label='Temperature')
+                    top_p = gr.Slider(maximum=1, value=0.4, minimum=0, label='Top P')
+                with gr.Group():
+                    with gr.Row():
+                        with gr.Column(scale=7):
+                            maintenance_notice = gr.Markdown(MAINTENANCE_NOTICE1)
+                        with gr.Column(scale=2):
+                            change_button = gr.Button('Change hint to English', visible=False)
+            # Right column: conversation history plus a hidden field holding
+            # the hash of the last image sent by post().
+            with gr.Column(scale=5.5):
+                # Start from a copy of default_chatbox so the initial history
+                # always matches what the clear handlers reset it to.
+                result_text = gr.components.Chatbot(label='Multi-round conversation History', value=list(default_chatbox)).style(height=550)
+                hidden_image_hash = gr.Textbox(visible=False)
+        gr_examples = gr.Examples(examples=[[example["text"], example["image"]] for example in examples],
+                                  inputs=[input_text, image_prompt],
+                                  label="Example Inputs (Click to insert an examplet into the input box)",
+                                  examples_per_page=3)
+        gr.Markdown(NOTES)
+        print(gr.__version__)
+        # The Generate button and pressing ENTER in the textbox both call post().
+        run_button.click(fn=post,inputs=[input_text, temperature, top_p, image_prompt, result_text, hidden_image_hash],
+                         outputs=[input_text, result_text, hidden_image_hash])
+        input_text.submit(fn=post,inputs=[input_text, temperature, top_p, image_prompt, result_text, hidden_image_hash],
+                         outputs=[input_text, result_text, hidden_image_hash])
+        # The clear handlers ignore their argument; clear_button is passed
+        # only because an input component is supplied.
+        clear_button.click(fn=clear_fn, inputs=clear_button, outputs=[input_text, result_text, image_prompt])
+        # Uploading or removing an image resets the chat to the greeting.
+        image_prompt.upload(fn=clear_fn2, inputs=clear_button, outputs=[result_text])
+        image_prompt.clear(fn=clear_fn2, inputs=clear_button, outputs=[result_text])
+    demo.queue(concurrency_count=10)
+    demo.launch()
+if __name__ == '__main__':
+    main()

examples/1.jpeg ADDED Viewed

examples/1.png ADDED Viewed

examples/2.jpeg ADDED Viewed

examples/2.jpg ADDED Viewed

examples/3.jpeg ADDED Viewed

examples/3.jpg ADDED Viewed

examples/example_inputs.jsonl ADDED Viewed

	@@ -0,0 +1,3 @@

+{"id":1, "text": "Describe this image", "image": "examples/1.png"}
+{"id":2, "text": "What is written in the image?", "image": "examples/2.jpg"}
+{"id":3, "text": "How many houses are there in this cartoon?", "image": "examples/3.jpg"}

style.css ADDED Viewed

	@@ -0,0 +1,7 @@

+h1 {
+    text-align: center;
+  }
+  img#visitor-badge {
+    display: block;
+    margin: auto;
+  }