Spaces:

h2oai
/

h2ovl-mississippi

Running on A10G

App Files Files Community

Shanshan Wang committed on Oct 18, 2024

Commit

80d1b7a

1 Parent(s): e753774

added preset prompts

Browse files

Files changed (1) hide show

app.py +55 -15

app.py CHANGED Viewed

@@ -21,6 +21,14 @@ model_paths = {
 }
 def load_model_and_set_image_function(model_name):
     # Get the model path from the model_paths dictionary
     model_path = model_paths[model_name]
@@ -227,6 +235,28 @@ with gr.Blocks() as demo:
             label="Select Model",
             value="H2OVL-Mississippi-2B"
         )
     # When the model selection changes, load the new model
     model_dropdown.change(
@@ -235,26 +265,28 @@ with gr.Blocks() as demo:
         outputs=[model_state]
     )
-    # Load the default model when the app starts
     demo.load(
         fn=load_model_and_set_image_function,
         inputs=[model_dropdown],
         outputs=[model_state]
     )
-    with gr.Row(equal_height=True):
-        # First column with image input
-        with gr.Column(scale=1):
-            image_input = gr.Image(type="filepath", label="Upload an Image")
-        # Second column with chatbot and user input
-        with gr.Column(scale=2):
-            chatbot = gr.Chatbot(label="Conversation")
-            user_input = gr.Textbox(label="What is your question",
-                                    placeholder="Type your message here",
-                                    interactive=True,
-                                    lines=1)
     with gr.Accordion('Parameters', open=False):
         with gr.Row():
@@ -329,7 +361,13 @@ with gr.Blocks() as demo:
         fn=clear_all,
         inputs=None,
         outputs=[chatbot, state, image_input, user_input]
-    )
     gr.Examples(
         examples=[
             ["assets/driver_license.png", "Extract the text from the image and fill the following json {'license_number':'',\n'full_name':'',\n'date_of_birth':'',\n'address':'',\n'issue_date':'',\n'expiration_date':'',\n}"],
@@ -338,6 +376,8 @@ with gr.Blocks() as demo:
             ["assets/CBA-1H23-Results-Presentation_wheel.png", "What is the efficiency of H2O.AI in document processing?"],
         ],
         inputs = [image_input, user_input],
         label = "examples",
     )
 demo.queue()

 }
+example_prompts = [
+    "Read the text and provide word by word ocr for the document. <doc>",
+    "Extract the text from the image.",
+    "Extract the text from the image and fill the following json {'license_number':'',\n'full_name':'',\n'date_of_birth':'',\n'address':'',\n'issue_date':'',\n'expiration_date':'',\n}",
+    "Please extract the following fields, and return the result in JSON format: supplier_name, supplier_address, customer_name, customer_address, invoice_number, invoice_total_amount, invoice_tax_amount",
+]
 def load_model_and_set_image_function(model_name):
     # Get the model path from the model_paths dictionary
     model_path = model_paths[model_name]
             label="Select Model",
             value="H2OVL-Mississippi-2B"
         )
+    with gr.Row(equal_height=True):
+        # First column with image input
+        with gr.Column(scale=1):
+            image_input = gr.Image(type="filepath", label="Upload an Image")
+        # Second column with chatbot and user input
+        with gr.Column(scale=2):
+            chatbot = gr.Chatbot(label="Conversation")
+            user_input = gr.Dropdown(label="What is your question",
+                                    choices = example_prompts,
+                                    value=None,
+                                    allow_custom_value=True,
+                                    interactive=True)
+    def reset_chatbot_state():
+        # reset chatbot and state
+        return [], None
     # When the model selection changes, load the new model
     model_dropdown.change(
         outputs=[model_state]
     )
+    model_dropdown.change(
+        fn=reset_chatbot_state,
+        inputs=None,
+        outputs=[chatbot, state]
+    )
+    # Reset chatbot and state when image input changes
+    image_input.change(
+        fn=reset_chatbot_state,
+        inputs=None,
+        outputs=[chatbot, state]
+    )
+        # Load the default model when the app starts
     demo.load(
         fn=load_model_and_set_image_function,
         inputs=[model_dropdown],
         outputs=[model_state]
     )
     with gr.Accordion('Parameters', open=False):
         with gr.Row():
         fn=clear_all,
         inputs=None,
         outputs=[chatbot, state, image_input, user_input]
+    )
+    def example_clicked(example):
+        image_value, user_input_value = example
+        return image_value, user_input_value, [], None  # Reset chatbot and state
     gr.Examples(
         examples=[
             ["assets/driver_license.png", "Extract the text from the image and fill the following json {'license_number':'',\n'full_name':'',\n'date_of_birth':'',\n'address':'',\n'issue_date':'',\n'expiration_date':'',\n}"],
             ["assets/CBA-1H23-Results-Presentation_wheel.png", "What is the efficiency of H2O.AI in document processing?"],
         ],
         inputs = [image_input, user_input],
+        outputs = [image_input, user_input, chatbot, state],
+        fn=example_clicked,
         label = "examples",
     )
 demo.queue()