Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -14,7 +14,7 @@ def encode_image(img):
|
|
14 |
return encoded_string
|
15 |
|
16 |
# Function to get explanation from VLM API
|
17 |
-
def explain_image_with_vlm(image):
|
18 |
api = "https://api.hyperbolic.xyz/v1/chat/completions"
|
19 |
api_key = "eyJhbGciOiJIUzI1NiIsInR5cCI6IkpXVCJ9.eyJzdWIiOiJhZGlsYXppejIwMTNAZ21haWwuY29tIiwiaWF0IjoxNzMyODU1NDI1fQ.lRjbz9LMW9jj7Lf7I8m_dTRh4KQ1wDCdWiTRGErMuEk"
|
20 |
|
@@ -30,7 +30,7 @@ def explain_image_with_vlm(image):
|
|
30 |
{
|
31 |
"role": "user",
|
32 |
"content": [
|
33 |
-
{"type": "text", "text":
|
34 |
{
|
35 |
"type": "image_url",
|
36 |
"image_url": {"url": f"data:image/jpeg;base64,{base64_img}"},
|
@@ -90,16 +90,22 @@ def styled_header(header_text):
|
|
90 |
# Main Camera Input Section
|
91 |
img_file_buffer = st.camera_input("📷 Capture Your Image Here")
|
92 |
|
93 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
94 |
# Display captured image
|
95 |
image = Image.open(img_file_buffer)
|
96 |
-
|
97 |
-
|
98 |
|
99 |
st.markdown(styled_header("🤖 Image Analysis:"), unsafe_allow_html=True)
|
100 |
with st.spinner("🔍 The AI is analyzing your image. Please wait..."):
|
101 |
-
explanation = explain_image_with_vlm(image)
|
102 |
-
|
103 |
st.write(f"**AI Insight:** {explanation}")
|
104 |
|
105 |
# Footer
|
@@ -111,4 +117,4 @@ st.markdown(
|
|
111 |
</footer>
|
112 |
""",
|
113 |
unsafe_allow_html=True
|
114 |
-
)
|
|
|
14 |
return encoded_string
|
15 |
|
16 |
# Function to get explanation from VLM API
|
17 |
+
def explain_image_with_vlm(image, prompt):
|
18 |
api = "https://api.hyperbolic.xyz/v1/chat/completions"
|
19 |
api_key = "eyJhbGciOiJIUzI1NiIsInR5cCI6IkpXVCJ9.eyJzdWIiOiJhZGlsYXppejIwMTNAZ21haWwuY29tIiwiaWF0IjoxNzMyODU1NDI1fQ.lRjbz9LMW9jj7Lf7I8m_dTRh4KQ1wDCdWiTRGErMuEk"
|
20 |
|
|
|
30 |
{
|
31 |
"role": "user",
|
32 |
"content": [
|
33 |
+
{"type": "text", "text": prompt}, # Use the user-provided prompt
|
34 |
{
|
35 |
"type": "image_url",
|
36 |
"image_url": {"url": f"data:image/jpeg;base64,{base64_img}"},
|
|
|
90 |
# Main Camera Input Section
|
91 |
img_file_buffer = st.camera_input("📷 Capture Your Image Here")
|
92 |
|
93 |
+
# Text prompt input
|
94 |
+
user_prompt = st.text_input(
|
95 |
+
"📝 Enter your prompt (e.g., 'Explain the image', 'What are the functions in this graph?', 'Describe the scene'):",
|
96 |
+
value="Explain the image in 10 words only"
|
97 |
+
)
|
98 |
+
|
99 |
+
if img_file_buffer and user_prompt:
|
100 |
# Display captured image
|
101 |
image = Image.open(img_file_buffer)
|
102 |
+
st.markdown(styled_header("📸 Your Captured Image:"), unsafe_allow_html=True)
|
103 |
+
st.image(image, caption="Captured Image", use_column_width=True)
|
104 |
|
105 |
st.markdown(styled_header("🤖 Image Analysis:"), unsafe_allow_html=True)
|
106 |
with st.spinner("🔍 The AI is analyzing your image. Please wait..."):
|
107 |
+
explanation = explain_image_with_vlm(image, user_prompt)
|
108 |
+
st.success("✨ Analysis Complete!")
|
109 |
st.write(f"**AI Insight:** {explanation}")
|
110 |
|
111 |
# Footer
|
|
|
117 |
</footer>
|
118 |
""",
|
119 |
unsafe_allow_html=True
|
120 |
+
)
|