Spaces:

sounar
/

ContactDoctor-API

Paused

App Files Files Community

sounar committed 16 days ago

Commit

acfc179

•

1 Parent(s): 2bdc9ef

Update app.py

Browse files

Files changed (1) hide show

app.py +24 -82

app.py CHANGED Viewed

@@ -1,91 +1,33 @@
-import os
 import torch
-from transformers import AutoModel, AutoTokenizer, BitsAndBytesConfig
-import gradio as gr
-from PIL import Image
-from torchvision.transforms import ToTensor
-# Read the Hugging Face access token from the HF_TOKEN environment variable.
-# NOTE(review): os.getenv returns None when HF_TOKEN is unset, so .strip()
-# would raise AttributeError at import time -- confirm the variable is always set.
-api_token = os.getenv("HF_TOKEN").strip()
-# Quantization configuration: 4-bit NF4 weights with double quantization,
-# computing in float16.
-bnb_config = BitsAndBytesConfig(
-    load_in_4bit=True,
-    bnb_4bit_quant_type="nf4",
-    bnb_4bit_use_double_quant=True,
-    bnb_4bit_compute_dtype=torch.float16
-)
-# Initialize model and tokenizer from the same checkpoint, both authenticated
-# with api_token and both loaded with trust_remote_code=True.
-model = AutoModel.from_pretrained(
-    "ContactDoctor/Bio-Medical-MultiModal-Llama-3-8B-V1",
-    quantization_config=bnb_config,
-    device_map="auto",
-    torch_dtype=torch.float16,
-    trust_remote_code=True,
-    attn_implementation="flash_attention_2",
-    token=api_token
-)
-tokenizer = AutoTokenizer.from_pretrained(
-    "ContactDoctor/Bio-Medical-MultiModal-Llama-3-8B-V1",
-    trust_remote_code=True,
-    token=api_token
-)
-def analyze_input(image, question):
-    """Ask the model a question about an optional image.
-
-    Args:
-        image: Image to analyze, or None. When given it is converted to RGB
-            (presumably a PIL image, per the Gradio input type -- verify).
-        question: Text placed next to the image in the single user message.
-
-    Returns:
-        {"status": "success", "response": <generated text>} on success, or
-        {"status": "error", "message": <str(exception)>} if anything raises.
-    """
-    try:
-        if image is not None:
-            # Convert to RGB if image is provided
-            image = image.convert('RGB')
-        # Prepare messages in the format expected by the model
-        # NOTE(review): when image is None the content list still contains
-        # None -- confirm model.chat accepts that.
-        msgs = [{'role': 'user', 'content': [image, question]}]
-        # Generate response using the chat method
-        response_stream = model.chat(
-            image=image,
-            msgs=msgs,
-            tokenizer=tokenizer,
-            sampling=True,
-            temperature=0.95,
-            stream=True
-        )
-        # Collect the streamed response, echoing each piece to stdout as it arrives
-        generated_text = ""
-        for new_text in response_stream:
-            generated_text += new_text
-            print(new_text, flush=True, end='')
-        return {"status": "success", "response": generated_text}
-    except Exception as e:
-        # Log the full traceback to stdout; the caller only gets the message.
-        import traceback
-        error_trace = traceback.format_exc()
-        print(f"Error occurred: {error_trace}")
-        return {"status": "error", "message": str(e)}
-# Create Gradio interface: an image upload and a pre-filled question box are
-# passed to analyze_input, and the dict it returns is shown in a JSON panel.
-demo = gr.Interface(
-    fn=analyze_input,
-    inputs=[
-        gr.Image(type="pil", label="Upload Medical Image"),
-        gr.Textbox(
-            label="Medical Question",
-            placeholder="Give the modality, organ, analysis, abnormalities (if any), treatment (if abnormalities are present)?",
-            value="Give the modality, organ, analysis, abnormalities (if any), treatment (if abnormalities are present)?"
-        )
-    ],
-    outputs=gr.JSON(label="Analysis"),
-    title="Medical Image Analysis Assistant",
-    description="Upload a medical image and ask questions about it. The AI will analyze the image and provide detailed responses."
-)
-# Launch the Gradio app only when this file is run as a script, serving on
-# 0.0.0.0:7860 with share=True.
 if __name__ == "__main__":
-    demo.launch(
-        share=True,
-        server_name="0.0.0.0",
-        server_port=7860
-    )

+from transformers import AutoTokenizer, AutoModelForCausalLM
 import torch
+# Load the tokenizer and the causal-LM model for the checkpoint once, at
+# import time, using the library's default loading options.
+# NOTE(review): the model is not moved to any device here -- confirm it ends
+# up on the same device as the inputs built in generate_response.
+# NOTE(review): the previous version of this file loaded the same checkpoint
+# with trust_remote_code=True and an access token -- confirm neither is needed.
+model_name = "ContactDoctor/Bio-Medical-MultiModal-Llama-3-8B-V1"
+tokenizer = AutoTokenizer.from_pretrained(model_name)
+model = AutoModelForCausalLM.from_pretrained(model_name)
+def generate_response(input_text, *, max_new_tokens=150, temperature=0.7):
+    """Generate a text completion for ``input_text``.
+
+    Args:
+        input_text: Prompt string fed to the model.
+        max_new_tokens: Upper bound on the number of generated tokens,
+            counted separately from the prompt so long prompts still get
+            a reply.
+        temperature: Sampling temperature passed to ``model.generate``.
+
+    Returns:
+        The first output sequence decoded with special tokens removed.
+    """
+    # Place the inputs on the model's own device: the model is never moved
+    # to CUDA in this file, so sending inputs to "cuda" mismatches devices.
+    inputs = tokenizer(input_text, return_tensors="pt").to(model.device)
+    # Unpack the whole encoding so the attention mask is passed along with
+    # the ids, and enable sampling: temperature is ignored when decoding
+    # greedily.
+    outputs = model.generate(
+        **inputs,
+        max_new_tokens=max_new_tokens,
+        do_sample=True,
+        temperature=temperature,
+    )
+    return tokenizer.decode(outputs[0], skip_special_tokens=True)
+from flask import Flask, request, jsonify
+from predict import generate_response  # import from the predict file
+app = Flask(__name__)
+@app.route("/predict", methods=["POST"])
+def predict():
+    """Handle POST /predict: run the model on the JSON body's "text" field.
+
+    Returns:
+        JSON {"response": <generated text>} on success, or JSON
+        {"error": "No input text provided"} with status 400 when the body is
+        not a JSON object or has no non-blank string under "text".
+    """
+    # silent=True yields None for a missing, malformed or non-JSON body
+    # instead of aborting, so every bad request gets the same JSON 400 reply.
+    data = request.get_json(silent=True)
+    # Valid JSON may still be a list, string or number; only objects have keys.
+    input_text = data.get("text") if isinstance(data, dict) else None
+    if not isinstance(input_text, str) or not input_text.strip():
+        return jsonify({"error": "No input text provided"}), 400
+    response = generate_response(input_text)
+    return jsonify({"response": response})
 if __name__ == "__main__":
+    # Start Flask's built-in server on port 5000 when run as a script.
+    # NOTE(review): the previous version served on 0.0.0.0:7860, and no host
+    # is passed here -- confirm this address is reachable where it is deployed.
+    app.run(port=5000)