sounar committed
Commit 8e90fc6
1 Parent(s): acfc179

Update app.py

Files changed (1)
  app.py +82 -24
app.py CHANGED
@@ -1,33 +1,91 @@
- from transformers import AutoTokenizer, AutoModelForCausalLM
  import torch

- # Load the model
- model_name = "ContactDoctor/Bio-Medical-MultiModal-Llama-3-8B-V1"
- tokenizer = AutoTokenizer.from_pretrained(model_name)
- model = AutoModelForCausalLM.from_pretrained(model_name)

- def generate_response(input_text):
-     # Tokenize input text
-     inputs = tokenizer(input_text, return_tensors="pt").to("cuda" if torch.cuda.is_available() else "cpu")
-     # Generate response
-     outputs = model.generate(inputs["input_ids"], max_length=150, temperature=0.7)
-     response = tokenizer.decode(outputs[0], skip_special_tokens=True)
-     return response


- from flask import Flask, request, jsonify
- from predict import generate_response  # import from the predict file

- app = Flask(__name__)

- @app.route("/predict", methods=["POST"])
- def predict():
-     data = request.get_json()
-     input_text = data.get("text")
-     if not input_text:
-         return jsonify({"error": "No input text provided"}), 400
-     response = generate_response(input_text)
-     return jsonify({"response": response})

  if __name__ == "__main__":
-     app.run(port=5000)
+ import os
  import torch
+ from transformers import AutoModel, AutoTokenizer, BitsAndBytesConfig
+ import gradio as gr
+ from PIL import Image
+ from torchvision.transforms import ToTensor

+ # Get API token from environment variable
+ api_token = os.getenv("HF_TOKEN").strip()

+ # Quantization configuration
+ bnb_config = BitsAndBytesConfig(
+     load_in_4bit=True,
+     bnb_4bit_quant_type="nf4",
+     bnb_4bit_use_double_quant=True,
+     bnb_4bit_compute_dtype=torch.float16
+ )

+ # Initialize model and tokenizer
+ model = AutoModel.from_pretrained(
+     "ContactDoctor/Bio-Medical-MultiModal-Llama-3-8B-V1",
+     quantization_config=bnb_config,
+     device_map="auto",
+     torch_dtype=torch.float16,
+     trust_remote_code=True,
+     attn_implementation="flash_attention_2",
+     token=api_token
+ )

+ tokenizer = AutoTokenizer.from_pretrained(
+     "ContactDoctor/Bio-Medical-MultiModal-Llama-3-8B-V1",
+     trust_remote_code=True,
+     token=api_token
+ )

+ def analyze_input(image, question):
+     try:
+         if image is not None:
+             # Convert to RGB if image is provided
+             image = image.convert('RGB')
+
+         # Prepare messages in the format expected by the model
+         msgs = [{'role': 'user', 'content': [image, question]}]
+
+         # Generate response using the chat method
+         response_stream = model.chat(
+             image=image,
+             msgs=msgs,
+             tokenizer=tokenizer,
+             sampling=True,
+             temperature=0.95,
+             stream=True
+         )
+
+         # Collect the streamed response
+         generated_text = ""
+         for new_text in response_stream:
+             generated_text += new_text
+             print(new_text, flush=True, end='')
+
+         return {"status": "success", "response": generated_text}
+
+     except Exception as e:
+         import traceback
+         error_trace = traceback.format_exc()
+         print(f"Error occurred: {error_trace}")
+         return {"status": "error", "message": str(e)}

+ # Create Gradio interface
+ demo = gr.Interface(
+     fn=analyze_input,
+     inputs=[
+         gr.Image(type="pil", label="Upload Medical Image"),
+         gr.Textbox(
+             label="Medical Question",
+             placeholder="Give the modality, organ, analysis, abnormalities (if any), treatment (if abnormalities are present)?",
+             value="Give the modality, organ, analysis, abnormalities (if any), treatment (if abnormalities are present)?"
+         )
+     ],
+     outputs=gr.JSON(label="Analysis"),
+     title="Medical Image Analysis Assistant",
+     description="Upload a medical image and ask questions about it. The AI will analyze the image and provide detailed responses."
+ )

+ # Launch the Gradio app
  if __name__ == "__main__":
+     demo.launch(
+         share=True,
+         server_name="0.0.0.0",
+         server_port=7860
+     )
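
For reference, the removed Flask version exposed a single POST /predict route that accepted JSON with a "text" field. A minimal client sketch for that old interface (hypothetical; the requests library and the example prompt are not part of the repo, and the URL assumes Flask's default localhost binding on port 5000):

import requests  # hypothetical client for the removed Flask endpoint

resp = requests.post(
    "http://127.0.0.1:5000/predict",   # matches the old app.run(port=5000)
    json={"text": "What are the common symptoms of iron-deficiency anemia?"},
    timeout=300,
)
resp.raise_for_status()                # the old route returned 400 when "text" was missing
print(resp.json()["response"])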
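
The new Gradio version can be exercised programmatically with gradio_client. A sketch under stated assumptions: the app is reachable at localhost:7860, the auto-generated endpoint name is /predict (verify with client.view_api()), handle_file is available (newer gradio_client releases; older ones accepted a plain file path), and the image path is hypothetical:

from gradio_client import Client, handle_file  # hypothetical client script, not part of the commit

client = Client("http://127.0.0.1:7860")  # matches demo.launch(server_port=7860)
result = client.predict(
    handle_file("chest_xray.png"),        # hypothetical local image file
    "Give the modality, organ, analysis, abnormalities (if any), treatment (if abnormalities are present)?",
    api_name="/predict",
)
print(result)  # dict with "status" plus "response" or "message"

Note that model.chat() is not a standard transformers API; it is custom code pulled in via trust_remote_code=True, so its exact keyword arguments are defined by the model repository.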
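
One fragility in the added code: os.getenv("HF_TOKEN").strip() raises AttributeError when HF_TOKEN is unset, masking the real cause. A hardening sketch that behaves identically when the token is present (the error message wording is an assumption, not from the commit):

api_token = os.getenv("HF_TOKEN", "").strip()  # default to "" rather than None
if not api_token:
    raise RuntimeError("HF_TOKEN is not set; add it as a Space secret or export it before launching.")

Relatedly, the torchvision ToTensor import is never used by the added code and could be dropped.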