Spaces:

srivatsavdamaraju
/

minicpm_ggufmodel_api

Build error

srivatsavdamaraju committed on Oct 25

Commit

fa725d5

•

1 Parent(s): 25b37ff

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,42 +1,43 @@
 import gradio as gr
-from transformers import AutoModel, AutoTokenizer
-from PIL import Image
 import torch
-# Load the model and tokenizer
-model_path = "./ggml-model-IQ3_M.gguf"  # Adjust the path to your .gguf model
-model = AutoModel.from_pretrained(model_path, torch_dtype=torch.bfloat16)
-tokenizer = AutoTokenizer.from_pretrained(model_path)
-# Function to generate responses
-def generate_response(question, image=None):
-    # Tokenize the question input
-    inputs = tokenizer(question, return_tensors="pt")
-    # Process the image if provided
-    if image is not None:
-        image = Image.open(image).convert("RGB")
-        # You may need to preprocess the image here (e.g., resizing)
-    # Generate output from the model
-    with torch.no_grad():
-        output = model(**inputs)  # Adjust based on your model's input requirements
-    # Extract the response
-    response = output  # Modify this to match your model's output structure
-    return response  # Convert the response to a string if necessary
 # Create the Gradio interface
-interface = gr.Interface(
-    fn=generate_response,
     inputs=[
-        gr.Textbox(label="Enter your question"),
-        gr.Image(label="Upload an image", type="filepath")
     ],
     outputs="text",
-    title="MiniCPM Q&A Model",
-    description="Ask questions about the uploaded image."
 )
-# Launch the interface
-interface.launch()

 import gradio as gr
 import torch
+from PIL import Image
+from transformers import AutoModel, AutoTokenizer
+# Load the model and tokenizer from the local path
+model = AutoModel.from_pretrained('minicpm/models', trust_remote_code=True)
+tokenizer = AutoTokenizer.from_pretrained('minicpm/models', trust_remote_code=True)
+# Set the model to evaluation mode
+model.eval()
+def predict(image, question):
+    # Preprocess the image
+    image = image.convert('RGB')
+    # Create the message list
+    msgs = [{'role': 'user', 'content': question}]
+    # Generate a response
+    res = model.chat(
+        image=image,
+        msgs=msgs,
+        tokenizer=tokenizer,
+        sampling=True,
+        temperature=0.1
+    )
+    return res
 # Create the Gradio interface
+iface = gr.Interface(
+    fn=predict,
     inputs=[
+        gr.inputs.Image(type="pil", label="Upload an Image"),
+        gr.inputs.Textbox(label="Ask a Question")
     ],
     outputs="text",
+    title="Image Question Answering",
+    description="Upload an image and ask a question about it."
 )
+# Launch the app
+iface.launch()