import io import os import streamlit as st import requests from PIL import Image from model import get_caption_model, generate_caption import gradio as gr @st.cache(allow_output_mutation=True) def get_model(): return get_caption_model() caption_model = get_model() def predict(): captions = [] pred_caption = generate_caption('tmp.jpg', caption_model) captions.append(pred_caption) for _ in range(4): pred_caption = generate_caption('tmp.jpg', caption_model, add_noise=True) if pred_caption not in captions: captions.append(pred_caption) #finalc = ' '.join([str(elem) for elem in captions]) return captions; def launch(inputs): img = Image.open(requests.get(inputs, stream=True).raw) img = img.convert('RGB') st.image(img) img.save('tmp.jpg') o=predict() str1="" for ele in o: str1 += "\n"+ele os.remove('tmp.jpg') return str1 iface = gr.Interface(launch, inputs="text", outputs="text",) iface.launch(debug=True,)