Spaces:
Sleeping
Sleeping
File size: 1,381 Bytes
7617596 e82dff2 582115f c83f375 7617596 19327c9 7617596 64fb58a b734d92 818a4f8 3b61cce 818a4f8 c410fd7 818a4f8 359b3f0 818a4f8 64fb58a 582115f 818a4f8 582115f 45a5416 818a4f8 7617596 818a4f8 7617596 19327c9 64fb58a 3b61cce |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 |
#!/usr/bin/env python
from __future__ import annotations
import os
import gradio as gr
from app_caption import create_demo as create_demo_caption
from app_vqa import create_demo as create_demo_vqa
from prismer_model import build_deformable_conv, download_models
# Prepare model checkpoints.
# Both setup helpers run at import time, before any UI component is created.
# NOTE(review): presumably these fetch the checkpoints and build the
# deformable-convolution op -- confirm in prismer_model.
download_models()
build_deformable_conv()

# Markdown header rendered at the top of the demo page.
description = """
# Prismer
The official demo for **Prismer: A Vision-Language Model with Multi-Task Experts**.
Please refer to our [project page](https://shikun.io/projects/prismer) or [github](https://github.com/NVlabs/prismer) for more details.
Expert labels will be only computed once for the same image checked with md5sum.
"""

# When the SPACE_ID environment variable is set, append a "Duplicate Space"
# badge that links to this space's duplication URL.
if (SPACE_ID := os.getenv('SPACE_ID')) is not None:
    description += f'For faster inference without waiting in queue, you may duplicate the space and upgrade to GPU in settings. <a href="https://huggingface.co/spaces/{SPACE_ID}?duplicate=true"><img style="display: inline; margin-top: 0em; margin-bottom: 0em" src="https://bit.ly/3gLdBN6" alt="Duplicate Space" /></a>'

# Page layout: the description on top, then one tab per task. Each
# create_demo_* call is made inside its tab's context so the components it
# creates are attached to that tab.
with gr.Blocks(theme='sudeepshouche/minimalist') as demo:
    gr.Markdown(description)
    with gr.Tabs():
        with gr.TabItem('Zero-shot Image Captioning'):
            create_demo_caption()
        with gr.TabItem('Visual Question Answering'):
            create_demo_vqa()

# Enable request queuing (with api_open=False) and start the server once the
# layout above has been fully defined.
demo.queue(api_open=False).launch()
|