RamAnanth1 committed
Commit: 06c64f4
Parent: 77095ce

Update app.py

Files changed (1)
  1. app.py +7 -3
app.py CHANGED
@@ -4,12 +4,11 @@ import torch
 
 device = torch.device("cuda") if torch.cuda.is_available() else "cpu"
 
-
 model_name = "blip2_t5_instruct"
 model_type = "flant5xl"
 model, vis_processors, _ = load_model_and_preprocess(
-    name=args.model_name,
-    model_type=args.model_type,
+    name=model_name,
+    model_type=model_type,
     is_eval=True,
     device=device,
 )
@@ -47,6 +46,11 @@ theme = gr.themes.Monochrome(
 css = ".generating {visibility: hidden}"
 
 with gr.Blocks(theme=theme, analytics_enabled=False,css=css) as demo:
+    gr.Markdown(
+        """
+        Unofficial demo for InstructBLIP. InstructBLIP is a new vision-language instruction-tuning framework by Salesforce that uses BLIP-2 models, achieving state-of-the-art zero-shot generalization performance on a wide range of vision-language tasks.
+        """
+    )
     with gr.Column(scale=3):
         image_input = gr.Image(type="pil")
         prompt_textbox = gr.Textbox(label="Prompt:", placeholder="prompt", lines=2)
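After the fix, `name` and `model_type` point at the module-level variables defined just above the call rather than a nonexistent `args` namespace, so the LAVIS loader can run. A minimal sketch of how the loaded model and processors could back the Gradio widgets from the second hunk; the `generate` helper, the output textbox, the button, and the click wiring are illustrative assumptions, not part of this commit:

```python
import torch
import gradio as gr
from lavis.models import load_model_and_preprocess

device = torch.device("cuda") if torch.cuda.is_available() else "cpu"

# Same call as in the diff: plain module-level names, not args.* attributes.
model_name = "blip2_t5_instruct"
model_type = "flant5xl"
model, vis_processors, _ = load_model_and_preprocess(
    name=model_name,
    model_type=model_type,
    is_eval=True,
    device=device,
)

def generate(image, prompt):
    # Preprocess the PIL image coming from gr.Image(type="pil"), then run
    # instruction-conditioned generation; LAVIS models take a dict with
    # "image" and "prompt" keys and return a list of generated strings.
    image_tensor = vis_processors["eval"](image).unsqueeze(0).to(device)
    return model.generate({"image": image_tensor, "prompt": prompt})[0]

with gr.Blocks() as demo:
    with gr.Column(scale=3):
        image_input = gr.Image(type="pil")
        prompt_textbox = gr.Textbox(label="Prompt:", placeholder="prompt", lines=2)
        output_textbox = gr.Textbox(label="Output")       # assumed, not shown in the diff
        run_button = gr.Button("Run")                      # assumed, not shown in the diff
    run_button.click(generate, inputs=[image_input, prompt_textbox], outputs=output_textbox)
```

The commit itself only renames the two keyword arguments and adds the introductory `gr.Markdown` block; everything past the loader call above is an assumed completion of the surrounding app.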