Spaces:

xxx1
/

VQA_CAP_GPT

Runtime error

App Files Files Community

xxx1 committed on Feb 28, 2023

Commit

1d42b83

1 Parent(s): dc9a7dd

Create app.py

Browse files

Files changed (1) hide show

app.py +83 -0

app.py ADDED Viewed

	@@ -0,0 +1,83 @@

+import string
+import gradio as gr
+import requests
+import torch
+from transformers import BlipForQuestionAnswering, BlipProcessor
+device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
+processor = BlipProcessor.from_pretrained("Salesforce/blip-vqa-capfilt-large")
+model_vqa = BlipForQuestionAnswering.from_pretrained("Salesforce/blip-vqa-capfilt-large").to(device)
+def inference_chat(input_image,input_text):
+    inputs = processor(images=input_image, text=input_text,return_tensors="pt")
+    inputs["max_length"] = 20
+    inputs["num_beams"] = 5
+    inputs['num_return_sequences'] =4
+    out = model_vqa.generate(**inputs)
+    return "\n".join(processor.batch_decode(out, skip_special_tokens=True))
+with gr.Blocks(
+    css="""
+    .message.svelte-w6rprc.svelte-w6rprc.svelte-w6rprc {font-size: 20px; margin-top: 20px}
+    #component-21 > div.wrap.svelte-w6rprc {height: 600px;}
+    """
+) as iface:
+    state = gr.State([])
+    #caption_output = None
+    #gr.Markdown(title)
+    #gr.Markdown(description)
+    #gr.Markdown(article)
+    with gr.Row():
+        with gr.Column(scale=1):
+            image_input = gr.Image(type="pil")
+            with gr.Row():
+                with gr.Column(scale=1):
+                    chat_input = gr.Textbox(lines=1, label="VQA Input(问题输入)")
+                    with gr.Row():
+                        clear_button = gr.Button(value="Clear", interactive=True)
+                        submit_button = gr.Button(
+                            value="Submit", interactive=True, variant="primary"
+                        )
+        with gr.Column():
+            caption_output = gr.Textbox(lines=0, label="VQA Output(模型答案输出)")
+        image_input.change(
+            lambda: ("", "", []),
+            [],
+            [ caption_output, state],
+            queue=False,
+        )
+        chat_input.submit(
+                    inference_chat,
+                    [
+                        image_input,
+                        chat_input,
+                    ],
+                    [ caption_output],
+                )
+        clear_button.click(
+                        lambda: ("", [], []),
+                        [],
+                        [chat_input,  state],
+                        queue=False,
+                    )
+        submit_button.click(
+                        inference_chat,
+                        [
+                            image_input,
+                            chat_input,
+                        ],
+                        [caption_output],
+                    )
+   # examples = gr.Examples(
+   #     examples=examples,
+   #     inputs=[image_input, chat_input],
+  #  )
+iface.queue(concurrency_count=1, api_open=False, max_size=10)
+iface.launch(enable_queue=True)