mouaddb committed on
Commit
95f4cfd
·
1 Parent(s): a04cf9c

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -5
app.py CHANGED
@@ -2,10 +2,6 @@ import gradio as gr
2
  from transformers import AutoProcessor, AutoTokenizer, AutoImageProcessor, AutoModelForCausalLM, BlipForConditionalGeneration, VisionEncoderDecoderModel
3
  import torch
4
 
5
- torch.hub.download_url_to_file('http://images.cocodataset.org/val2017/000000039769.jpg', 'cats.jpg')
6
- torch.hub.download_url_to_file('https://huggingface.co/datasets/nielsr/textcaps-sample/resolve/main/stop_sign.png', 'stop_sign.png')
7
- torch.hub.download_url_to_file('https://cdn.openai.com/dall-e-2/demos/text2im/astronaut/horse/photo/0.jpg', 'astronaut.jpg')
8
-
9
  git_processor_base = AutoProcessor.from_pretrained("microsoft/git-base-coco")
10
  git_model_base = AutoModelForCausalLM.from_pretrained("microsoft/git-base-coco")
11
 
@@ -57,7 +53,7 @@ def generate_captions(image):
57
  return caption_git_base, caption_git_large, caption_blip_base, caption_blip_large, caption_vitgpt
58
 
59
 
60
- examples = [["cats.jpg"], ["stop_sign.png"], ["astronaut.jpg"]]
61
  outputs = [gr.outputs.Textbox(label="Caption generated by GIT-base"), gr.outputs.Textbox(label="Caption generated by GIT-large"), gr.outputs.Textbox(label="Caption generated by BLIP-base"), gr.outputs.Textbox(label="Caption generated by BLIP-large"), gr.outputs.Textbox(label="Caption generated by ViT+GPT-2")]
62
 
63
  title = "Interactive demo: comparing image captioning models"
 
2
  from transformers import AutoProcessor, AutoTokenizer, AutoImageProcessor, AutoModelForCausalLM, BlipForConditionalGeneration, VisionEncoderDecoderModel
3
  import torch
4
 
 
 
 
 
5
  git_processor_base = AutoProcessor.from_pretrained("microsoft/git-base-coco")
6
  git_model_base = AutoModelForCausalLM.from_pretrained("microsoft/git-base-coco")
7
 
 
53
  return caption_git_base, caption_git_large, caption_blip_base, caption_blip_large, caption_vitgpt
54
 
55
 
56
+ examples = [["test-1.jpg"], ["test-2.png"], ["test-3.jpg"]]
57
  outputs = [gr.outputs.Textbox(label="Caption generated by GIT-base"), gr.outputs.Textbox(label="Caption generated by GIT-large"), gr.outputs.Textbox(label="Caption generated by BLIP-base"), gr.outputs.Textbox(label="Caption generated by BLIP-large"), gr.outputs.Textbox(label="Caption generated by ViT+GPT-2")]
58
 
59
  title = "Interactive demo: comparing image captioning models"