Nepjune committed
Commit 7bf188c · verified · 1 Parent(s): 651ec42

Update app.py

Files changed (1): app.py (+11, -5)
app.py CHANGED
@@ -1,14 +1,20 @@
-from transformers import ViTFeatureExtractor, ViTForImageCaptioning, AutoTokenizer
+from __future__ import annotations
+
+import gradio as gr
+import PIL.Image
+import spaces
 import torch
-from PIL import Image
+from transformers import AutoProcessor, BlipForConditionalGeneration
 
-model = ViTForImageCaptioning.from_pretrained("nlpconnect/vit-gpt2-image-captioning")
-feature_extractor = ViTFeatureExtractor.from_pretrained("nlpconnect/vit-gpt2-image-captioning")
-tokenizer = AutoTokenizer.from_pretrained("nlpconnect/vit-gpt2-image-captioning")
+DESCRIPTION = "# Image Captioning with BLIP"
 
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 model.to(device)
 
+model_id = "Salesforce/blip-image-captioning-large"
+processor = AutoProcessor.from_pretrained(model_id)
+model = BlipForConditionalGeneration.from_pretrained(model_id).to(device)
+
 max_length = 16
 num_beams = 4
 gen_kwargs = {"max_length": max_length, "num_beams": num_beams}
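
For context, here is a minimal sketch of how the BLIP pieces added in this commit are typically wired together for caption generation. Note that the diff leaves the old `model.to(device)` context line in place above the new `model = ...` definition, so the committed file as shown would raise a NameError at import time; the sketch below reorders those statements. The `caption` function and the example file path are illustrative assumptions, not part of this commit.

# Minimal usage sketch, assuming the setup added in this commit.
# The leftover `model.to(device)` from the old file is dropped here so
# that device placement happens only after the model is created.
import PIL.Image
import torch
from transformers import AutoProcessor, BlipForConditionalGeneration

device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

model_id = "Salesforce/blip-image-captioning-large"
processor = AutoProcessor.from_pretrained(model_id)
model = BlipForConditionalGeneration.from_pretrained(model_id).to(device)

gen_kwargs = {"max_length": 16, "num_beams": 4}

def caption(image: PIL.Image.Image) -> str:
    # Preprocess the image into pixel values, generate token ids with
    # beam search, and decode them back into a caption string.
    inputs = processor(images=image, return_tensors="pt").to(device)
    output_ids = model.generate(**inputs, **gen_kwargs)
    return processor.decode(output_ids[0], skip_special_tokens=True)

if __name__ == "__main__":
    # Hypothetical local image path, for illustration only.
    print(caption(PIL.Image.open("example.jpg")))

The `gradio` and `spaces` imports added by the commit suggest the app exposes this model through a Gradio UI on a GPU-backed Space; that wiring is not part of the diff shown here, so the sketch stops at the caption function.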