Nepjune committed
Commit 6819cba · verified · 1 parent: edf49bd

Update app.py

Files changed (1): app.py (+5 −11)
app.py CHANGED
```diff
@@ -1,20 +1,14 @@
-from __future__ import annotations
-
-import gradio as gr
-import PIL.Image
-import spaces
+from transformers import ViTFeatureExtractor, ViTForImageToText, AutoTokenizer
 import torch
-from transformers import AutoProcessor, BlipForConditionalGeneration
+from PIL import Image
 
-DESCRIPTION = "# Image Captioning with BLIP"
+model = ViTForImageToText.from_pretrained("nlpconnect/vit-gpt2-image-captioning")
+feature_extractor = ViTFeatureExtractor.from_pretrained("nlpconnect/vit-gpt2-image-captioning")
+tokenizer = AutoTokenizer.from_pretrained("nlpconnect/vit-gpt2-image-captioning")
 
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 model.to(device)
 
-model_id = "Salesforce/blip-image-captioning-large"
-processor = AutoProcessor.from_pretrained(model_id)
-model = BlipForConditionalGeneration.from_pretrained(model_id).to(device)
-
 max_length = 16
 num_beams = 4
 gen_kwargs = {"max_length": max_length, "num_beams": num_beams}
```
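Note: as committed, app.py will still fail at import time. transformers has no `ViTForImageToText` class; the `nlpconnect/vit-gpt2-image-captioning` checkpoint loads as a `VisionEncoderDecoderModel` (a ViT encoder paired with a GPT-2 decoder), and `ViTFeatureExtractor` has been superseded by `ViTImageProcessor` in recent transformers releases. Below is a minimal working sketch of the intended setup; the `predict_caption` helper and the example file path are illustrative additions, not part of the commit:

```python
import torch
from PIL import Image
from transformers import AutoTokenizer, ViTImageProcessor, VisionEncoderDecoderModel

# nlpconnect/vit-gpt2-image-captioning is a ViT encoder + GPT-2 decoder,
# so it loads via VisionEncoderDecoderModel rather than a ViT-specific class.
model_id = "nlpconnect/vit-gpt2-image-captioning"
model = VisionEncoderDecoderModel.from_pretrained(model_id)
feature_extractor = ViTImageProcessor.from_pretrained(model_id)
tokenizer = AutoTokenizer.from_pretrained(model_id)

device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
model.to(device)

max_length = 16
num_beams = 4
gen_kwargs = {"max_length": max_length, "num_beams": num_beams}


def predict_caption(image: Image.Image) -> str:
    # Hypothetical helper, not in the commit: preprocess one image and
    # decode a beam-search caption using the gen_kwargs defined above.
    if image.mode != "RGB":
        image = image.convert("RGB")
    pixel_values = feature_extractor(images=[image], return_tensors="pt").pixel_values
    output_ids = model.generate(pixel_values.to(device), **gen_kwargs)
    return tokenizer.batch_decode(output_ids, skip_special_tokens=True)[0].strip()


# Example usage (path is illustrative):
# print(predict_caption(Image.open("example.jpg")))
```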