Spaces:

Mediocreatmybest
/

PipelineImageCaption

Runtime error

File size: 1,072 Bytes

bca9f16
6b8d35c
bca9f16
6b8d35c
bca9f16
 
 
 
52fd1d4
bca9f16
6b8d35c
bca9f16
44717e7
52fd1d4
 
 
 
 
364461b
bca9f16
6b8d35c
364461b
 
6b8d35c
0e10238
364461b
 
 
44717e7

from functools import lru_cache

import gradio as gr
import torch
from transformers import pipeline

# Captioning models offered in the UI.
# Key:   short label listed in the model dropdown.
# Value: model identifier handed to `pipeline(model=...)`.
CAPTION_MODELS = {
    "blip-base": "Salesforce/blip-image-captioning-base",
    "blip-large": "Salesforce/blip-image-captioning-large",
    "vit-gpt2-coco-en": "ydshieh/vit-gpt2-coco-en",
    "blip2-2.7b-fp16": "Mediocreatmybest/blip2-opt-2.7b-fp16-sharded",
}

@lru_cache(maxsize=1)
def _load_captioner(model_id):
    """Build the image-to-text pipeline for *model_id*.

    Constructing a pipeline loads the model, which is far more expensive
    than running a single caption. Only the most recently used pipeline is
    cached (``maxsize=1``): repeated requests with the same model reuse it,
    while switching models drops the reference to the previous pipeline
    instead of accumulating several models in memory.
    """
    return pipeline(task="image-to-text",
                    model=model_id,
                    max_new_tokens=30,
                    device_map="cpu", use_fast=True
                    )


# Simple caption creation
def caption_image(model_choice, image_input):
    """Return a caption for *image_input* generated by the chosen model.

    Args:
        model_choice: A key of ``CAPTION_MODELS`` selecting the model.
        image_input: The image to caption, as passed on by the UI.

    Returns:
        The generated caption with surrounding whitespace stripped.

    Raises:
        gr.Error: If no valid model is selected or no image is supplied, so
            the UI shows a readable message rather than a raw traceback.
    """
    if model_choice not in CAPTION_MODELS:
        raise gr.Error("Please select a model.")
    if image_input is None:
        raise gr.Error("Please provide an image.")

    captioner = _load_captioner(CAPTION_MODELS[model_choice])
    # The pipeline returns a list of dicts; take the text of the first result.
    caption = captioner(image_input)[0]['generated_text']
    return str(caption).strip()

def launch(model_choice, image_input):
    """Gradio callback: caption *image_input* with the model named by *model_choice*.

    Forwards both arguments unchanged to ``caption_image`` and returns its
    result.
    """
    result = caption_image(model_choice=model_choice, image_input=image_input)
    return result

# Input widgets: a dropdown listing the CAPTION_MODELS keys, and an image
# input configured with type="pil".
model_dropdown = gr.Dropdown(
    label='Model Choice',
    choices=list(CAPTION_MODELS),
)
image_input = gr.Image(label="Input Image or URL", type="pil")

# Wire the widgets to `launch`, show its return value as text, and start the app.
iface = gr.Interface(
    fn=launch,
    inputs=[model_dropdown, image_input],
    outputs="text",
)
iface.launch()