ImageCaptioning

Sleeping

krishnv commited on Aug 9, 2024

Commit

2c7adc2

verified ·

1 Parent(s): 9633d94

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,38 +1,15 @@
 from transformers import AutoProcessor, AutoModelForCausalLM
 from PIL import Image
-import gradio as gr
-# Load the processor and model
 processor = AutoProcessor.from_pretrained("microsoft/git-base-coco")
 model = AutoModelForCausalLM.from_pretrained("microsoft/git-base-coco")
-# Define the captioning function
-def caption_image(image):
-    # Process the image
-    pixel_values = processor(images=image, return_tensors="pt").pixel_values
-    # Generate captions
-    generated_ids = model.generate(pixel_values=pixel_values, max_length=50)
-    generated_caption = processor.batch_decode(generated_ids, skip_special_tokens=True)[0]
-    return generated_caption
-# Define Gradio interface components
-inputs = [
-    gr.inputs.Image(type='pil', label='Upload Image')
-]
-outputs = [
-    gr.outputs.Textbox(label='Generated Caption')
-]
-# Define Gradio app properties
-title = "Image Captioning Application"
-description = "Upload an image to see the caption generated by the model"
-# Create and launch the Gradio interface
-gr.Interface(
-    fn=caption_image,
-    inputs=inputs,
-    outputs=outputs,
-    title=title,
-    description=description,
-).launch(debug=True)

 from transformers import AutoProcessor, AutoModelForCausalLM
+import requests
 from PIL import Image
 processor = AutoProcessor.from_pretrained("microsoft/git-base-coco")
 model = AutoModelForCausalLM.from_pretrained("microsoft/git-base-coco")
+url = "http://images.cocodataset.org/val2017/000000039769.jpg"
+image = Image.open(requests.get(url, stream=True).raw)
+pixel_values = processor(images=image, return_tensors="pt").pixel_values
+generated_ids = model.generate(pixel_values=pixel_values, max_length=50)
+generated_caption = processor.batch_decode(generated_ids, skip_special_tokens=True)[0]
+print(generated_caption)