// Provenance (file-viewer residue, kept as a comment so the module parses):
//   author: coyotte508 (HF staff)
//   commit: b2ecf7d, "🍱 Copy folders from huggingface.js"
//   size:   2.29 kB
import type { TaskDataCustom } from "../Types";
/**
 * Static metadata for the image-to-text task.
 *
 * Groups example datasets, one demo input/output pair, an (empty) metrics list,
 * example models and Spaces, a short task summary, the models used by the
 * widget, and an (empty) YouTube video id.
 *
 * NOTE(review): every `id` is presumably a Hugging Face Hub repository id that
 * the consumer resolves against the matching collection (datasets, models,
 * spaces). Confirm against the code that renders this data.
 */
const taskData: TaskDataCustom = {
	// Example datasets for the task.
	datasets: [
		{
			// TODO write proper description
			description: "Dataset from 12M image-text of Reddit",
			id: "red_caps",
		},
		{
			// TODO write proper description
			description: "Dataset from 3.3M images of Google",
			// Bare dataset id, consistent with `red_caps` above. The previous
			// value carried a leading `datasets/` segment, which names the
			// collection rather than an owner.
			// NOTE(review): confirm against how dataset links are built.
			id: "conceptual_captions",
		},
	],
	// One sample image and the caption shown as its expected output.
	demo: {
		inputs: [
			{
				filename: "savanna.jpg",
				type: "img",
			},
		],
		outputs: [
			{
				label: "Detailed description",
				content: "a herd of giraffes and zebras grazing in a field",
				type: "text",
			},
		],
	},
	// No metrics are listed for this task.
	metrics: [],
	// Example models: captioning, OCR, and pix2struct variants.
	models: [
		{
			description: "A robust image captioning model.",
			id: "Salesforce/blip-image-captioning-large",
		},
		{
			description: "A strong image captioning model.",
			id: "nlpconnect/vit-gpt2-image-captioning",
		},
		{
			description: "A strong optical character recognition model.",
			id: "microsoft/trocr-base-printed",
		},
		{
			description: "A strong visual question answering model for scientific diagrams.",
			id: "google/pix2struct-ai2d-base",
		},
		{
			description: "A strong captioning model for UI components.",
			id: "google/pix2struct-widget-captioning-base",
		},
		{
			description: "A captioning model for images that contain text.",
			id: "google/pix2struct-textcaps-base",
		},
	],
	// Example Spaces (hosted applications) for the task.
	spaces: [
		{
			description: "A robust image captioning application.",
			id: "flax-community/image-captioning",
		},
		{
			description: "An application that transcribes handwritings into text.",
			id: "nielsr/TrOCR-handwritten",
		},
		{
			description: "An application that can caption images and answer questions about a given image.",
			id: "Salesforce/BLIP",
		},
		{
			description: "An application that can caption images and answer questions with a conversational agent.",
			id: "Salesforce/BLIP2",
		},
		{
			description: "An image captioning application that demonstrates the effect of noise on captions.",
			id: "johko/capdec-image-captioning",
		},
	],
	summary:
		"Image to text models output a text from a given image. Image captioning or optical character recognition can be considered as the most common applications of image to text.",
	// Model(s) used by the task widget; this one is not among `models` above.
	widgetModels: ["Salesforce/blip-image-captioning-base"],
	// Empty string: no video is associated with this task.
	youtubeId: "",
};
export default taskData;