import type { TaskDataCustom } from "../Types"; const taskData: TaskDataCustom = { datasets: [ { description: "A widely used dataset useful to benchmark named entity recognition models.", id: "conll2003", }, { description: "A multilingual dataset of Wikipedia articles annotated for named entity recognition in over 150 different languages.", id: "wikiann", }, ], demo: { inputs: [ { label: "Input", content: "My name is Omar and I live in Zürich.", type: "text", }, ], outputs: [ { text: "My name is Omar and I live in Zürich.", tokens: [ { type: "PERSON", start: 11, end: 15, }, { type: "GPE", start: 30, end: 36, }, ], type: "text-with-tokens", }, ], }, metrics: [ { description: "", id: "accuracy", }, { description: "", id: "recall", }, { description: "", id: "precision", }, { description: "", id: "f1", }, ], models: [ { description: "A robust performance model to identify people, locations, organizations and names of miscellaneous entities.", id: "dslim/bert-base-NER", }, { description: "Flair models are typically the state of the art in named entity recognition tasks.", id: "flair/ner-english", }, ], spaces: [ { description: "An application that can recognizes entities, extracts noun chunks and recognizes various linguistic features of each token.", id: "spacy/gradio_pipeline_visualizer", }, ], summary: "Token classification is a natural language understanding task in which a label is assigned to some tokens in a text. Some popular token classification subtasks are Named Entity Recognition (NER) and Part-of-Speech (PoS) tagging. NER models could be trained to identify specific entities in a text, such as dates, individuals and places; and PoS tagging would identify, for example, which words in a text are verbs, nouns, and punctuation marks.", widgetModels: ["dslim/bert-base-NER"], youtubeId: "wVHdVlPScxA", }; export default taskData;