// Spaces: Running on CPU Upgrade
import type { TaskDataCustom } from "../Types";

/**
 * Static metadata for the Text-to-Speech (TTS) task.
 *
 * Bundles example datasets, a demo input/output pair, an evaluation metric,
 * example models and Spaces, a short task summary, the widget model list and
 * a YouTube video id.
 *
 * NOTE(review): how each field is consumed is defined by `TaskDataCustom`
 * and its users, which are not visible here — confirm before renaming or
 * reordering entries.
 */
const taskData: TaskDataCustom = {
  // Example speech datasets.
  datasets: [
    {
      description: "Thousands of short audio clips of a single speaker.",
      id: "lj_speech",
    },
    {
      description: "Multi-speaker English dataset.",
      id: "LibriTTS",
    },
  ],
  // Demo pairing: one text prompt in, one audio file out.
  demo: {
    inputs: [
      {
        label: "Input",
        content: "I love audio models on the Hub!",
        type: "text",
      },
    ],
    outputs: [
      {
        filename: "audio.wav",
        type: "audio",
      },
    ],
  },
  metrics: [
    {
      description: "The Mel Cepstral Distortion (MCD) metric is used to calculate the quality of generated speech.",
      id: "mel cepstral distortion",
    },
  ],
  // Example TTS models.
  models: [
    {
      description: "A powerful TTS model.",
      id: "suno/bark",
    },
    {
      description: "A massively multi-lingual TTS model.",
      id: "facebook/mms-tts",
    },
    {
      description: "An end-to-end speech synthesis model.",
      id: "microsoft/speecht5_tts",
    },
  ],
  // Example demo applications.
  spaces: [
    {
      // NOTE(review): same id as the first `models` entry; presumably a Space
      // with the same name exists — confirm.
      description: "An application for generating highly realistic, multilingual speech.",
      id: "suno/bark",
    },
    {
      description: "An application that contains multiple speech synthesis models for various languages and accents.",
      id: "coqui/CoquiTTS",
    },
    {
      description: "An application that synthesizes speech for various speaker types.",
      id: "Matthijs/speecht5-tts-demo",
    },
  ],
  summary:
    "Text-to-Speech (TTS) is the task of generating natural sounding speech given text input. TTS models can be extended to have a single model that generates speech for multiple speakers and multiple languages.",
  // Also listed under `models` above.
  widgetModels: ["microsoft/speecht5_tts"],
  youtubeId: "NW62DpzJ274",
};

export default taskData;