coyotte508's picture
coyotte508 HF staff
🍱 Copy folders from huggingface.js
b2ecf7d
raw
history blame
1.66 kB
import type { TaskDataCustom } from "../Types";
/**
 * Static metadata describing the Text-to-Speech (TTS) task.
 *
 * The object bundles example datasets, a demo input/output pair, metrics,
 * models, spaces, a short summary, the widget model list and a video id.
 * It is the module's default export.
 *
 * NOTE(review): the exact meaning of each field is defined by `TaskDataCustom`
 * in "../Types", which is not visible here — confirm against that type.
 */
const taskData: TaskDataCustom = {
	// Example datasets; ids presumably refer to Hub dataset repositories (verify).
	datasets: [
		{
			description: "Thousands of short audio clips of a single speaker.",
			id: "lj_speech",
		},
		{
			description: "Multi-speaker English dataset.",
			id: "LibriTTS",
		},
	],
	// Sample interaction: one text input paired with one audio output.
	demo: {
		inputs: [
			{
				label: "Input",
				content: "I love audio models on the Hub!",
				type: "text",
			},
		],
		outputs: [
			{
				filename: "audio.wav",
				type: "audio",
			},
		],
	},
	metrics: [
		{
			description: "The Mel Cepstral Distortion (MCD) metric is used to calculate the quality of generated speech.",
			id: "mel cepstral distortion",
		},
	],
	models: [
		{
			description: "A powerful TTS model.",
			id: "suno/bark",
		},
		{
			description: "A massively multi-lingual TTS model.",
			id: "facebook/mms-tts",
		},
		{
			description: "An end-to-end speech synthesis model.",
			id: "microsoft/speecht5_tts",
		},
	],
	spaces: [
		{
			// Wording fixed: the previous text read "An application for generate ...".
			description: "An application that can generate highly realistic, multilingual speech.",
			id: "suno/bark",
		},
		{
			description: "An application that contains multiple speech synthesis models for various languages and accents.",
			id: "coqui/CoquiTTS",
		},
		{
			description: "An application that synthesizes speech for various speaker types.",
			id: "Matthijs/speecht5-tts-demo",
		},
	],
	summary:
		"Text-to-Speech (TTS) is the task of generating natural sounding speech given text input. TTS models can be extended to have a single model that generates speech for multiple speakers and multiple languages.",
	// Same id as the last entry of `models` above.
	widgetModels: ["microsoft/speecht5_tts"],
	youtubeId: "NW62DpzJ274",
};

export default taskData;