machineuser committed on
Commit
a899be4
·
1 Parent(s): 70192be

Sync widgets demo

Browse files
packages/tasks/src/text-to-speech/about.md CHANGED
@@ -25,7 +25,7 @@ def query(payload):
25
  response = requests.post(API_URL, headers=headers, json=payload)
26
  return response
27
 
28
- output = query({"text_inputs": "This is a test"})
29
  ```
30
 
31
  You can also use libraries such as [espnet](https://huggingface.co/models?library=espnet&pipeline_tag=text-to-speech&sort=downloads) or [transformers](https://huggingface.co/models?pipeline_tag=text-to-speech&library=transformers&sort=trending) if you want to run inference yourself.
@@ -56,6 +56,7 @@ await inference.textToSpeech({
56
 
57
  ## Useful Resources
58
 
 
59
  - [ML for Audio Study Group - Text to Speech Deep Dive](https://www.youtube.com/watch?v=aLBedWj-5CQ)
60
  - [An introduction to SpeechT5, a multi-purpose speech recognition and synthesis model](https://huggingface.co/blog/speecht5).
61
  - [A guide on Fine-tuning Whisper For Multilingual ASR with 🤗Transformers](https://huggingface.co/blog/fine-tune-whisper)
 
25
  response = requests.post(API_URL, headers=headers, json=payload)
26
  return response
27
 
28
+ output = query({"text_inputs": "Max is the best doggo."})
29
  ```
30
 
31
  You can also use libraries such as [espnet](https://huggingface.co/models?library=espnet&pipeline_tag=text-to-speech&sort=downloads) or [transformers](https://huggingface.co/models?pipeline_tag=text-to-speech&library=transformers&sort=trending) if you want to run inference yourself.
 
56
 
57
  ## Useful Resources
58
 
59
+ - [Hugging Face Audio Course](https://huggingface.co/learn/audio-course/chapter6/introduction)
60
  - [ML for Audio Study Group - Text to Speech Deep Dive](https://www.youtube.com/watch?v=aLBedWj-5CQ)
61
  - [An introduction to SpeechT5, a multi-purpose speech recognition and synthesis model](https://huggingface.co/blog/speecht5).
62
  - [A guide on Fine-tuning Whisper For Multilingual ASR with 🤗Transformers](https://huggingface.co/blog/fine-tune-whisper)
packages/tasks/src/text-to-speech/data.ts CHANGED
@@ -52,8 +52,8 @@ const taskData: TaskDataCustom = {
52
  id: "suno/bark",
53
  },
54
  {
55
- description: "An application that contains multiple speech synthesis models for various languages and accents.",
56
- id: "coqui/CoquiTTS",
57
  },
58
  {
59
  description: "An application that synthesizes speech for various speaker types.",
@@ -62,7 +62,7 @@ const taskData: TaskDataCustom = {
62
  ],
63
  summary:
64
  "Text-to-Speech (TTS) is the task of generating natural sounding speech given text input. TTS models can be extended to have a single model that generates speech for multiple speakers and multiple languages.",
65
- widgetModels: ["microsoft/speecht5_tts"],
66
  youtubeId: "NW62DpzJ274",
67
  };
68
 
 
52
  id: "suno/bark",
53
  },
54
  {
55
+ description: "XTTS is a Voice generation model that lets you clone voices into different languages.",
56
+ id: "coqui/xtts",
57
  },
58
  {
59
  description: "An application that synthesizes speech for various speaker types.",
 
62
  ],
63
  summary:
64
  "Text-to-Speech (TTS) is the task of generating natural sounding speech given text input. TTS models can be extended to have a single model that generates speech for multiple speakers and multiple languages.",
65
+ widgetModels: ["suno/bark"],
66
  youtubeId: "NW62DpzJ274",
67
  };
68