Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
machineuser
committed on
Commit
·
a899be4
1
Parent(s):
70192be
Sync widgets demo
Browse files
packages/tasks/src/text-to-speech/about.md
CHANGED
@@ -25,7 +25,7 @@ def query(payload):
|
|
25 |
response = requests.post(API_URL, headers=headers, json=payload)
|
26 |
return response
|
27 |
|
28 |
-
output = query({"text_inputs": "
|
29 |
```
|
30 |
|
31 |
You can also use libraries such as [espnet](https://huggingface.co/models?library=espnet&pipeline_tag=text-to-speech&sort=downloads) or [transformers](https://huggingface.co/models?pipeline_tag=text-to-speech&library=transformers&sort=trending) if you want to handle the Inference directly.
|
@@ -56,6 +56,7 @@ await inference.textToSpeech({
|
|
56 |
|
57 |
## Useful Resources
|
58 |
|
|
|
59 |
- [ML for Audio Study Group - Text to Speech Deep Dive](https://www.youtube.com/watch?v=aLBedWj-5CQ)
|
60 |
- [An introduction to SpeechT5, a multi-purpose speech recognition and synthesis model](https://huggingface.co/blog/speecht5).
|
61 |
- [A guide on Fine-tuning Whisper For Multilingual ASR with 🤗Transformers](https://huggingface.co/blog/fine-tune-whisper)
|
|
|
25 |
response = requests.post(API_URL, headers=headers, json=payload)
|
26 |
return response
|
27 |
|
28 |
+
output = query({"text_inputs": "Max is the best doggo."})
|
29 |
```
|
30 |
|
31 |
You can also use libraries such as [espnet](https://huggingface.co/models?library=espnet&pipeline_tag=text-to-speech&sort=downloads) or [transformers](https://huggingface.co/models?pipeline_tag=text-to-speech&library=transformers&sort=trending) if you want to handle the Inference directly.
|
|
|
56 |
|
57 |
## Useful Resources
|
58 |
|
59 |
+
- [Hugging Face Audio Course](https://huggingface.co/learn/audio-course/chapter6/introduction)
|
60 |
- [ML for Audio Study Group - Text to Speech Deep Dive](https://www.youtube.com/watch?v=aLBedWj-5CQ)
|
61 |
- [An introduction to SpeechT5, a multi-purpose speech recognition and synthesis model](https://huggingface.co/blog/speecht5).
|
62 |
- [A guide on Fine-tuning Whisper For Multilingual ASR with 🤗Transformers](https://huggingface.co/blog/fine-tune-whisper)
|
packages/tasks/src/text-to-speech/data.ts
CHANGED
@@ -52,8 +52,8 @@ const taskData: TaskDataCustom = {
|
|
52 |
id: "suno/bark",
|
53 |
},
|
54 |
{
|
55 |
-
description: "
|
56 |
-
id: "coqui/
|
57 |
},
|
58 |
{
|
59 |
description: "An application that synthesizes speech for various speaker types.",
|
@@ -62,7 +62,7 @@ const taskData: TaskDataCustom = {
|
|
62 |
],
|
63 |
summary:
|
64 |
"Text-to-Speech (TTS) is the task of generating natural sounding speech given text input. TTS models can be extended to have a single model that generates speech for multiple speakers and multiple languages.",
|
65 |
-
widgetModels: ["
|
66 |
youtubeId: "NW62DpzJ274",
|
67 |
};
|
68 |
|
|
|
52 |
id: "suno/bark",
|
53 |
},
|
54 |
{
|
55 |
+
description: "XTTS is a Voice generation model that lets you clone voices into different languages.",
|
56 |
+
id: "coqui/xtts",
|
57 |
},
|
58 |
{
|
59 |
description: "An application that synthesizes speech for various speaker types.",
|
|
|
62 |
],
|
63 |
summary:
|
64 |
"Text-to-Speech (TTS) is the task of generating natural sounding speech given text input. TTS models can be extended to have a single model that generates speech for multiple speakers and multiple languages.",
|
65 |
+
widgetModels: ["suno/bark"],
|
66 |
youtubeId: "NW62DpzJ274",
|
67 |
};
|
68 |
|