Spaces:
Build error
Build error
Commit
·
201db01
1
Parent(s):
ebe9cbe
Added new sample voices audio
Browse files
- .vscode/settings.json +5 -1
- app.py +17 -6
- gradio_queue.db +0 -0
- input/sample/Madara.mp3 +3 -0
- input/sample/tony-stark-2.wav +3 -0
- input/sample/tony-stark.wav +3 -0
- output/output.wav +2 -2
.vscode/settings.json
CHANGED
@@ -1,3 +1,7 @@
|
|
1 |
{
|
2 |
-
"cSpell.words": ["Elon"]
|
|
|
|
|
|
|
|
|
3 |
}
|
|
|
1 |
{
|
2 |
+
"cSpell.words": ["Elon"],
|
3 |
+
"[python]": {
|
4 |
+
"editor.defaultFormatter": "ms-python.autopep8"
|
5 |
+
},
|
6 |
+
"python.formatting.provider": "none"
|
7 |
}
|
app.py
CHANGED
@@ -2,16 +2,19 @@ from subprocess import call
|
|
2 |
import gradio as gr
|
3 |
import os
|
4 |
from TTS.api import TTS
|
|
|
5 |
|
6 |
# List available 🐸TTS models and choose the first one
|
7 |
-
all_models = TTS.list_models()
|
8 |
# for model in all_models:
|
9 |
# print(model)
|
10 |
|
11 |
# print("Using model: ", all_models[0])
|
12 |
-
model = all_models[0]
|
13 |
# Init TTS
|
14 |
|
|
|
|
|
15 |
|
16 |
print("Downloading model...", '')
|
17 |
|
@@ -30,6 +33,10 @@ def run_cmd(command):
|
|
30 |
|
31 |
|
32 |
def inference(text, speaker):
|
|
|
|
|
|
|
|
|
33 |
if (speaker == 'Speaker-1'):
|
34 |
speaker = 'input/amitabh.mp3'
|
35 |
elif (speaker == 'Speaker-2'):
|
@@ -44,6 +51,10 @@ def inference(text, speaker):
|
|
44 |
speaker = 'input/sample/Elon-Sample.wav'
|
45 |
elif (speaker == 'Obama'):
|
46 |
speaker = 'input/sample/Obama-sample.wav'
|
|
|
|
|
|
|
|
|
47 |
else:
|
48 |
speaker = 'input/z-default.wav'
|
49 |
# print("speaker: ", speaker)
|
@@ -63,12 +74,12 @@ def inference(text, speaker):
|
|
63 |
|
64 |
|
65 |
sampleInput = ['Speaker-1', 'Speaker-2', 'Speaker-3',
|
66 |
-
'Speaker-4', 'Rock', 'Elon', 'Obama']
|
67 |
-
inputs = [gr.
|
68 |
-
gr.
|
69 |
sampleInput, label="Sample Input", default="Speaker-1",)
|
70 |
]
|
71 |
-
outputs = gr.
|
72 |
title = "Text To Speech"
|
73 |
description = "An example of using TTS to generate speech from text."
|
74 |
article = ""
|
|
|
2 |
import gradio as gr
|
3 |
import os
|
4 |
from TTS.api import TTS
|
5 |
+
from TTS.utils.synthesizer import Synthesizer
|
6 |
|
7 |
# List available 🐸TTS models and choose the first one
|
8 |
+
# all_models = TTS.list_models()
|
9 |
# for model in all_models:
|
10 |
# print(model)
|
11 |
|
12 |
# print("Using model: ", all_models[0])
|
13 |
+
# model = all_models[0]
|
14 |
# Init TTS
|
15 |
|
16 |
+
MAX_TXT_LEN = 500
|
17 |
+
|
18 |
|
19 |
print("Downloading model...", '')
|
20 |
|
|
|
33 |
|
34 |
|
35 |
def inference(text, speaker):
|
36 |
+
if len(text) > MAX_TXT_LEN:
|
37 |
+
text = text[:MAX_TXT_LEN]
|
38 |
+
print(
|
39 |
+
f"Input text was cutoff since it went over the {MAX_TXT_LEN} character limit.")
|
40 |
if (speaker == 'Speaker-1'):
|
41 |
speaker = 'input/amitabh.mp3'
|
42 |
elif (speaker == 'Speaker-2'):
|
|
|
51 |
speaker = 'input/sample/Elon-Sample.wav'
|
52 |
elif (speaker == 'Obama'):
|
53 |
speaker = 'input/sample/Obama-sample.wav'
|
54 |
+
elif (speaker == 'Tony'):
|
55 |
+
speaker = 'input/sample/tony-stark-2.wav'
|
56 |
+
elif (speaker == 'Madara Uchiha'):
|
57 |
+
speaker = 'input/sample/Madara.mp3'
|
58 |
else:
|
59 |
speaker = 'input/z-default.wav'
|
60 |
# print("speaker: ", speaker)
|
|
|
74 |
|
75 |
|
76 |
sampleInput = ['Speaker-1', 'Speaker-2', 'Speaker-3',
|
77 |
+
'Speaker-4', 'Rock', 'Elon', 'Obama', 'Tony', 'Madara Uchiha']
|
78 |
+
inputs = [gr.Textbox(lines=5, label="Input Text"),
|
79 |
+
gr.Dropdown(
|
80 |
sampleInput, label="Sample Input", default="Speaker-1",)
|
81 |
]
|
82 |
+
outputs = gr.Audio(type="filepath", label="Output Audio")
|
83 |
title = "Text To Speech"
|
84 |
description = "An example of using TTS to generate speech from text."
|
85 |
article = ""
|
gradio_queue.db
CHANGED
Binary files a/gradio_queue.db and b/gradio_queue.db differ
|
|
input/sample/Madara.mp3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:601c62ffb87f3879576194637190758defa9a13000c3fb38f814332a64e6835e
|
3 |
+
size 259062
|
input/sample/tony-stark-2.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:106c43d952d7caf2d9e372cf4f74c7febde7a8a543532b5fc5e3a02ab4956cc3
|
3 |
+
size 99862
|
input/sample/tony-stark.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a46f91b72ca5825e4166652af58155bb6c8e764b368b51da0652775a104c19fb
|
3 |
+
size 17998
|
output/output.wav
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d6cbd93714af794b46b7ccd96d30949ae39b55343bb841abf37a2d17b4ce4824
|
3 |
+
size 172108
|