Update app.py
Browse files
app.py
CHANGED
@@ -14,6 +14,19 @@ import re
|
|
14 |
import time
|
15 |
from streaming_stt_nemo import Model
|
16 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
17 |
default_lang = "en"
|
18 |
|
19 |
engines = { default_lang: Model(default_lang) }
|
@@ -54,9 +67,19 @@ def model(text):
|
|
54 |
async def respond(audio):
|
55 |
user = transcribe(audio)
|
56 |
reply = model(user)
|
57 |
-
|
58 |
-
voice
|
59 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
60 |
|
61 |
with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmp_file:
|
62 |
tmp_path = tmp_file.name
|
@@ -87,10 +110,18 @@ async def generate1(prompt):
|
|
87 |
if not response.token.text == "</s>":
|
88 |
output += response.token.text
|
89 |
|
90 |
-
|
91 |
-
|
92 |
-
|
93 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
94 |
|
95 |
with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmp_file:
|
96 |
tmp_path = tmp_file.name
|
@@ -103,6 +134,11 @@ with gr.Blocks(css="style.css") as demo:
|
|
103 |
### <center>An Artificial Intelligence Assistant just for YOU:
|
104 |
### <center>Now you can Ask for a spell to Hermione</center>
|
105 |
""")
|
|
|
|
|
|
|
|
|
|
|
106 |
with gr.Row():
|
107 |
input = gr.Audio(label="Your Voice Chat", type="filepath", interactive=True, sources="microphone", waveform_options=False)
|
108 |
output = gr.Audio(label="Hermione", type="filepath", interactive=False, autoplay=True, elem_classes="audio")
|
|
|
14 |
import time
|
15 |
from streaming_stt_nemo import Model
|
16 |
|
17 |
+
Female_language_dict = {
|
18 |
+
'English-Jenny (Female)': 'en-US-JennyNeural',
|
19 |
+
'English-Ana (Female)': 'en-US-AnaNeural',
|
20 |
+
'English-Aria (Female)': 'en-US-AriaNeural',
|
21 |
+
'English-Michelle (Female)': 'en-US-MichelleNeural',
|
22 |
+
'English (Australia)-Natasha- (Female)': 'en-AU-NatashaNeural',
|
23 |
+
'English (Canada)-Clara- (Female)': 'en-CA-ClaraNeural',
|
24 |
+
'English (UK)-Libby- (Female)': 'en-GB-LibbyNeural',
|
25 |
+
'English (UK)-Maisie- (Female)': 'en-GB-MaisieNeural',
|
26 |
+
'English (UK)-Sonia- (Female)': 'en-GB-SoniaNeural',
|
27 |
+
'English (Ireland)-Emily- (Female)': 'en-IE-EmilyNeural',
|
28 |
+
}
|
29 |
+
|
30 |
default_lang = "en"
|
31 |
|
32 |
engines = { default_lang: Model(default_lang) }
|
|
|
67 |
async def respond(audio):
|
68 |
user = transcribe(audio)
|
69 |
reply = model(user)
|
70 |
+
|
71 |
+
# Random voice choise from Manager base on locale and gender
|
72 |
+
#
|
73 |
+
#voices = await VoicesManager.create()
|
74 |
+
#voice = voices.find(Gender="Female", Locale="en-GB")
|
75 |
+
#communicate = edge_tts.Communicate(reply, random.choice(voice)["Name"])
|
76 |
+
#
|
77 |
+
# Or the following as one selected Voice for the character.
|
78 |
+
|
79 |
+
language_code = 'English (UK)-Maisie- (Female)'
|
80 |
+
|
81 |
+
voice = language_dict.get(language_code, "default_voice")
|
82 |
+
communicate = edge_tts.Communicate(reply, voice)
|
83 |
|
84 |
with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmp_file:
|
85 |
tmp_path = tmp_file.name
|
|
|
110 |
if not response.token.text == "</s>":
|
111 |
output += response.token.text
|
112 |
|
113 |
+
# Random voice choice from VoiceManager base on locale and gender
|
114 |
+
#
|
115 |
+
#voices = await VoicesManager.create()
|
116 |
+
#voice = voices.find(Gender="Female", Locale="en-GB")
|
117 |
+
#communicate = edge_tts.Communicate(reply, random.choice(voice)["Name"])
|
118 |
+
#
|
119 |
+
# Or the following as one selected voice for the character.
|
120 |
+
|
121 |
+
language_code = 'English (UK)-Maisie- (Female)'
|
122 |
+
|
123 |
+
voice = language_dict.get(language_code, "default_voice")
|
124 |
+
communicate = edge_tts.Communicate(output, voice)
|
125 |
|
126 |
with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmp_file:
|
127 |
tmp_path = tmp_file.name
|
|
|
134 |
### <center>An Artificial Intelligence Assistant just for YOU:
|
135 |
### <center>Now you can Ask for a spell to Hermione</center>
|
136 |
""")
|
137 |
+
# Use for the Selection of voice for Hermione
|
138 |
+
#with gr.Row():
|
139 |
+
# language_code = gr.Dropdown(choices=list(Female_language_dict.keys()), label="Select Voice for Hermione")
|
140 |
+
#
|
141 |
+
|
142 |
with gr.Row():
|
143 |
input = gr.Audio(label="Your Voice Chat", type="filepath", interactive=True, sources="microphone", waveform_options=False)
|
144 |
output = gr.Audio(label="Hermione", type="filepath", interactive=False, autoplay=True, elem_classes="audio")
|