mrq
committed on
Commit
·
fbe5bba
1
Parent(s):
4715909
this still needs to be manually updated because of a weird quirk where the latest repo just isn't fetched
Browse files
- app.py +4 -1
- requirements.txt +1 -1
app.py
CHANGED
@@ -204,6 +204,7 @@ def do_inference_tts( progress=gr.Progress(track_tqdm=True), *args, **kwargs ):
|
|
204 |
parser.add_argument("--modality", type=str, default=kwargs["modality"])
|
205 |
parser.add_argument("--references", type=str, default=kwargs["reference"])
|
206 |
parser.add_argument("--language", type=str, default=kwargs["language"])
|
|
|
207 |
parser.add_argument("--split-text-by", type=str, default=kwargs["split-text-by"])
|
208 |
parser.add_argument("--context-history", type=int, default=kwargs["context-history"])
|
209 |
parser.add_argument("--input-prompt-length", type=float, default=kwargs["input-prompt-length"])
|
@@ -300,6 +301,7 @@ def do_inference_tts( progress=gr.Progress(track_tqdm=True), *args, **kwargs ):
|
|
300 |
wav, sr = tts.inference(
|
301 |
text=args.text,
|
302 |
language=args.language,
|
|
|
303 |
task=args.task,
|
304 |
modality=args.modality.lower(),
|
305 |
references=args.references.split(";") if args.references is not None else [],
|
@@ -445,7 +447,8 @@ with ui:
|
|
445 |
with gr.Row():
|
446 |
layout["inference_tts"]["inputs"]["cfg-strength"] = gr.Slider(value=1.0, minimum=0.0, maximum=14.0, step=0.05, label="CFG Strength", info="Classifier Free Guidance scale (AR needs 1, NAR-len needs 3).")
|
447 |
layout["inference_tts"]["inputs"]["cfg-rescale"] = gr.Slider(value=0.75, minimum=0.0, maximum=1.0, step=0.05, label="CFG Rescale (Phi)", info="Factor when rescaling for Classifier Free Guidance (0 to disable).")
|
448 |
-
layout["inference_tts"]["inputs"]["language"] = gr.Dropdown(choices=get_languages(), label="Language", value="en")
|
|
|
449 |
with gr.Row():
|
450 |
layout["inference_tts"]["inputs"]["split-text-by"] = gr.Dropdown(choices=["sentences", "lines"], label="Text Delimiter", info="Splits the text into pieces.", value="sentences")
|
451 |
layout["inference_tts"]["inputs"]["context-history"] = gr.Slider(value=0, minimum=0, maximum=4, step=1, label="(Rolling) Context History", info="How many prior lines to serve as the context/prefix (0 to disable).")
|
|
|
204 |
parser.add_argument("--modality", type=str, default=kwargs["modality"])
|
205 |
parser.add_argument("--references", type=str, default=kwargs["reference"])
|
206 |
parser.add_argument("--language", type=str, default=kwargs["language"])
|
207 |
+
parser.add_argument("--text-language", type=str, default=kwargs["text-language"])
|
208 |
parser.add_argument("--split-text-by", type=str, default=kwargs["split-text-by"])
|
209 |
parser.add_argument("--context-history", type=int, default=kwargs["context-history"])
|
210 |
parser.add_argument("--input-prompt-length", type=float, default=kwargs["input-prompt-length"])
|
|
|
301 |
wav, sr = tts.inference(
|
302 |
text=args.text,
|
303 |
language=args.language,
|
304 |
+
text_language=args.text_language,
|
305 |
task=args.task,
|
306 |
modality=args.modality.lower(),
|
307 |
references=args.references.split(";") if args.references is not None else [],
|
|
|
447 |
with gr.Row():
|
448 |
layout["inference_tts"]["inputs"]["cfg-strength"] = gr.Slider(value=1.0, minimum=0.0, maximum=14.0, step=0.05, label="CFG Strength", info="Classifier Free Guidance scale (AR needs 1, NAR-len needs 3).")
|
449 |
layout["inference_tts"]["inputs"]["cfg-rescale"] = gr.Slider(value=0.75, minimum=0.0, maximum=1.0, step=0.05, label="CFG Rescale (Phi)", info="Factor when rescaling for Classifier Free Guidance (0 to disable).")
|
450 |
+
layout["inference_tts"]["inputs"]["language"] = gr.Dropdown(choices=get_languages(), label="Language (Output)", value="en", info="Target language/accent to output.")
|
451 |
+
layout["inference_tts"]["inputs"]["text-language"] = gr.Dropdown(choices=get_languages(), label="Language (Text)", value="en", info="Language the input text is in.")
|
452 |
with gr.Row():
|
453 |
layout["inference_tts"]["inputs"]["split-text-by"] = gr.Dropdown(choices=["sentences", "lines"], label="Text Delimiter", info="Splits the text into pieces.", value="sentences")
|
454 |
layout["inference_tts"]["inputs"]["context-history"] = gr.Slider(value=0, minimum=0, maximum=4, step=1, label="(Rolling) Context History", info="How many prior lines to serve as the context/prefix (0 to disable).")
|
requirements.txt
CHANGED
@@ -2,4 +2,4 @@
|
|
2 |
torch
|
3 |
torchaudio
|
4 |
|
5 |
-
vall_e @ git+https://github.com/e-c-k-e-r/vall-e.git@
|
|
|
2 |
torch
|
3 |
torchaudio
|
4 |
|
5 |
+
vall_e @ git+https://github.com/e-c-k-e-r/vall-e.git@5d80a2d0d44f9b1949f7b43cdeebe48e2772649c
|