mrq committed on
Commit
fbe5bba
·
1 Parent(s): 4715909

The pinned vall_e commit in requirements.txt still needs to be updated manually, because of a weird quirk where the latest revision of the repo just isn't fetched otherwise.

Browse files
Files changed (2) hide show
  1. app.py +4 -1
  2. requirements.txt +1 -1
app.py CHANGED
@@ -204,6 +204,7 @@ def do_inference_tts( progress=gr.Progress(track_tqdm=True), *args, **kwargs ):
204
  parser.add_argument("--modality", type=str, default=kwargs["modality"])
205
  parser.add_argument("--references", type=str, default=kwargs["reference"])
206
  parser.add_argument("--language", type=str, default=kwargs["language"])
 
207
  parser.add_argument("--split-text-by", type=str, default=kwargs["split-text-by"])
208
  parser.add_argument("--context-history", type=int, default=kwargs["context-history"])
209
  parser.add_argument("--input-prompt-length", type=float, default=kwargs["input-prompt-length"])
@@ -300,6 +301,7 @@ def do_inference_tts( progress=gr.Progress(track_tqdm=True), *args, **kwargs ):
300
  wav, sr = tts.inference(
301
  text=args.text,
302
  language=args.language,
 
303
  task=args.task,
304
  modality=args.modality.lower(),
305
  references=args.references.split(";") if args.references is not None else [],
@@ -445,7 +447,8 @@ with ui:
445
  with gr.Row():
446
  layout["inference_tts"]["inputs"]["cfg-strength"] = gr.Slider(value=1.0, minimum=0.0, maximum=14.0, step=0.05, label="CFG Strength", info="Classifier Free Guidance scale (AR needs 1, NAR-len needs 3).")
447
  layout["inference_tts"]["inputs"]["cfg-rescale"] = gr.Slider(value=0.75, minimum=0.0, maximum=1.0, step=0.05, label="CFG Rescale (Phi)", info="Factor when rescaling for Classifier Free Guidance (0 to disable).")
448
- layout["inference_tts"]["inputs"]["language"] = gr.Dropdown(choices=get_languages(), label="Language", value="en")
 
449
  with gr.Row():
450
  layout["inference_tts"]["inputs"]["split-text-by"] = gr.Dropdown(choices=["sentences", "lines"], label="Text Delimiter", info="Splits the text into pieces.", value="sentences")
451
  layout["inference_tts"]["inputs"]["context-history"] = gr.Slider(value=0, minimum=0, maximum=4, step=1, label="(Rolling) Context History", info="How many prior lines to serve as the context/prefix (0 to disable).")
 
204
  parser.add_argument("--modality", type=str, default=kwargs["modality"])
205
  parser.add_argument("--references", type=str, default=kwargs["reference"])
206
  parser.add_argument("--language", type=str, default=kwargs["language"])
207
+ parser.add_argument("--text-language", type=str, default=kwargs["text-language"])
208
  parser.add_argument("--split-text-by", type=str, default=kwargs["split-text-by"])
209
  parser.add_argument("--context-history", type=int, default=kwargs["context-history"])
210
  parser.add_argument("--input-prompt-length", type=float, default=kwargs["input-prompt-length"])
 
301
  wav, sr = tts.inference(
302
  text=args.text,
303
  language=args.language,
304
+ text_language=args.text_language,
305
  task=args.task,
306
  modality=args.modality.lower(),
307
  references=args.references.split(";") if args.references is not None else [],
 
447
  with gr.Row():
448
  layout["inference_tts"]["inputs"]["cfg-strength"] = gr.Slider(value=1.0, minimum=0.0, maximum=14.0, step=0.05, label="CFG Strength", info="Classifier Free Guidance scale (AR needs 1, NAR-len needs 3).")
449
  layout["inference_tts"]["inputs"]["cfg-rescale"] = gr.Slider(value=0.75, minimum=0.0, maximum=1.0, step=0.05, label="CFG Rescale (Phi)", info="Factor when rescaling for Classifier Free Guidance (0 to disable).")
450
+ layout["inference_tts"]["inputs"]["language"] = gr.Dropdown(choices=get_languages(), label="Language (Output)", value="en", info="Target language/accent to output.")
451
+ layout["inference_tts"]["inputs"]["text-language"] = gr.Dropdown(choices=get_languages(), label="Language (Text)", value="en", info="Language the input text is in.")
452
  with gr.Row():
453
  layout["inference_tts"]["inputs"]["split-text-by"] = gr.Dropdown(choices=["sentences", "lines"], label="Text Delimiter", info="Splits the text into pieces.", value="sentences")
454
  layout["inference_tts"]["inputs"]["context-history"] = gr.Slider(value=0, minimum=0, maximum=4, step=1, label="(Rolling) Context History", info="How many prior lines to serve as the context/prefix (0 to disable).")
requirements.txt CHANGED
@@ -2,4 +2,4 @@
2
  torch
3
  torchaudio
4
 
5
- vall_e @ git+https://github.com/e-c-k-e-r/vall-e.git@c66a53492c98222f2087de7af7e12da228d29534
 
2
  torch
3
  torchaudio
4
 
5
+ vall_e @ git+https://github.com/e-c-k-e-r/vall-e.git@5d80a2d0d44f9b1949f7b43cdeebe48e2772649c