ntt123 committed on
Commit
757c793
·
1 Parent(s): 41d0fa1
Files changed (2) hide show
  1. README.md +0 -16
  2. requirements.txt +3 -6
README.md CHANGED
@@ -5,24 +5,8 @@ colorFrom: red
5
  colorTo: pink
6
  sdk: gradio
7
  sdk_version: 5.9.1
8
- python_version: 3.11
9
  app_file: app.py
10
  pinned: false
11
  license: mit
12
- models:
13
- - ntt123/diffusion-speech-360h
14
- preload_from_hub: true
15
- - ntt123/diffusion-speech-360h acoustic_model_0140000.pt,duration_model_0120000.pt
16
  short_description: A simple diffusion-based text to speech model
17
  ---
18
-
19
- ```
20
- uv run synthesize.py \
21
- --duration-model-config ./train_duration_dit_s.yaml \
22
- --acoustic-model-config ./train_acoustic_dit_b.yaml \
23
- --duration-model-checkpoint ./duration_model_0120000.pt \
24
- --acoustic-model-checkpoint ./acoustic_model_0140000.pt \
25
- --speaker-id 1914 \
26
- --output-file ./audio.wav \
27
- --text "Ilya has made several major contributions to the field of deep learning."
28
- ```
 
5
  colorTo: pink
6
  sdk: gradio
7
  sdk_version: 5.9.1
 
8
  app_file: app.py
9
  pinned: false
10
  license: mit
 
 
 
 
11
  short_description: A simple diffusion-based text to speech model
12
  ---
 
 
 
 
 
 
 
 
 
 
 
requirements.txt CHANGED
@@ -1,9 +1,6 @@
1
- einops==0.8.0
2
- g2p-en==2.1.0
3
- jinja2==3.1.3
4
- nltk==3.9.1
5
- orjson==3.10.12
6
- soundfile==0.12.1
7
  torch
8
  torchaudio
 
 
 
9
  vocos==0.1.0
 
 
 
 
 
 
 
1
  torch
2
  torchaudio
3
+ spaces
4
+ g2p-en==2.1.0
5
+ nltk==3.9.1
6
  vocos==0.1.0