Commit 3b96c34 · 1 parent: 97f62f8
Update TTS/vocoder/configs/shared_configs.py
Browse files
TTS/vocoder/configs/shared_configs.py
CHANGED
|
@@ -50,7 +50,7 @@ class BaseVocoderConfig(BaseTrainingConfig):
|
|
| 50 |
conv_pad: int = 0 # additional padding against convolutions applied to spectrograms
|
| 51 |
use_cache: bool = False # use in memory cache to keep the computed features. This might cause OOM.
|
| 52 |
# OPTIMIZER
|
| 53 |
-
epochs: int =
|
| 54 |
wd: float = 0.0 # Weight decay weight.
|
| 55 |
optimizer: str = "AdamW"
|
| 56 |
optimizer_params: dict = field(default_factory=lambda: {"betas": [0.8, 0.99], "weight_decay": 0.0})
|
|
@@ -90,7 +90,7 @@ class BaseGANVocoderConfig(BaseVocoderConfig):
|
|
| 90 |
Parameters for the L1 spectrogram loss. Defaults to
|
| 91 |
`{
|
| 92 |
"use_mel": True,
|
| 93 |
-
"sample_rate":
|
| 94 |
"n_fft": 1024,
|
| 95 |
"hop_length": 256,
|
| 96 |
"win_length": 1024,
|
|
@@ -155,7 +155,7 @@ class BaseGANVocoderConfig(BaseVocoderConfig):
|
|
| 155 |
l1_spec_loss_params: dict = field(
|
| 156 |
default_factory=lambda: {
|
| 157 |
"use_mel": True,
|
| 158 |
-
"sample_rate":
|
| 159 |
"n_fft": 1024,
|
| 160 |
"hop_length": 256,
|
| 161 |
"win_length": 1024,
|
|
|
|
| 50 |
conv_pad: int = 0 # additional padding against convolutions applied to spectrograms
|
| 51 |
use_cache: bool = False # use in memory cache to keep the computed features. This might cause OOM.
|
| 52 |
# OPTIMIZER
|
| 53 |
+
epochs: int = 10000 # total number of epochs to train.
|
| 54 |
wd: float = 0.0 # Weight decay weight.
|
| 55 |
optimizer: str = "AdamW"
|
| 56 |
optimizer_params: dict = field(default_factory=lambda: {"betas": [0.8, 0.99], "weight_decay": 0.0})
|
|
|
|
| 90 |
Parameters for the L1 spectrogram loss. Defaults to
|
| 91 |
`{
|
| 92 |
"use_mel": True,
|
| 93 |
+
"sample_rate": 22050,
|
| 94 |
"n_fft": 1024,
|
| 95 |
"hop_length": 256,
|
| 96 |
"win_length": 1024,
|
|
|
|
| 155 |
l1_spec_loss_params: dict = field(
|
| 156 |
default_factory=lambda: {
|
| 157 |
"use_mel": True,
|
| 158 |
+
"sample_rate": 22050,
|
| 159 |
"n_fft": 1024,
|
| 160 |
"hop_length": 256,
|
| 161 |
"win_length": 1024,
|