File size: 639 Bytes
9206300
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
# Hyperparameters for the task class tasks.tts.fs_adv.FastSpeechAdvTask.
# NOTE(review): base_config points at ./fs.yaml; presumably the keys below are
# applied on top of that file's values — confirm against the config loader.
base_config: ./fs.yaml
task_cls: tasks.tts.fs_adv.FastSpeechAdvTask

# NOTE(review): presumably the weight of the adversarial mel loss term —
# verify against the task code.
lambda_mel_adv: 0.05

# Discriminator settings. The meaning of each value is defined by the task /
# discriminator code, which is not visible from this file.
disc_win_num: 3
mel_disc_hidden_size: 128
# Plain scalar `in` loads as the string "in".
# NOTE(review): presumably selects instance normalization — TODO confirm.
disc_norm: in
disc_reduction: stack
disc_interval: 1
disc_lr: 0.0001
disc_start_steps: 0
# NOTE(review): gamma/step_size look like step-decay scheduler arguments
# (multiply the LR by gamma every step_size steps) — confirm which scheduler
# class receives them.
discriminator_scheduler_params:
  gamma: 0.5
  step_size: 40000
# NOTE(review): presumably passed through to the discriminator's optimizer.
discriminator_optimizer_params:
  # Keep the `1.0e-06` spelling (decimal point and signed exponent): some
  # YAML 1.1 loaders read shorter forms such as `1e-6` as a string.
  eps: 1.0e-06
  weight_decay: 0.0

# Generator-side learning-rate schedule and base learning rate.
# NOTE(review): "generator-side" is inferred from the separate disc_lr key
# above — confirm.
scheduler: rsqrt
lr: 0.4 # changed from 1.0

# copied from the graph-porta-speech repo
predictor_grad: 0.02

max_tokens: 30000
num_sanity_val_steps: 0 # number of validation steps run at the beginning; 0 skips them
ds_workers: 1

# NOTE(review): pitch_type is still set although use_pitch_embed is false;
# whether it is read in that case cannot be determined from this file.
use_pitch_embed: false # Attention: no pitch predictor!
pitch_type: cwt # one of: frame | ph | cwt