Spaces:
Sleeping
Sleeping
Update Modules/ToucanTTS/InferenceToucanTTS.py
Browse files
Modules/ToucanTTS/InferenceToucanTTS.py
CHANGED
@@ -270,7 +270,7 @@ class ToucanTTS(torch.nn.Module):
|
|
270 |
refined_codec_frames = self.flow_matching_decoder(mu=preliminary_spectrogram.transpose(1, 2),
|
271 |
mask=make_non_pad_mask([len(decoded_speech[0])], device=decoded_speech.device).unsqueeze(-2),
|
272 |
n_timesteps=15,
|
273 |
-
temperature=0.
|
274 |
c=None).transpose(1, 2)
|
275 |
|
276 |
return refined_codec_frames, predicted_durations.squeeze(), pitch_predictions.squeeze(), energy_predictions.squeeze()
|
|
|
270 |
refined_codec_frames = self.flow_matching_decoder(mu=preliminary_spectrogram.transpose(1, 2),
|
271 |
mask=make_non_pad_mask([len(decoded_speech[0])], device=decoded_speech.device).unsqueeze(-2),
|
272 |
n_timesteps=15,
|
273 |
+
temperature=0.2, # low temperature, so the model follows the specified prosody curves better.
|
274 |
c=None).transpose(1, 2)
|
275 |
|
276 |
return refined_codec_frames, predicted_durations.squeeze(), pitch_predictions.squeeze(), energy_predictions.squeeze()
|