Abrahamau committed on
Commit
6d21195
·
verified ·
1 Parent(s): 1269470

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -6
app.py CHANGED
@@ -27,17 +27,14 @@ def guessanAge(model, image):
27
 
28
  @spaces.GPU(duration=120)
29
  def text2speech(model, text, voice):
30
- print(model, text, voice)
31
  if len(text) > 0:
32
- processor = SpeechT5Processor.from_pretrained("microsoft/speecht5_tts")
33
- model = SpeechT5ForTextToSpeech.from_pretrained("microsoft/speecht5_tts")
34
- vocoder = SpeechT5HifiGan.from_pretrained("microsoft/speecht5_hifigan")
35
- inputs = processor(text=text, return_tensors="pt")
36
 
37
  embeddings_dataset = load_dataset("Matthijs/cmu-arctic-xvectors", split="validation")
38
  speaker_embedding = torch.tensor(embeddings_dataset[voice]["xvector"]).unsqueeze(0)
39
 
40
- speech = model.generate_speech(inputs["input_ids"], speaker_embeddings, vocoder=vocoder)
41
  audio_data = np.frombuffer(speech["audio"], dtype=np.float32)
42
  audio_data_16bit = (audio_data * 32767).astype(np.int16)
43
  return speech["sampling_rate"], audio_data_16bit
 
27
 
28
  @spaces.GPU(duration=120)
29
  def text2speech(model, text, voice):
30
+ print(voice)
31
  if len(text) > 0:
32
+ synthesiser = pipeline("text-to-speech", model=model)
 
 
 
33
 
34
  embeddings_dataset = load_dataset("Matthijs/cmu-arctic-xvectors", split="validation")
35
  speaker_embedding = torch.tensor(embeddings_dataset[voice]["xvector"]).unsqueeze(0)
36
 
37
+ speech = synthesiser(text, forward_params={"speaker_embeddings": speaker_embedding})
38
  audio_data = np.frombuffer(speech["audio"], dtype=np.float32)
39
  audio_data_16bit = (audio_data * 32767).astype(np.int16)
40
  return speech["sampling_rate"], audio_data_16bit