speech-to-speech-translation

Sleeping

Everton Aleixo committed on Aug 29, 2023

Commit

d669329

1 Parent(s): 9578405

Change asr. Add translation.

Files changed (1) hide show

app.py CHANGED Viewed

@@ -9,6 +9,7 @@ device = "cuda:0" if torch.cuda.is_available() else "cpu"
 # load speech translation checkpoint
 asr_pipe = pipeline("automatic-speech-recognition", model="openai/whisper-medium", device=device)
 # load text-to-speech checkpoint and speaker embeddings
 processor = SpeechT5Processor.from_pretrained("microsoft/speecht5_tts")
@@ -21,9 +22,13 @@ speaker_embeddings = torch.tensor(embeddings_dataset[7306]["xvector"]).unsqueeze
 def translate(audio):
-    outputs = asr_pipe(audio, max_new_tokens=256, generate_kwargs={"task": "transcribe", "language":"portuguese"})
     print('outputs', outputs)
-    return outputs["text"]
 def synthesise(text):

 # load speech translation checkpoint
 asr_pipe = pipeline("automatic-speech-recognition", model="openai/whisper-medium", device=device)
+translation_pipe = pipeline("translation", model="alirezamsh/small100")
 # load text-to-speech checkpoint and speaker embeddings
 processor = SpeechT5Processor.from_pretrained("microsoft/speecht5_tts")
 def translate(audio):
+    """Transcribe ``audio`` with ``asr_pipe`` and translate the text to Portuguese.
+
+    Args:
+        audio: Input forwarded unchanged to ``asr_pipe`` (the accepted
+            formats are not visible in this diff).
+
+    Returns:
+        The ``translation_text`` field of the first ``translation_pipe`` result.
+    """
+    # The recogniser is asked to emit English text.
+    outputs = asr_pipe(audio, max_new_tokens=256, generate_kwargs={"task": "transcribe", "language":"english"})
     print('outputs', outputs)
+    text = outputs["text"]
+    # src_lang must match the language requested from asr_pipe above (English),
+    # not the target language; tgt_lang stays Portuguese.
+    translation = translation_pipe(text, src_lang='en', tgt_lang='pt')[0]
+    print('translation', translation)
+    return translation['translation_text']
 def synthesise(text):