Spaces:

gdnartea
/

Chatty_Ashe

Runtime error

gdnartea committed on May 1, 2024

Commit

d1e03b7

verified ·

1 Parent(s): 70fb7bf

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,11 +1,11 @@
 import gradio as gr
 import torch
 from transformers import AutoTokenizer, AutoModelForCausalLM, VitsModel
-from nemo.collections.asr.models import ASRModel
 # load speech to text model
-canary_model = ASRModel.from_pretrained('nvidia/canary-1b')
 canary_model.eval()
 # update decode params
@@ -34,7 +34,11 @@ tts_tokenizer = AutoTokenizer.from_pretrained("facebook/mms-tts-eng")
 def process_speech(speech):
     # Convert the speech to text
-    transcription = canary_model.transcribe(speech, logprobs=False)
     # Process the text
     inputs = proc_tokenizer.encode(transcription + proc_tokenizer.eos_token, return_tensors='pt')

 import gradio as gr
 import torch
 from transformers import AutoTokenizer, AutoModelForCausalLM, VitsModel
+from nemo.collections.asr.models import EncDecMultiTaskModel
 # load speech to text model
+canary_model = EncDecMultiTaskModel.from_pretrained('nvidia/canary-1b')
 canary_model.eval()
 # update decode params
 def process_speech(speech):
     # Convert the speech to text
+    transcription = canary_model.transcribe(
+        speech,
+        batch_size=16,
+        logprobs=False,
+    )
     # Process the text
     inputs = proc_tokenizer.encode(transcription + proc_tokenizer.eos_token, return_tensors='pt')