"""Gradio demo that transcribes microphone audio with streaming_stt_nemo models."""

from streaming_stt_nemo import Model
import gradio as gr

# Language codes offered in the UI, taken from the keys of Model.langs.
LANGUAGES = list(Model.langs.keys())
default_lang = "en"

# Cache of loaded models keyed by language code. The default language is
# loaded eagerly at start-up; other languages are loaded on first use.
engines = {default_lang: Model(default_lang)}


def transcribe(audio, language: str):
    """Transcribe one recorded audio file in the selected language.

    Args:
        audio: Value supplied by the ``gr.Audio`` input. The component is
            configured with ``type="filepath"``, so this is expected to be a
            path to the recording; it may be ``None``/empty when no audio is
            available (e.g. the recording was cleared while ``live=True``).
        language: Language code selecting which model to use; a model is
            created and cached in ``engines`` the first time a code is seen.

    Returns:
        An empty string when there is no audio; otherwise the first element
        of what ``stt_model.transcribe`` returns for a one-file batch.
    """
    # With live=True the callback fires on every input change, including
    # when the recording is absent; do not hand a missing path to the model.
    if not audio:
        return ""

    # Load the model for this language lazily and keep it for later calls.
    if language not in engines:
        engines[language] = Model(language)
    model = engines[language]

    # transcribe() takes a list of inputs; we send one and take its result.
    return model.stt_model.transcribe([audio])[0]


demo = gr.Interface(
    fn=transcribe,
    inputs=[
        gr.Audio(source="microphone", type="filepath"),
        gr.Radio(
            label="Language",
            choices=LANGUAGES,
            value=default_lang,
        ),
    ],
    outputs=["textbox"],
    # Re-run transcribe automatically whenever an input changes.
    live=True,
)

demo.launch()