TWASR / model.py
JacobLinCool's picture
feat: update model
f4c725a
raw
history blame
489 Bytes
from transformers import pipeline
from accelerate import Accelerator
# Device handed to the pipeline; chosen by accelerate's Accelerator at import time.
device = Accelerator().device
# Model identifier passed as `model=` when the pipeline is built in load_model().
model_id = "JacobLinCool/whisper-large-v3-turbo-common_voice_19_0-zh-TW"
# Module-level pipeline handle; stays None until load_model() assigns it.
pipe = None
def load_model():
    """Build the speech-recognition pipeline and store it in the global ``pipe``.

    The pipeline is created for ``model_id`` on ``device``. Every call
    constructs a new pipeline and rebinds ``pipe`` to it.
    """
    global pipe
    asr_pipeline = pipeline(
        task="automatic-speech-recognition",
        model=model_id,
        device=device,
    )
    pipe = asr_pipeline
def transcribe_audio_local(audio: str) -> str:
    """Run the local pipeline on ``audio`` and return the recognized text.

    The pipeline is created on first use via ``load_model()`` when the
    module-level ``pipe`` is still ``None``. Both the input and the raw
    pipeline output are printed for debugging.

    Args:
        audio: Value forwarded unchanged to the pipeline
            (presumably a path to an audio file -- confirm against callers).

    Returns:
        The ``"text"`` entry of the pipeline output.
    """
    print(f"{audio=}")

    # Lazy initialisation: only build the pipeline when nobody has yet.
    if pipe is None:
        load_model()

    # Read the global again here so a freshly loaded pipeline is picked up.
    recognizer = pipe
    out = recognizer(audio)
    print(f"{out=}")

    transcript = out["text"]
    return transcript