File size: 1,240 Bytes
b1426fb |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 |
"""
Speaker Diarization Model Handler
Manages the pyannote-audio model for speaker diarization tasks.
"""
from pyannote.audio import Pipeline
import streamlit as st
class SpeakerDiarizer:
def __init__(self, token: str):
"""Initialize the diarization model.
Args:
token (str): HuggingFace authentication token
"""
self.token = token
self.model = None
def load_model(self):
"""Load the pyannote speaker diarization model."""
try:
self.model = Pipeline.from_pretrained(
"pyannote/speaker-diarization",
use_auth_token=self.token
)
return self.model
except Exception as e:
st.error(f"Error loading diarization model: {str(e)}")
return None
def process(self, audio_path: str):
"""Process audio file for speaker diarization.
Args:
audio_path (str): Path to the audio file
Returns:
dict: Diarization results
"""
try:
return self.model(audio_path)
except Exception as e:
st.error(f"Error in diarization: {str(e)}")
return None |