kotoba-whisper-v2.2 / pipeline /test_pipeline.py
asahi417's picture
init
4f38470
raw
history blame
587 Bytes
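"""Run the kotoba-whisper-v2.2 pipeline on the sample audio and print the results.

Download the sample audio into the working directory first:

    wget https://huggingface.co/kotoba-tech/kotoba-whisper-v2.2/resolve/main/sample_audio/sample_diarization_japanese.mp3
"""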
from pprint import pprint
from transformers.pipelines import pipeline
# Extra keyword arguments layered on top of the shared configuration, one
# entry per run: first the plain configuration, then the same configuration
# with return_unique_speaker=False.
for extra_kwargs in ({}, {"return_unique_speaker": False}):
    # A fresh pipeline is constructed for every run, so the extra option is
    # supplied at construction time rather than at call time.
    pipe = pipeline(
        model="kotoba-tech/kotoba-whisper-v2.2",
        chunk_length_s=None,
        batch_size=16,
        trust_remote_code=True,
        **extra_kwargs,
    )
    # The audio file is expected in the current working directory.
    output = pipe("sample_diarization_japanese.mp3")
    pprint(output)