asahi417 committed on
Commit
f1a4af3
·
verified ·
1 Parent(s): 3d437ce

Update benchmark_hf_pipeline.py

Browse files
Files changed (1) hide show
  1. benchmark_hf_pipeline.py +9 -7
benchmark_hf_pipeline.py CHANGED
@@ -13,13 +13,15 @@ pipe = pipeline(
13
  chunk_length_s=15,
14
  batch_size=64
15
  )
16
-
17
- # load sample audio (concatenate instances to create a long audio)
18
- dataset = load_dataset("kotoba-tech/kotoba-whisper-eval", split="train")
19
- x = dataset['audio'][0]
 
 
20
  elapsed = {}
21
- for x in dataset['audio']:
22
  start = time()
23
- transcription = pipe(x.copy(), generate_kwargs=generate_kwargs)
24
- elapsed[x['path']] = time() - start
25
  pprint(elapsed)
 
13
  chunk_length_s=15,
14
  batch_size=64
15
  )
16
+ test_audio = [
17
+ "kotoba-whisper-eval/audio/long_interview_1.wav",
18
+ "kotoba-whisper-eval/audio/manzai1.wav",
19
+ "kotoba-whisper-eval/audio/manzai2.wav",
20
+ "kotoba-whisper-eval/audio/manzai3.wav"
21
+ ]
22
  elapsed = {}
23
+ for x in test_audio:
24
  start = time()
25
+ transcription = pipe(x, generate_kwargs=generate_kwargs)
26
+ elapsed[x] = time() - start
27
  pprint(elapsed)