cdactvm committed on
Commit
3137a68
·
verified ·
1 Parent(s): b161c5a

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -4
app.py CHANGED
@@ -34,10 +34,10 @@ transcriber_hindi_new = pipeline(task="automatic-speech-recognition", model="cda
34
  processor = AutoProcessor.from_pretrained("cdactvm/w2v-bert-tamil_new")
35
  vocab_dict = processor.tokenizer.get_vocab()
36
  sorted_vocab_dict = {k.lower(): v for k, v in sorted(vocab_dict.items(), key=lambda item: item[1])}
37
- decoder = build_ctcdecoder(
38
- labels=list(sorted_vocab_dict.keys()),
39
- kenlm_model_path="lm.binary",
40
- )
41
  # processor_with_lm = Wav2Vec2ProcessorWithLM(
42
  # feature_extractor=processor.feature_extractor,
43
  # tokenizer=processor.tokenizer,
 
34
  processor = AutoProcessor.from_pretrained("cdactvm/w2v-bert-tamil_new")
35
  vocab_dict = processor.tokenizer.get_vocab()
36
  sorted_vocab_dict = {k.lower(): v for k, v in sorted(vocab_dict.items(), key=lambda item: item[1])}
37
+ # decoder = build_ctcdecoder(
38
+ # labels=list(sorted_vocab_dict.keys()),
39
+ # kenlm_model_path="lm.binary",
40
+ # )
41
  # processor_with_lm = Wav2Vec2ProcessorWithLM(
42
  # feature_extractor=processor.feature_extractor,
43
  # tokenizer=processor.tokenizer,