bel32123 committed on
Commit
31ac586
·
1 Parent(s): 00b49e2

Adjust app to support the use of a cleaner model interface

Browse files
Files changed (2) hide show
  1. app.py +7 -7
  2. requirements.txt +7 -1
app.py CHANGED
@@ -1,19 +1,19 @@
1
  import streamlit as st
2
- import torch
3
- from transformers import Wav2Vec2ForCTC, Wav2Vec2Processor
4
  from speechbrain.pretrained import GraphemeToPhoneme
5
  import os
6
  import torchaudio
7
  from wav2vecasr.MispronounciationDetector import MispronounciationDetector
 
 
8
 
9
  @st.cache_resource
10
  def load_model():
11
- device = "cuda" if torch.cuda.is_available() else "cpu"
12
- path = os.path.join(os.getcwd(), "wav2vecasr", "model", "checkpoint-1200")
13
- model = Wav2Vec2ForCTC.from_pretrained(path).to(device)
14
- processor = Wav2Vec2Processor.from_pretrained(path)
15
  g2p = GraphemeToPhoneme.from_hparams("speechbrain/soundchoice-g2p")
16
- mispronounciation_detector = MispronounciationDetector(model, processor, g2p, "cpu")
17
  return mispronounciation_detector
18
 
19
 
 
1
  import streamlit as st
 
 
2
  from speechbrain.pretrained import GraphemeToPhoneme
3
  import os
4
  import torchaudio
5
  from wav2vecasr.MispronounciationDetector import MispronounciationDetector
6
+ from wav2vecasr.PhonemeASRModel import Wav2Vec2PhonemeASRModel, Wav2Vec2OptimisedPhonemeASRModel
7
+
8
 
9
  @st.cache_resource
10
  def load_model():
11
+ path = os.path.join(os.getcwd(), "wav2vecasr", "model", "checkpoint-600")
12
+ asr_model = Wav2Vec2OptimisedPhonemeASRModel(path, os.path.join(path, "wav2vec2_vocab_final.json"),
13
+ os.path.join(os.getcwd(), "wav2vecasr", "pretrained_models",
14
+ "ken-lm-ngram"))
15
  g2p = GraphemeToPhoneme.from_hparams("speechbrain/soundchoice-g2p")
16
+ mispronounciation_detector = MispronounciationDetector(asr_model, g2p, "cpu")
17
  return mispronounciation_detector
18
 
19
 
requirements.txt CHANGED
@@ -4,7 +4,7 @@ altair==5.1.2
4
  async-timeout==4.0.3
5
  attrs==23.1.0
6
  audioread==3.0.1
7
- backports.zoneinfo;python_version<"3.9"
8
  blinker==1.6.3
9
  cachetools==5.3.1
10
  certifi==2023.7.22
@@ -15,6 +15,7 @@ colorama==0.4.6
15
  datasets==1.18.3
16
  decorator==5.1.1
17
  dill==0.3.7
 
18
  filelock==3.12.4
19
  frozenlist==1.4.0
20
  fsspec==2023.9.2
@@ -22,6 +23,7 @@ gitdb==4.0.10
22
  GitPython==3.1.37
23
  huggingface-hub==0.17.3
24
  HyperPyYAML==1.2.2
 
25
  idna==3.4
26
  importlib-metadata==6.8.0
27
  importlib-resources==6.1.0
@@ -30,6 +32,7 @@ jiwer==3.0.3
30
  joblib==1.3.2
31
  jsonschema==4.19.1
32
  jsonschema-specifications==2023.7.1
 
33
  lazy_loader==0.3
34
  librosa==0.10.1
35
  llvmlite==0.41.0
@@ -52,8 +55,10 @@ pooch==1.7.0
52
  protobuf==4.24.4
53
  pyarrow==13.0.0
54
  pycparser==2.21
 
55
  pydeck==0.8.1b0
56
  Pygments==2.16.1
 
57
  python-dateutil==2.8.2
58
  pytz==2023.3.post1
59
  PyYAML==6.0.1
@@ -71,6 +76,7 @@ scipy==1.10.1
71
  sentencepiece==0.1.99
72
  six==1.16.0
73
  smmap==5.0.1
 
74
  soundfile==0.12.1
75
  soxr==0.3.7
76
  speechbrain==0.5.15
 
4
  async-timeout==4.0.3
5
  attrs==23.1.0
6
  audioread==3.0.1
7
+ backports.zoneinfo==0.2.1
8
  blinker==1.6.3
9
  cachetools==5.3.1
10
  certifi==2023.7.22
 
15
  datasets==1.18.3
16
  decorator==5.1.1
17
  dill==0.3.7
18
+ exceptiongroup==1.1.3
19
  filelock==3.12.4
20
  frozenlist==1.4.0
21
  fsspec==2023.9.2
 
23
  GitPython==3.1.37
24
  huggingface-hub==0.17.3
25
  HyperPyYAML==1.2.2
26
+ hypothesis==6.88.1
27
  idna==3.4
28
  importlib-metadata==6.8.0
29
  importlib-resources==6.1.0
 
32
  joblib==1.3.2
33
  jsonschema==4.19.1
34
  jsonschema-specifications==2023.7.1
35
+ kenlm @ git+https://github.com/kpu/kenlm/archive/master.zip
36
  lazy_loader==0.3
37
  librosa==0.10.1
38
  llvmlite==0.41.0
 
55
  protobuf==4.24.4
56
  pyarrow==13.0.0
57
  pycparser==2.21
58
+ pyctcdecode==0.5.0
59
  pydeck==0.8.1b0
60
  Pygments==2.16.1
61
+ pygtrie==2.5.0
62
  python-dateutil==2.8.2
63
  pytz==2023.3.post1
64
  PyYAML==6.0.1
 
76
  sentencepiece==0.1.99
77
  six==1.16.0
78
  smmap==5.0.1
79
+ sortedcontainers==2.4.0
80
  soundfile==0.12.1
81
  soxr==0.3.7
82
  speechbrain==0.5.15