Spaces:
Runtime error
Runtime error
Adjust app to support the use of cleaner model interface
Browse files
- app.py +7 -7
- requirements.txt +7 -1
app.py
CHANGED
@@ -1,19 +1,19 @@
|
|
1 |
import streamlit as st
|
2 |
-
import torch
|
3 |
-
from transformers import Wav2Vec2ForCTC, Wav2Vec2Processor
|
4 |
from speechbrain.pretrained import GraphemeToPhoneme
|
5 |
import os
|
6 |
import torchaudio
|
7 |
from wav2vecasr.MispronounciationDetector import MispronounciationDetector
|
|
|
|
|
8 |
|
9 |
@st.cache_resource
|
10 |
def load_model():
|
11 |
-
|
12 |
-
|
13 |
-
|
14 |
-
|
15 |
g2p = GraphemeToPhoneme.from_hparams("speechbrain/soundchoice-g2p")
|
16 |
-
mispronounciation_detector = MispronounciationDetector(
|
17 |
return mispronounciation_detector
|
18 |
|
19 |
|
|
|
1 |
import streamlit as st
|
|
|
|
|
2 |
from speechbrain.pretrained import GraphemeToPhoneme
|
3 |
import os
|
4 |
import torchaudio
|
5 |
from wav2vecasr.MispronounciationDetector import MispronounciationDetector
|
6 |
+
from wav2vecasr.PhonemeASRModel import Wav2Vec2PhonemeASRModel, Wav2Vec2OptimisedPhonemeASRModel
|
7 |
+
|
8 |
|
9 |
@st.cache_resource
|
10 |
def load_model():
|
11 |
+
path = os.path.join(os.getcwd(), "wav2vecasr", "model", "checkpoint-600")
|
12 |
+
asr_model = Wav2Vec2OptimisedPhonemeASRModel(path, os.path.join(path, "wav2vec2_vocab_final.json"),
|
13 |
+
os.path.join(os.getcwd(), "wav2vecasr", "pretrained_models",
|
14 |
+
"ken-lm-ngram"))
|
15 |
g2p = GraphemeToPhoneme.from_hparams("speechbrain/soundchoice-g2p")
|
16 |
+
mispronounciation_detector = MispronounciationDetector(asr_model, g2p, "cpu")
|
17 |
return mispronounciation_detector
|
18 |
|
19 |
|
requirements.txt
CHANGED
@@ -4,7 +4,7 @@ altair==5.1.2
|
|
4 |
async-timeout==4.0.3
|
5 |
attrs==23.1.0
|
6 |
audioread==3.0.1
|
7 |
-
backports.zoneinfo
|
8 |
blinker==1.6.3
|
9 |
cachetools==5.3.1
|
10 |
certifi==2023.7.22
|
@@ -15,6 +15,7 @@ colorama==0.4.6
|
|
15 |
datasets==1.18.3
|
16 |
decorator==5.1.1
|
17 |
dill==0.3.7
|
|
|
18 |
filelock==3.12.4
|
19 |
frozenlist==1.4.0
|
20 |
fsspec==2023.9.2
|
@@ -22,6 +23,7 @@ gitdb==4.0.10
|
|
22 |
GitPython==3.1.37
|
23 |
huggingface-hub==0.17.3
|
24 |
HyperPyYAML==1.2.2
|
|
|
25 |
idna==3.4
|
26 |
importlib-metadata==6.8.0
|
27 |
importlib-resources==6.1.0
|
@@ -30,6 +32,7 @@ jiwer==3.0.3
|
|
30 |
joblib==1.3.2
|
31 |
jsonschema==4.19.1
|
32 |
jsonschema-specifications==2023.7.1
|
|
|
33 |
lazy_loader==0.3
|
34 |
librosa==0.10.1
|
35 |
llvmlite==0.41.0
|
@@ -52,8 +55,10 @@ pooch==1.7.0
|
|
52 |
protobuf==4.24.4
|
53 |
pyarrow==13.0.0
|
54 |
pycparser==2.21
|
|
|
55 |
pydeck==0.8.1b0
|
56 |
Pygments==2.16.1
|
|
|
57 |
python-dateutil==2.8.2
|
58 |
pytz==2023.3.post1
|
59 |
PyYAML==6.0.1
|
@@ -71,6 +76,7 @@ scipy==1.10.1
|
|
71 |
sentencepiece==0.1.99
|
72 |
six==1.16.0
|
73 |
smmap==5.0.1
|
|
|
74 |
soundfile==0.12.1
|
75 |
soxr==0.3.7
|
76 |
speechbrain==0.5.15
|
|
|
4 |
async-timeout==4.0.3
|
5 |
attrs==23.1.0
|
6 |
audioread==3.0.1
|
7 |
+
backports.zoneinfo==0.2.1
|
8 |
blinker==1.6.3
|
9 |
cachetools==5.3.1
|
10 |
certifi==2023.7.22
|
|
|
15 |
datasets==1.18.3
|
16 |
decorator==5.1.1
|
17 |
dill==0.3.7
|
18 |
+
exceptiongroup==1.1.3
|
19 |
filelock==3.12.4
|
20 |
frozenlist==1.4.0
|
21 |
fsspec==2023.9.2
|
|
|
23 |
GitPython==3.1.37
|
24 |
huggingface-hub==0.17.3
|
25 |
HyperPyYAML==1.2.2
|
26 |
+
hypothesis==6.88.1
|
27 |
idna==3.4
|
28 |
importlib-metadata==6.8.0
|
29 |
importlib-resources==6.1.0
|
|
|
32 |
joblib==1.3.2
|
33 |
jsonschema==4.19.1
|
34 |
jsonschema-specifications==2023.7.1
|
35 |
+
kenlm @ https://github.com/kpu/kenlm/archive/master.zip
|
36 |
lazy_loader==0.3
|
37 |
librosa==0.10.1
|
38 |
llvmlite==0.41.0
|
|
|
55 |
protobuf==4.24.4
|
56 |
pyarrow==13.0.0
|
57 |
pycparser==2.21
|
58 |
+
pyctcdecode==0.5.0
|
59 |
pydeck==0.8.1b0
|
60 |
Pygments==2.16.1
|
61 |
+
pygtrie==2.5.0
|
62 |
python-dateutil==2.8.2
|
63 |
pytz==2023.3.post1
|
64 |
PyYAML==6.0.1
|
|
|
76 |
sentencepiece==0.1.99
|
77 |
six==1.16.0
|
78 |
smmap==5.0.1
|
79 |
+
sortedcontainers==2.4.0
|
80 |
soundfile==0.12.1
|
81 |
soxr==0.3.7
|
82 |
speechbrain==0.5.15
|