Spaces:
Runtime error
Runtime error
Adjust app to support the use of the cleaner model interface
Browse files
- app.py +7 -7
- requirements.txt +7 -1
app.py
CHANGED
|
@@ -1,19 +1,19 @@
|
|
| 1 |
import streamlit as st
|
| 2 |
-
import torch
|
| 3 |
-
from transformers import Wav2Vec2ForCTC, Wav2Vec2Processor
|
| 4 |
from speechbrain.pretrained import GraphemeToPhoneme
|
| 5 |
import os
|
| 6 |
import torchaudio
|
| 7 |
from wav2vecasr.MispronounciationDetector import MispronounciationDetector
|
|
|
|
|
|
|
| 8 |
|
| 9 |
@st.cache_resource
|
| 10 |
def load_model():
|
| 11 |
-
|
| 12 |
-
|
| 13 |
-
|
| 14 |
-
|
| 15 |
g2p = GraphemeToPhoneme.from_hparams("speechbrain/soundchoice-g2p")
|
| 16 |
-
mispronounciation_detector = MispronounciationDetector(
|
| 17 |
return mispronounciation_detector
|
| 18 |
|
| 19 |
|
|
|
|
| 1 |
import streamlit as st
|
|
|
|
|
|
|
| 2 |
from speechbrain.pretrained import GraphemeToPhoneme
|
| 3 |
import os
|
| 4 |
import torchaudio
|
| 5 |
from wav2vecasr.MispronounciationDetector import MispronounciationDetector
|
| 6 |
+
from wav2vecasr.PhonemeASRModel import Wav2Vec2PhonemeASRModel, Wav2Vec2OptimisedPhonemeASRModel
|
| 7 |
+
|
| 8 |
|
| 9 |
@st.cache_resource
|
| 10 |
def load_model():
|
| 11 |
+
path = os.path.join(os.getcwd(), "wav2vecasr", "model", "checkpoint-600")
|
| 12 |
+
asr_model = Wav2Vec2OptimisedPhonemeASRModel(path, os.path.join(path, "wav2vec2_vocab_final.json"),
|
| 13 |
+
os.path.join(os.getcwd(), "wav2vecasr", "pretrained_models",
|
| 14 |
+
"ken-lm-ngram"))
|
| 15 |
g2p = GraphemeToPhoneme.from_hparams("speechbrain/soundchoice-g2p")
|
| 16 |
+
mispronounciation_detector = MispronounciationDetector(asr_model, g2p, "cpu")
|
| 17 |
return mispronounciation_detector
|
| 18 |
|
| 19 |
|
requirements.txt
CHANGED
|
@@ -4,7 +4,7 @@ altair==5.1.2
|
|
| 4 |
async-timeout==4.0.3
|
| 5 |
attrs==23.1.0
|
| 6 |
audioread==3.0.1
|
| 7 |
-
backports.zoneinfo
|
| 8 |
blinker==1.6.3
|
| 9 |
cachetools==5.3.1
|
| 10 |
certifi==2023.7.22
|
|
@@ -15,6 +15,7 @@ colorama==0.4.6
|
|
| 15 |
datasets==1.18.3
|
| 16 |
decorator==5.1.1
|
| 17 |
dill==0.3.7
|
|
|
|
| 18 |
filelock==3.12.4
|
| 19 |
frozenlist==1.4.0
|
| 20 |
fsspec==2023.9.2
|
|
@@ -22,6 +23,7 @@ gitdb==4.0.10
|
|
| 22 |
GitPython==3.1.37
|
| 23 |
huggingface-hub==0.17.3
|
| 24 |
HyperPyYAML==1.2.2
|
|
|
|
| 25 |
idna==3.4
|
| 26 |
importlib-metadata==6.8.0
|
| 27 |
importlib-resources==6.1.0
|
|
@@ -30,6 +32,7 @@ jiwer==3.0.3
|
|
| 30 |
joblib==1.3.2
|
| 31 |
jsonschema==4.19.1
|
| 32 |
jsonschema-specifications==2023.7.1
|
|
|
|
| 33 |
lazy_loader==0.3
|
| 34 |
librosa==0.10.1
|
| 35 |
llvmlite==0.41.0
|
|
@@ -52,8 +55,10 @@ pooch==1.7.0
|
|
| 52 |
protobuf==4.24.4
|
| 53 |
pyarrow==13.0.0
|
| 54 |
pycparser==2.21
|
|
|
|
| 55 |
pydeck==0.8.1b0
|
| 56 |
Pygments==2.16.1
|
|
|
|
| 57 |
python-dateutil==2.8.2
|
| 58 |
pytz==2023.3.post1
|
| 59 |
PyYAML==6.0.1
|
|
@@ -71,6 +76,7 @@ scipy==1.10.1
|
|
| 71 |
sentencepiece==0.1.99
|
| 72 |
six==1.16.0
|
| 73 |
smmap==5.0.1
|
|
|
|
| 74 |
soundfile==0.12.1
|
| 75 |
soxr==0.3.7
|
| 76 |
speechbrain==0.5.15
|
|
|
|
| 4 |
async-timeout==4.0.3
|
| 5 |
attrs==23.1.0
|
| 6 |
audioread==3.0.1
|
| 7 |
+
backports.zoneinfo==0.2.1
|
| 8 |
blinker==1.6.3
|
| 9 |
cachetools==5.3.1
|
| 10 |
certifi==2023.7.22
|
|
|
|
| 15 |
datasets==1.18.3
|
| 16 |
decorator==5.1.1
|
| 17 |
dill==0.3.7
|
| 18 |
+
exceptiongroup==1.1.3
|
| 19 |
filelock==3.12.4
|
| 20 |
frozenlist==1.4.0
|
| 21 |
fsspec==2023.9.2
|
|
|
|
| 23 |
GitPython==3.1.37
|
| 24 |
huggingface-hub==0.17.3
|
| 25 |
HyperPyYAML==1.2.2
|
| 26 |
+
hypothesis==6.88.1
|
| 27 |
idna==3.4
|
| 28 |
importlib-metadata==6.8.0
|
| 29 |
importlib-resources==6.1.0
|
|
|
|
| 32 |
joblib==1.3.2
|
| 33 |
jsonschema==4.19.1
|
| 34 |
jsonschema-specifications==2023.7.1
|
| 35 |
+
kenlm @ git+https://github.com/kpu/kenlm/archive/master.zip
|
| 36 |
lazy_loader==0.3
|
| 37 |
librosa==0.10.1
|
| 38 |
llvmlite==0.41.0
|
|
|
|
| 55 |
protobuf==4.24.4
|
| 56 |
pyarrow==13.0.0
|
| 57 |
pycparser==2.21
|
| 58 |
+
pyctcdecode==0.5.0
|
| 59 |
pydeck==0.8.1b0
|
| 60 |
Pygments==2.16.1
|
| 61 |
+
pygtrie==2.5.0
|
| 62 |
python-dateutil==2.8.2
|
| 63 |
pytz==2023.3.post1
|
| 64 |
PyYAML==6.0.1
|
|
|
|
| 76 |
sentencepiece==0.1.99
|
| 77 |
six==1.16.0
|
| 78 |
smmap==5.0.1
|
| 79 |
+
sortedcontainers==2.4.0
|
| 80 |
soundfile==0.12.1
|
| 81 |
soxr==0.3.7
|
| 82 |
speechbrain==0.5.15
|