Spaces:

pythonitalia
/

realtime-transcription

Build error

App Files Community

rrevo committed on Jan 13, 2024

Commit

1ba4a0c

1 Parent(s): 6e090f6

http

Browse files

Files changed (4) hide show

client/pdm.lock +66 -1
client/pyproject.toml +1 -0
client/src/main.py +8 -1
server/src/main.py +3 -3

client/pdm.lock CHANGED Viewed

@@ -5,7 +5,7 @@
 groups = ["default"]
 strategy = ["cross_platform"]
 lock_version = "4.4"
-content_hash = "sha256:89d7b04abcb48301359df73888824b63edc037d5a7cdbdfa64bf22c7352dc2a9"
 [[package]]
 name = "accelerate"
@@ -26,6 +26,20 @@ files = [
     {file = "accelerate-0.26.1.tar.gz", hash = "sha256:bf63716b6bd9460d87da970cf4d833abb824ca0aa633be36b741e63a1b504f89"},
 ]
 [[package]]
 name = "certifi"
 version = "2023.11.17"
@@ -106,6 +120,47 @@ files = [
     {file = "fsspec-2023.12.2.tar.gz", hash = "sha256:8548d39e8810b59c38014934f6b31e57f40c1b20f911f4cc2b85389c7e9bf0cb"},
 ]
 [[package]]
 name = "huggingface-hub"
 version = "0.20.2"
@@ -526,6 +581,16 @@ files = [
     {file = "safetensors-0.4.1.tar.gz", hash = "sha256:2304658e6ada81a5223225b4efe84748e760c46079bffedf7e321763cafb36c9"},
 ]
 [[package]]
 name = "speechrecognition"
 version = "3.10.1"

 groups = ["default"]
 strategy = ["cross_platform"]
 lock_version = "4.4"
+content_hash = "sha256:cb77a02fed8fa68d3cdbb9acec8b4eb8cd20809e92c3fb5f5195bcb1e80fedb7"
 [[package]]
 name = "accelerate"
     {file = "accelerate-0.26.1.tar.gz", hash = "sha256:bf63716b6bd9460d87da970cf4d833abb824ca0aa633be36b741e63a1b504f89"},
 ]
+[[package]]
+name = "anyio"
+version = "4.2.0"
+requires_python = ">=3.8"
+summary = "High level compatibility layer for multiple asynchronous event loop implementations"
+dependencies = [
+    "idna>=2.8",
+    "sniffio>=1.1",
+]
+files = [
+    {file = "anyio-4.2.0-py3-none-any.whl", hash = "sha256:745843b39e829e108e518c489b31dc757de7d2131d53fac32bd8df268227bfee"},
+    {file = "anyio-4.2.0.tar.gz", hash = "sha256:e1875bb4b4e2de1669f4bc7869b6d3f54231cdced71605e6e64c9be77e3be50f"},
+]
 [[package]]
 name = "certifi"
 version = "2023.11.17"
     {file = "fsspec-2023.12.2.tar.gz", hash = "sha256:8548d39e8810b59c38014934f6b31e57f40c1b20f911f4cc2b85389c7e9bf0cb"},
 ]
+[[package]]
+name = "h11"
+version = "0.14.0"
+requires_python = ">=3.7"
+summary = "A pure-Python, bring-your-own-I/O implementation of HTTP/1.1"
+files = [
+    {file = "h11-0.14.0-py3-none-any.whl", hash = "sha256:e3fe4ac4b851c468cc8363d500db52c2ead036020723024a109d37346efaa761"},
+    {file = "h11-0.14.0.tar.gz", hash = "sha256:8f19fbbe99e72420ff35c00b27a34cb9937e902a8b810e2c88300c6f0a3b699d"},
+]
+[[package]]
+name = "httpcore"
+version = "1.0.2"
+requires_python = ">=3.8"
+summary = "A minimal low-level HTTP client."
+dependencies = [
+    "certifi",
+    "h11<0.15,>=0.13",
+]
+files = [
+    {file = "httpcore-1.0.2-py3-none-any.whl", hash = "sha256:096cc05bca73b8e459a1fc3dcf585148f63e534eae4339559c9b8a8d6399acc7"},
+    {file = "httpcore-1.0.2.tar.gz", hash = "sha256:9fc092e4799b26174648e54b74ed5f683132a464e95643b226e00c2ed2fa6535"},
+]
+[[package]]
+name = "httpx"
+version = "0.26.0"
+requires_python = ">=3.8"
+summary = "The next generation HTTP client."
+dependencies = [
+    "anyio",
+    "certifi",
+    "httpcore==1.*",
+    "idna",
+    "sniffio",
+]
+files = [
+    {file = "httpx-0.26.0-py3-none-any.whl", hash = "sha256:8915f5a3627c4d47b73e8202457cb28f1266982d1159bd5779d86a80c0eab1cd"},
+    {file = "httpx-0.26.0.tar.gz", hash = "sha256:451b55c30d5185ea6b23c2c793abf9bb237d2a7dfb901ced6ff69ad37ec1dfaf"},
+]
 [[package]]
 name = "huggingface-hub"
 version = "0.20.2"
     {file = "safetensors-0.4.1.tar.gz", hash = "sha256:2304658e6ada81a5223225b4efe84748e760c46079bffedf7e321763cafb36c9"},
 ]
+[[package]]
+name = "sniffio"
+version = "1.3.0"
+requires_python = ">=3.7"
+summary = "Sniff out which async library your code is running under"
+files = [
+    {file = "sniffio-1.3.0-py3-none-any.whl", hash = "sha256:eecefdce1e5bbfb7ad2eeaabf7c1eeb404d7757c379bd1f7e5cce9d8bf425384"},
+    {file = "sniffio-1.3.0.tar.gz", hash = "sha256:e60305c5e5d314f5389259b7f22aaa33d8f7dee49763119234af3755c55b9101"},
+]
 [[package]]
 name = "speechrecognition"
 version = "3.10.1"

client/pyproject.toml CHANGED Viewed

@@ -10,6 +10,7 @@ dependencies = [
     "PyAudio>=0.2.14",
     "SpeechRecognition>=3.10.1",
     "transformers[torch]>=4.36.2",
 ]
 requires-python = ">=3.11"
 readme = "README.md"

     "PyAudio>=0.2.14",
     "SpeechRecognition>=3.10.1",
     "transformers[torch]>=4.36.2",
+    "httpx>=0.26.0",
 ]
 requires-python = ">=3.11"
 readme = "README.md"

client/src/main.py CHANGED Viewed

@@ -1,3 +1,4 @@
 from queue import Queue
 import logging
 from datetime import UTC, datetime, timedelta
@@ -10,6 +11,9 @@ from audio_utils import get_microphone, get_speech_recognizer, get_all_audio_que
 logger = logging.getLogger(__name__)
 def main():
     recording_duration = 2
     sample_rate = 16000
@@ -48,7 +52,10 @@ def main():
                 if current_audio_chunk.is_complete:
                     serialized = pickle.dumps(current_audio_chunk.audio_array)
-                    print('chunk done', serialized)
                     # text = transcribe_model.transcribe(current_audio_chunk.audio_array)
                     # sentence = Sentence(
                     #     start_time=current_audio_chunk.start_time, end_time=current_audio_chunk.end_time, text=text

+import httpx
 from queue import Queue
 import logging
 from datetime import UTC, datetime, timedelta
 logger = logging.getLogger(__name__)
+TRANSCRIBING_SERVER = "http://localhost:3535/transcribe"
 def main():
     recording_duration = 2
     sample_rate = 16000
                 if current_audio_chunk.is_complete:
                     serialized = pickle.dumps(current_audio_chunk.audio_array)
+                    response = httpx.post(TRANSCRIBING_SERVER, data=serialized)
+                    print('chunk done', response.text, response.status_code)
                     # text = transcribe_model.transcribe(current_audio_chunk.audio_array)
                     # sentence = Sentence(
                     #     start_time=current_audio_chunk.start_time, end_time=current_audio_chunk.end_time, text=text

server/src/main.py CHANGED Viewed

@@ -10,6 +10,6 @@ def read_root():
     return {"status": "ok"}
-@app.get("/items/{item_id}")
-def read_item(item_id: int, q: Union[str, None] = None):
-    return {"item_id": item_id, "q": q}

     return {"status": "ok"}
+@app.post("/transcribe")
+def transcribe(audio: bytes):
+    return {"transcribe": "hello"}