Spaces:

MothersTongue
/

voice-matcher-api

Running on T4

App Files Community

arnabg95 committed on Jun 21, 2024

Commit

82f2206

1 Parent(s): b4a191d

model updated

Browse files

Files changed (2) hide show

app/passing.py +4 -4
app/routers/V1/voice/voice_router.py +19 -18

app/passing.py CHANGED Viewed

@@ -17,10 +17,10 @@ def calculate_passing(sequence, phonetic, cosine=0, euclidean=0, passing_thresho
     # Calculate the weighted average
     weights = {
-        'sequence': 0.50,
-        'phonetic': 0.50,
-        'cosine': 0,
-        'euclidean': 0
     }
     weighted_score = (

     # Calculate the weighted average
     weights = {
+        'sequence': 0.35,
+        'phonetic': 0.35,
+        'cosine': 0.15,
+        'euclidean': 0.15
     }
     weighted_score = (

app/routers/V1/voice/voice_router.py CHANGED Viewed

@@ -23,25 +23,25 @@ async def transcribe_audio(
 ):
     try:
         # Validate URL
-        # if not original_url.endswith(".wav"):
-        #     raise HTTPException(
-        #         status_code=status.HTTP_400_BAD_REQUEST,
-        #         detail="Invalid URL. Please provide a URL pointing to a wav file.",
-        #     )
-        # # Download the audio file from the URL
-        # response = requests.get(original_url)
-        # if response.status_code != 200:
-        #     raise HTTPException(
-        #         status_code=status.HTTP_400_BAD_REQUEST,
-        #         detail="Unable to download the audio file from the URL.",
-        #     )
-        # filename_original = f"audio_{int(time.time())}_original.wav"
-        # # Save the downloaded file temporarily
-        # with open(filename_original, "wb") as buffer:
-        #     buffer.write(response.content)
         # Read file bytes
         recorded_bytes = await recorded.read()
@@ -55,7 +55,8 @@ async def transcribe_audio(
             text = get_transcription(filename_recorded)
             text = clean_transcription(text)
             sequence, phonetic = match(matcher_text, text)
-            weighted_score, is_passing = calculate_passing(sequence, phonetic)
             return JSONResponse(
                 {
                     "transcription": text,
@@ -65,7 +66,7 @@ async def transcribe_audio(
             )
         finally:
             # Clean up the temporary file
-            # os.remove(filename_original)
             os.remove(filename_recorded)
     except Exception as e:

 ):
     try:
         # Validate URL
+        if not original_url.endswith(".wav"):
+            raise HTTPException(
+                status_code=status.HTTP_400_BAD_REQUEST,
+                detail="Invalid URL. Please provide a URL pointing to a wav file.",
+            )
+        # Download the audio file from the URL
+        response = requests.get(original_url)
+        if response.status_code != 200:
+            raise HTTPException(
+                status_code=status.HTTP_400_BAD_REQUEST,
+                detail="Unable to download the audio file from the URL.",
+            )
+        filename_original = f"audio_{int(time.time())}_original.wav"
+        # Save the downloaded file temporarily
+        with open(filename_original, "wb") as buffer:
+            buffer.write(response.content)
         # Read file bytes
         recorded_bytes = await recorded.read()
             text = get_transcription(filename_recorded)
             text = clean_transcription(text)
             sequence, phonetic = match(matcher_text, text)
+            Euclidean, Cosine = mfcc_similarty_check(filename_original, filename_recorded)
+            weighted_score, is_passing = calculate_passing(sequence, phonetic, Cosine, Euclidean)
             return JSONResponse(
                 {
                     "transcription": text,
             )
         finally:
             # Clean up the temporary file
+            os.remove(filename_original)
             os.remove(filename_recorded)
     except Exception as e: