IT2091024v2

Paused

App Files Community

Pijush2023 committed on Aug 11, 2024

Commit

83586d7

verified ·

1 Parent(s): 91df8fc

Update app.py

Browse files

Files changed (1) hide show

app.py +37 -4

app.py CHANGED Viewed

@@ -442,6 +442,26 @@ base_audio_drive = "/data/audio"
 #Normal Code with sample rate is 44100 Hz
 def transcribe_function(stream, new_chunk):
     try:
         sr, y = new_chunk[0], new_chunk[1]
@@ -449,16 +469,29 @@ def transcribe_function(stream, new_chunk):
         print(f"Error chunk structure: {type(new_chunk)}, content: {new_chunk}")
         return stream, "", None
-    y = y.astype(np.float32) / np.max(np.abs(y))
     if stream is not None:
-        stream = np.concatenate([stream, y])
     else:
-        stream = y
     result = pipe_asr({"array": stream, "sampling_rate": sr}, return_timestamps=False)
-    full_text = result.get("text","")
     return stream, full_text, result

 #Normal Code with sample rate is 44100 Hz
+# def transcribe_function(stream, new_chunk):
+#     try:
+#         sr, y = new_chunk[0], new_chunk[1]
+#     except TypeError:
+#         print(f"Error chunk structure: {type(new_chunk)}, content: {new_chunk}")
+#         return stream, "", None
+#     y = y.astype(np.float32) / np.max(np.abs(y))
+#     if stream is not None:
+#         stream = np.concatenate([stream, y])
+#     else:
+#         stream = y
+#     result = pipe_asr({"array": stream, "sampling_rate": sr}, return_timestamps=False)
+#     full_text = result.get("text","")
+#     return stream, full_text, result
 def transcribe_function(stream, new_chunk):
     try:
         sr, y = new_chunk[0], new_chunk[1]
         print(f"Error chunk structure: {type(new_chunk)}, content: {new_chunk}")
         return stream, "", None
+    # Check if the array is empty
+    if y.size == 0:
+        print("Received an empty audio chunk, skipping processing.")
+        return stream, "", None
+    y = y.astype(np.float32)
+    # Check if y is all zeros or contains no valid data
+    if np.max(np.abs(y)) == 0:
+        print("Audio chunk contains only zeros, skipping normalization.")
+        normalized_y = y
+    else:
+        normalized_y = y / np.max(np.abs(y))
     if stream is not None:
+        stream = np.concatenate([stream, normalized_y])
     else:
+        stream = normalized_y
+    # Placeholder for ASR pipeline; replace with actual pipeline
     result = pipe_asr({"array": stream, "sampling_rate": sr}, return_timestamps=False)
+    full_text = result.get("text", "")
     return stream, full_text, result