Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -7,8 +7,10 @@ from pydub import AudioSegment
|
|
7 |
import os
|
8 |
import scipy.signal as signal
|
9 |
import torch
|
10 |
-
|
11 |
from pydub.silence import detect_nonsilent # Correct import
|
|
|
|
|
12 |
|
13 |
hf_token = os.getenv('diarizationToken')
|
14 |
|
@@ -29,26 +31,28 @@ def remove_phone_tonalities(audio, sr):
|
|
29 |
filtered_audio = signal.filtfilt(b, a, audio)
|
30 |
return filtered_audio
|
31 |
|
|
|
|
|
32 |
def convert_audio_to_wav(audio_path):
|
33 |
-
#
|
34 |
-
|
35 |
-
|
36 |
-
|
37 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
38 |
|
39 |
|
40 |
|
41 |
-
import gradio as gr
|
42 |
-
import librosa
|
43 |
-
import numpy as np
|
44 |
-
import whisperx
|
45 |
-
from transformers import pipeline
|
46 |
-
from pydub import AudioSegment
|
47 |
-
import os
|
48 |
-
import scipy.signal as signal
|
49 |
-
import torch
|
50 |
-
import pandas as pd
|
51 |
-
from pydub.silence import detect_nonsilent
|
52 |
|
53 |
hf_token = os.getenv('diarizationToken')
|
54 |
|
@@ -70,6 +74,8 @@ def remove_phone_tonalities(audio, sr):
|
|
70 |
filtered_audio = signal.filtfilt(b, a, audio)
|
71 |
return filtered_audio
|
72 |
|
|
|
|
|
73 |
def process_audio(audio_path):
|
74 |
print(f"Received audio file: {audio_path}")
|
75 |
|
|
|
7 |
import os
|
8 |
import scipy.signal as signal
|
9 |
import torch
|
10 |
+
from pydub.utils import mediainfo
|
11 |
from pydub.silence import detect_nonsilent # Correct import
|
12 |
+
import pandas as pd
|
13 |
+
|
14 |
|
15 |
hf_token = os.getenv('diarizationToken')
|
16 |
|
|
|
31 |
filtered_audio = signal.filtfilt(b, a, audio)
|
32 |
return filtered_audio
|
33 |
|
34 |
+
|
35 |
+
|
36 |
def convert_audio_to_wav(audio_path):
    """Convert an audio file to WAV and return the path of the converted file.

    The container format reported by ``mediainfo`` is validated first; the
    file is then loaded with ``AudioSegment.from_file`` and exported as WAV
    to ``converted_audio.wav`` (a fixed, relative path).

    Args:
        audio_path: Path of the input audio file.

    Returns:
        The path of the exported WAV file (``"converted_audio.wav"``).

    Raises:
        ValueError: If the format cannot be determined, or is not one of the
            supported formats.
        Exception: Any error raised while loading or exporting the audio is
            printed and then re-raised unchanged.
    """
    # Add other valid formats if necessary
    supported_formats = {'wav', 'mp3', 'flac', 'ogg'}

    # Check the audio file format before conversion
    audio_info = mediainfo(audio_path)
    print(f"Audio file info: {audio_info}")

    # The probe result is not guaranteed to contain 'format_name' (presumably
    # it is missing when probing fails -- verify against pydub), so read it
    # defensively and report a ValueError instead of leaking a bare KeyError.
    format_name = audio_info.get('format_name', '')

    # The reported name may be a comma-separated list of aliases for a single
    # container, so accept the file when any one alias is supported.
    detected_formats = {
        alias.strip() for alias in format_name.split(',') if alias.strip()
    }
    if not detected_formats & supported_formats:
        raise ValueError(f"Unsupported audio format: {format_name or 'unknown'}")

    try:
        # Convert any audio format to WAV using pydub
        sound = AudioSegment.from_file(audio_path)
        # NOTE(review): the output path is fixed, so every call overwrites
        # the previous conversion -- confirm this is acceptable for callers.
        wav_path = "converted_audio.wav"
        sound.export(wav_path, format="wav")
        return wav_path
    except Exception as e:
        print(f"Error converting audio: {e}")
        raise
|
53 |
|
54 |
|
55 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
56 |
|
57 |
hf_token = os.getenv('diarizationToken')
|
58 |
|
|
|
74 |
filtered_audio = signal.filtfilt(b, a, audio)
|
75 |
return filtered_audio
|
76 |
|
77 |
+
|
78 |
+
|
79 |
def process_audio(audio_path):
|
80 |
print(f"Received audio file: {audio_path}")
|
81 |
|