Short-Faceless / utility /text_audio_cleaner.py
codewithdark's picture
Upload 9 files
9b70717 verified
raw
history blame
1.3 kB
import re
import os
from pydub import AudioSegment
def clean_text(text):
    """
    Remove punctuation/symbols from ``text`` and trim surrounding whitespace.

    Every character that is neither a word character nor whitespace is
    deleted (not replaced by a space), so ``"a,b"`` becomes ``"ab"``.
    Underscores are deleted as well: ``\\w`` matches ``_``, so the plain
    ``[^\\w\\s]`` class would let them through even though they are
    punctuation.

    Args:
        text: The string to clean.

    Returns:
        The cleaned string. Internal whitespace is left untouched; only
        leading and trailing whitespace is stripped.
    """
    # `[^\w\s]` covers ordinary punctuation; `|_` additionally catches the
    # underscore, which `\w` would otherwise protect.
    without_symbols = re.sub(r"[^\w\s]|_", "", text)
    return without_symbols.strip()
def process_audio(audio_path, output_path):
    """
    Normalize an audio file and write the result in WAV format.

    Args:
        audio_path: Path of the audio file to load.
        output_path: Path the normalized WAV data is written to.

    Returns:
        ``output_path`` on success, or ``None`` if loading, normalizing or
        exporting failed. Failures are printed rather than raised so callers
        can treat this step as best-effort.
    """
    try:
        audio = AudioSegment.from_file(audio_path)
        # Simple normalization (more sophisticated methods can be added here).
        normalized_audio = audio.normalize()
        # export() returns the file object it wrote to; close it explicitly
        # instead of relying on garbage collection to release the handle.
        exported_file = normalized_audio.export(output_path, format="wav")
        exported_file.close()
        return output_path
    except Exception as e:
        # Deliberately broad: any failure is reported and signalled via None.
        print(f"Error processing audio: {e}")
        return None
def convert_to_wav(input_file):
    """
    Convert an audio file to WAV format.

    The WAV file is written next to the input, using the input path with its
    extension replaced by ``.wav``.

    Args:
        input_file: Path of the audio file to convert.

    Returns:
        The path of the written WAV file, or ``None`` if loading or exporting
        failed. Failures are printed rather than raised.
    """
    try:
        # Load the audio file
        audio = AudioSegment.from_file(input_file)
        # Define the output WAV file path.
        # NOTE: if input_file already ends in ".wav" this is the same path,
        # so the input is re-encoded and overwritten in place.
        output_wav = os.path.splitext(input_file)[0] + ".wav"
        # Export the audio to WAV format. export() returns the file object it
        # wrote to; close it explicitly so the handle is not left open.
        exported_file = audio.export(output_wav, format="wav")
        exported_file.close()
        return output_wav
    except Exception as e:
        # Deliberately broad: any failure is reported and signalled via None.
        print(f"Error converting to WAV: {e}")
        return None