import re import os from pydub import AudioSegment def clean_text(text): """ Removes symbols and cleans the input text. """ text = re.sub(r'[^\w\s]', '', text) # Remove punctuation text = text.strip() # Remove leading/trailing whitespace return text def process_audio(audio_path, output_path): """ Cleans and normalizes the audio. """ try: audio = AudioSegment.from_file(audio_path) # Simple normalization (you can add more sophisticated methods) normalized_audio = audio.normalize() normalized_audio.export(output_path, format="wav") return output_path except Exception as e: print(f"Error processing audio: {e}") return None def convert_to_wav(input_file): """ Convert any audio file to WAV format. """ try: # Load the audio file audio = AudioSegment.from_file(input_file) # Define the output WAV file path output_wav = os.path.splitext(input_file)[0] + ".wav" # Export the audio to WAV format audio.export(output_wav, format="wav") return output_wav except Exception as e: print(f"Error converting to WAV: {e}") return None