Update app.py
app.py CHANGED
@@ -1,6 +1,5 @@
 # Transform an audio to text script with language detection.
 # Author: Pratiksha Patel
-
 # Description: This script record the audio, transform it to text, detect the language of the file and save it to a txt file.
 # import required modules
 import os
@@ -9,17 +8,12 @@ import streamlit as st
 from audio_recorder_streamlit import audio_recorder
 from langdetect import detect
 import numpy as np
-# Use a pipeline as a high-level helper
-#from transformers import pipeline
-#pipe = pipeline("automatic-speech-recognition", model="openai/whisper-large")
-# Load model directly
 from transformers import AutoProcessor, AutoModelForSpeechSeq2Seq

 def transcribe_audio(audio_bytes):
     processor = AutoProcessor.from_pretrained("openai/whisper-large")
     model = AutoModelForSpeechSeq2Seq.from_pretrained("openai/whisper-large")
     audio_array = np.frombuffer(audio_bytes, dtype=np.int16)
-    # Cast audio array to double precision and normalize
     audio_tensor = torch.tensor(audio_array, dtype=torch.float64) / 32768.0
     input_values = processor(audio_tensor, return_tensors="pt", sampling_rate=16000).input_values
     logits = model(input_values).logits
@@ -27,17 +21,6 @@ def transcribe_audio(audio_bytes):
     transcription = processor.decode(predicted_ids[0])
     return transcription

-# Function to open a file
-#def startfile(fn):
-# os.system('open %s' % fn)
-
-# Function to create and open a txt file
-#def create_and_open_txt(text, filename):
-# Create and write the text to a txt file
-# with open(filename, "w") as file:
-# file.write(text)
-# startfile(filename)
-
 # Streamlit app
 st.title("Audio to Text Transcription..")

@@ -55,9 +38,3 @@ if audio_bytes:
     st.write("Error: Failed to transcribe audio.")
 else:
     st.write("No audio recorded.")
-# Detect the language
-#language = detect(transcription)
-#st.write(f"Detected language: {language}")
-
-# Create and open a txt file with the text
-#create_and_open_txt(transcription, f"output_{language}.txt")
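The commit also deletes the language-detection and save-to-file block, although the header comment still promises both and from langdetect import detect is kept. A hedged sketch of how that step could be reattached after a successful transcription; detect_and_save is a hypothetical helper name, and the output_{language}.txt naming follows the commented-out create_and_open_txt call:

from langdetect import detect

def detect_and_save(transcription):
    # detect() raises an exception on empty or whitespace-only text, so fall
    # back to "unknown" instead of crashing the Streamlit app.
    try:
        language = detect(transcription)  # ISO 639-1 code such as "en"
    except Exception:
        language = "unknown"
    filename = f"output_{language}.txt"
    with open(filename, "w", encoding="utf-8") as f:
        f.write(transcription)
    return language, filename

Inside the if audio_bytes: branch this would run right after transcribe_audio, e.g. language, filename = detect_and_save(transcription) followed by st.write(f"Detected language: {language}"), mirroring the removed comments.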