arshadrana commited on
Commit
ae43f08
·
verified ·
1 Parent(s): a562e5f

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +25 -36
app.py CHANGED
@@ -1,46 +1,35 @@
1
  import gradio as gr
2
- import speech_recognition as sr
3
- from pydub import AudioSegment
4
- from io import BytesIO
5
- import tempfile
6
 
7
- def transcribe_audio(audio_input):
8
- recognizer = sr.Recognizer()
9
-
10
- if isinstance(audio_input, tuple) and len(audio_input) == 2:
11
- audio_data_bytes = audio_input[1]
12
- else:
13
- raise ValueError("Expected audio_input to be a tuple with audio data bytes.")
14
-
15
- # Load audio as raw data
16
- try:
17
- audio_segment = AudioSegment.from_file(BytesIO(audio_data_bytes), format="mp3")
18
- except Exception as e:
19
- return f"Error loading audio file: {e}"
20
 
21
- # Save as WAV to a temporary file
22
- with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as wav_file:
23
- audio_segment.export(wav_file.name, format="wav")
24
- wav_file_path = wav_file.name
25
-
26
- # Transcribe the audio
27
- try:
28
- with sr.AudioFile(wav_file_path) as source:
29
- audio_data = recognizer.record(source)
30
- text = recognizer.recognize_google(audio_data)
31
- return text
32
- except sr.UnknownValueError:
33
- return "Google Speech Recognition could not understand audio"
34
- except sr.RequestError as e:
35
- return f"Could not request results from Google Speech Recognition service; {e}"
36
 
37
- # Gradio Interface
38
  iface = gr.Interface(
39
- fn=transcribe_audio,
40
- inputs="audio",
41
  outputs="text",
42
  title="Voice to Text Converter",
43
- description="Upload an audio file and get the transcribed text."
44
  )
45
 
46
  iface.launch()
 
1
  import gradio as gr
2
+ import requests
 
 
 
3
 
4
+ # Function to send audio to Groq API and get transcription
5
+ def transcribe(audio):
6
+ # Load audio data
7
+ audio_data = audio.read()
8
+
9
+ # Replace these placeholders with your actual Groq API endpoint and headers
10
+ groq_api_endpoint = "https://api.groq.com/transcribe" # Example endpoint
11
+ headers = {
12
+ "Authorization": "Bearer YOUR_GROQ_API_KEY",
13
+ "Content-Type": "audio/wav",
14
+ }
 
 
15
 
16
+ # Send audio to Groq API
17
+ response = requests.post(groq_api_endpoint, headers=headers, data=audio_data)
18
+
19
+ # Parse response
20
+ if response.status_code == 200:
21
+ result = response.json()
22
+ return result.get("transcription", "No transcription available.")
23
+ else:
24
+ return f"Error: {response.status_code}, {response.text}"
 
 
 
 
 
 
25
 
26
+ # Gradio interface
27
  iface = gr.Interface(
28
+ fn=transcribe,
29
+ inputs=gr.Audio(source="microphone", type="file"),
30
  outputs="text",
31
  title="Voice to Text Converter",
32
+ description="Record your voice, and it will be transcribed into text using Groq API."
33
  )
34
 
35
  iface.launch()