fcernafukuzaki committed on
Commit
a295231
·
verified ·
1 Parent(s): d9607d1

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +14 -13
app.py CHANGED
@@ -1,4 +1,5 @@
1
  import gradio as gr
 
2
  from google.cloud import speech_v1
3
  from google.protobuf import timestamp_pb2
4
 
@@ -6,23 +7,23 @@ from google.protobuf import timestamp_pb2
6
  def transcribe(stream, audio_bytes):
7
  """Transcribe audio bytes to text using Google Cloud Speech to Text."""
8
 
9
- # Crea un cliente de Speech to Text
10
- client = speech_v1.SpeechClient()
11
-
12
- # Configura la configuración de la solicitud
13
- config = speech_v1.RecognitionConfig()
14
- config.language_code = "es-ES"
15
- config.encoding = speech_v1.RecognitionConfig.Encoding.LINEAR16
16
- config.sample_rate_hertz = 16000
17
-
18
- # Crea una solicitud de reconocimiento de audio
19
- audio = speech_v1.RecognitionAudio(content=audio_bytes)
20
- request = speech_v1.RecognizeSpeechRequest(config=config, audio=audio)
21
-
22
  sr, y = audio_bytes
23
  y = y.astype(np.float32)
24
  y /= np.max(np.abs(y))
25
  if stream is not None:
 
 
 
 
 
 
 
 
 
 
 
 
 
26
  # Realiza la transcripción
27
  response = client.recognize_speech(request)
28
 
 
1
  import gradio as gr
2
+ import numpy as np
3
  from google.cloud import speech_v1
4
  from google.protobuf import timestamp_pb2
5
 
 
7
  def transcribe(stream, audio_bytes):
8
  """Transcribe audio bytes to text using Google Cloud Speech to Text."""
9
 
 
 
 
 
 
 
 
 
 
 
 
 
 
10
  sr, y = audio_bytes
11
  y = y.astype(np.float32)
12
  y /= np.max(np.abs(y))
13
  if stream is not None:
14
+ # Crea un cliente de Speech to Text
15
+ client = speech_v1.SpeechClient()
16
+
17
+ # Configura la configuración de la solicitud
18
+ config = speech_v1.RecognitionConfig()
19
+ config.language_code = "es-ES"
20
+ config.encoding = speech_v1.RecognitionConfig.Encoding.LINEAR16
21
+ config.sample_rate_hertz = 16000
22
+
23
+ # Crea una solicitud de reconocimiento de audio
24
+ audio = speech_v1.RecognitionAudio(content=audio_bytes)
25
+ request = speech_v1.RecognizeSpeechRequest(config=config, audio=audio)
26
+
27
  # Realiza la transcripción
28
  response = client.recognize_speech(request)
29