Spaces:

SamuelMiller
/

sum_it

Sleeping

File size: 1,887 Bytes

9ba153c
 
fb1bb66
 
 
9ba153c
18526df
337d2a4
 
18526df
b7ea2f1
 
 
 
3ff502d
b7ea2f1
 
b992dd8
23e1010
da27dba
68856b5
 
23e1010
1e4e32f
090d19c
195ae3a
ab046ec
b7ea2f1
fb1bb66
 
b7ea2f1
 
 
 
 
 
da27dba
ab046ec
b7ea2f1
ab046ec
 
 
 
b7ea2f1
 
68856b5
b7ea2f1
ab046ec
0a8189c
ab046ec

# >>>>>>   Adapted/frankensteined from these scripts:   <<<<<<<
#                 for Summary Interface:
# >>>> https://huggingface.co/spaces/khxu/pegasus-text-summarizers/blob/main/app.py
#                 for Audio Interface:
# >>>> https://huggingface.co/spaces/iSky/Speech-audio-to-text-with-grammar-correction/blob/main/app.py

import gradio as gr
from transformers import pipeline
from gradio.mix import Parallel, Series

# >>>>>>>>>>>>>>>>>>>> Danger Below <<<<<<<<<<<<<<<<<<<<<<
# Load Interfaces:
# Each statement runs when this module is executed and binds a callable
# interface identified by a 'huggingface/<owner>/<model>' string.
# NOTE(review): presumably each call reaches out to the Hugging Face Hub, so
# start-up needs network access -- confirm against the installed gradio version.

# s2t: called by out() on the recorded audio (presumably speech-to-text,
# judging by the model name).
s2t = gr.Interface.load('huggingface/facebook/s2t-medium-librispeech-asr')
# grammar: called by out() on the value returned by s2t (presumably a grammar
# corrector, judging by the model name).
grammar = gr.Interface.load('huggingface/prithivida/grammar_error_correcter_v1')
# sum_it: only referenced from a commented-out line inside out(), so it is
# loaded here but never called by the active code in this file.
sum_it = gr.Interface.load('huggingface/SamuelMiller/lil_sumsum')

# Audio Functions:
def out(audio):
  """Transcribe recorded speech and pair it with a grammar-corrected copy.

  Args:
    audio: Value delivered by the audio input component, or ``None`` when
      nothing was recorded. Presumably a file path, since the interface in
      this file is configured with ``type="filepath"``.

  Returns:
    A 2-tuple ``(transcript, corrected)``. The interface built on this
    function declares two text outputs, so every path returns two values.
    When ``audio`` is ``None`` the tuple is ``("no audio", "")``.
  """
  if audio is None:
    # Fill both output slots; a lone string would leave the second text
    # output without a value.
    return "no audio", ""

  transcript = s2t(audio)
  # NOTE: summarising with sum_it before the grammar pass is currently
  # disabled; only the raw transcript and its corrected form are returned.
  return transcript, grammar(transcript)

# Construct Interfaces:
# Wire `out` into a gradio UI: one optional microphone recording in (handed
# over with type="filepath"), two text outputs back.
iface = gr.Interface(
    fn=out,
    inputs=gr.inputs.Audio(
        source="microphone",
        type="filepath",
        label=None,
        optional=True,
    ),
    outputs=['text', 'text'],
    title="Speech Audio to text (with corrected grammar)",
    description="Let's Hear It!! This app transforms your speech (input) to text with corrected grammar after (output)!",
)

# Launch Interface
# Runs unconditionally when this module is executed (there is no
# `if __name__ == "__main__"` guard).
# NOTE(review): enable_queue / show_error are passed straight through to
# gradio; presumably they enable request queuing and surface exceptions in
# the UI -- confirm against the installed gradio version.
iface.launch(enable_queue=True,show_error=True)

# From the original code (kept for reference, not executed):
# gr.inputs.Audio(source="upload", type="filepath", label=None, optional=True),  
# examples=[["Grammar-Correct-Sample.mp3"], ["Grammar-Wrong-Sample.mp3"],],

#def speech_to_text(inp):
    #pass  # speech recognition model defined here

#gr.Interface(speech_to_text, inputs="mic", outputs=gr.Textbox(label="Predicted text", lines=4))