Spaces:

JothishJJ
/

AudioForEveryone

Runtime error

App Files Files Community

JothishJJ committed on Mar 9

Commit

6fffa48

verified ·

1 Parent(s): 115f47b

Update app.py

Browse files

Files changed (1) hide show

app.py +41 -22

app.py CHANGED Viewed

@@ -1,38 +1,57 @@
-import PyPDF2
-from transformers import pipeline
 import gradio as gr
 # Function to extract text from PDF
-def extract_text_from_pdf(pdf_file):
-    reader = PyPDF2.PdfReader(pdf_file)
     text = ""
     for page in reader.pages:
         if page and page.extract_text():
             text += page.extract_text()
     return text
-# Load text-to-speech pipeline from Hugging Face
-tts = pipeline("text-to-speech", model="facebook/fastspeech2-en-ljspeech")
-# Function to convert PDF to audio with no text limit
-def pdf_to_audio(pdf_file):
-    text = extract_text_from_pdf(pdf_file)
-    if not text.strip():
-        return "", "No text found in PDF"
-    audio = tts(text)
-    audio_path = "output_audio.wav"
-    with open(audio_path, "wb") as f:
-        f.write(audio["audio"])  # Hugging Face TTS returns audio data
-    return audio_path, "Audio generated successfully"
 # Gradio interface
-interface = gr.Interface(
-    fn=pdf_to_audio,
-    inputs=gr.File(type="file"),
-    outputs=[gr.Audio(type="filepath"), gr.Text()]
 )
-if __name__ == "__main__":
-    interface.launch()

 import gradio as gr
+from transformers import pipeline
+from PyPDF2 import PdfReader
+from ebooklib import epub
+from bs4 import BeautifulSoup
+# Load a VITS text-to-speech model from Hugging Face.
+# NOTE: the checkpoint used before, "efficient-speech/lite-whisper-large-v3-turbo",
+# is a Whisper speech-recognition (audio -> text) model and cannot serve the
+# "text-to-speech" task. "facebook/mms-tts-eng" is a VITS English TTS checkpoint.
+text_to_speech = pipeline("text-to-speech", model="facebook/mms-tts-eng")
 # Function to extract text from PDF
+def extract_pdf_text(file):
+    """Return the text of every page of the PDF in ``file``, concatenated in page order.
+
+    ``file`` is handed unchanged to ``PdfReader``. Pages whose
+    ``extract_text()`` result is empty are skipped; no separator is inserted
+    between pages.
+    """
+    reader = PdfReader(file)
     text = ""
     for page in reader.pages:
+        # extract_text() is evaluated twice for each kept page: once for the
+        # emptiness check and once to append the result.
         if page and page.extract_text():
             text += page.extract_text()
     return text
+# Function to extract text from EPUB
+def extract_epub_text(file):
+    """Return the concatenated plain text of every document item in an EPUB.
+
+    Args:
+        file: Path to the EPUB, or an object exposing that path as ``.name``
+            (for example a temp-file wrapper for an upload).
+
+    Returns:
+        The text of all document items, with markup stripped by
+        BeautifulSoup and no separator between items.
+    """
+    # The ITEM_* constants are defined on the top-level ``ebooklib`` package,
+    # not on ``ebooklib.epub``; ``epub.ITEM_DOCUMENT`` raises AttributeError.
+    import ebooklib
+
+    # read_epub needs a filesystem path, so unwrap file-like uploads.
+    book = epub.read_epub(getattr(file, "name", file))
+    return "".join(
+        BeautifulSoup(item.content, 'html.parser').get_text()
+        for item in book.get_items_of_type(ebooklib.ITEM_DOCUMENT)
+    )
+# Unified function to convert text to speech
+def convert_to_audio(file, file_type):
+    """Extract text from an uploaded file and synthesize it to speech.
+
+    Args:
+        file: The upload, either a filesystem path or a file-like object.
+        file_type: 'PDF' or 'EPUB'; any other value is read as UTF-8 text.
+
+    Returns:
+        A ``(sampling_rate, waveform)`` tuple, the in-memory form a Gradio
+        audio output accepts.
+
+    Raises:
+        gr.Error: If nothing was uploaded or no text could be extracted.
+    """
+    if file is None:
+        raise gr.Error("No file uploaded.")
+    if file_type == 'PDF':
+        text = extract_pdf_text(file)
+    elif file_type == 'EPUB':
+        text = extract_epub_text(file)
+    elif hasattr(file, "read"):
+        raw = file.read()
+        text = raw.decode('utf-8') if isinstance(raw, bytes) else raw
+    else:
+        # Gradio may hand the upload over as a plain path string.
+        with open(file, encoding='utf-8') as handle:
+            text = handle.read()
+    if not text.strip():
+        # A bare string returned to an audio output is treated as a file
+        # path, so report the problem through Gradio's error mechanism.
+        raise gr.Error("No text found in the file.")
+    # Convert text to speech
+    audio = text_to_speech(text[:5000])  # Limiting input to avoid model constraints
+    # The pipeline result carries the waveform and its sampling rate; Gradio
+    # needs both. squeeze() drops a leading batch axis if the model emits one
+    # (assumes the waveform is a NumPy array -- TODO confirm for other models).
+    return audio["sampling_rate"], audio["audio"].squeeze()
 # Gradio interface
+# Wires convert_to_audio to two inputs (a file upload and a file-type radio
+# selector) and a single audio output.
+# NOTE(review): the title and description promise "Unlimited" / "no limits",
+# but convert_to_audio only synthesizes the first 5000 characters of the text.
+demo = gr.Interface(
+    fn=convert_to_audio,
+    inputs=[
+        gr.File(label="Upload PDF, EPUB, or Text File"),
+        gr.Radio(["PDF", "EPUB", "TXT"], label="File Type")
+    ],
+    outputs="audio",
+    title="Unlimited Text-to-Speech Converter",
+    description="Upload PDF, EPUB, or text files — convert them into audio with no limits!"
 )
+# Launches at import time; there is no ``if __name__ == "__main__"`` guard.
+demo.launch()