varl42 committed on
Commit
4563676
·
1 Parent(s): cc6af15

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +17 -5
app.py CHANGED
@@ -7,6 +7,8 @@ import scipy
7
  from gtts import gTTS
8
  from io import BytesIO
9
  from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
 
 
10
 
11
  def extract_text(pdf_file):
12
  pdfReader = PyPDF2.PdfReader(pdf_file)
@@ -53,11 +55,21 @@ def summarize_text(text):
53
  return summary
54
 
55
  def text_to_audio(text):
56
- tts = gTTS(text, lang='en')
57
- buffer = BytesIO()
58
- tts.write_to_fp(buffer)
59
- buffer.seek(0)
60
- return buffer.read()
 
 
 
 
 
 
 
 
 
 
61
 
62
  def audio_pdf(pdf_file):
63
  text = extract_text(pdf_file)
 
7
  from gtts import gTTS
8
  from io import BytesIO
9
  from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
10
+ from transformers import VitsTokenizer, VitsModel
11
+
12
 
13
  def extract_text(pdf_file):
14
  pdfReader = PyPDF2.PdfReader(pdf_file)
 
55
  return summary
56
 
57
  def text_to_audio(text):
58
+ #tts = gTTS(text, lang='en')
59
+ #buffer = BytesIO()
60
+ #tts.write_to_fp(buffer)
61
+ #buffer.seek(0)
62
+ #return buffer.read()
63
+
64
+ tokenizer = VitsTokenizer.from_pretrained("facebook/mms-tts-eng")
65
+ model = VitsModel.from_pretrained("facebook/mms-tts-eng")
66
+
67
+ inputs = tokenizer([text], return_tensors="pt")
68
+
69
+ with torch.no_grad():
70
+ outputs = model(**inputs)
71
+
72
+ return outputs.waveform[0]
73
 
74
  def audio_pdf(pdf_file):
75
  text = extract_text(pdf_file)