Spaces:

Niansuh
/

elve

Running

App Files Files Community

Niansuh committed on Mar 9

Commit

8662041

verified ·

1 Parent(s): c27ae83

Update app.py

Browse files

Files changed (1) hide show

app.py +36 -16

app.py CHANGED Viewed

@@ -21,7 +21,6 @@ class SentenceTokenizer:
     def tokenize(self, text: str) -> List[str]:
         if not text or not text.strip():
             return []
-        # Simple sentence splitting
         sentences = self.SENTENCE_END.split(text.strip())
         return [s.strip() for s in sentences if s.strip()]
@@ -35,21 +34,26 @@ class ElevenlabsTTS:
     def __init__(self):
         self.session = requests.Session()
         self.session.headers.update({"User-Agent": "Mozilla/5.0"})
-        # Use temporary directory instead of fixed cache_dir
         self.cache_dir = Path(tempfile.gettempdir())
         self.all_voices = {
-            "Brian": "nPczCjzI2devNBz1zQrb",
-            "Alice": "Xb7hH8MSUJpSbSDYk0k2",
-            "Neal": "Zp1aWhL05Pi5BkhizFC3",
-            # Add other voices as needed
         }
         self.params = {'allow_unauthenticated': '1'}
     def tts(self, text: str, voice: str = "Brian") -> str:
         if voice not in self.all_voices:
             raise ValueError(f"Voice '{voice}' not available")
-        filename = self.cache_dir / f"tts_{int(time.time())}.mp3"
         sentences = split_sentences(text)
         audio_chunks = {}
@@ -64,7 +68,6 @@ class ElevenlabsTTS:
             response.raise_for_status()
             audio_chunks[i] = response.content
-        # No need to create directory as tempfile.gettempdir() already exists
         combined_audio = BytesIO()
         for i in sorted(audio_chunks.keys()):
             combined_audio.write(audio_chunks[i])
@@ -73,20 +76,37 @@ class ElevenlabsTTS:
             f.write(combined_audio.getvalue())
         return filename.as_posix()
 # Web Interface
 tts_provider = ElevenlabsTTS()
 @app.route('/', methods=['GET', 'POST'])
 def index():
     if request.method == 'POST':
-        text = request.form.get('text')
-        voice = request.form.get('voice', 'Brian')
-        try:
-            audio_file = tts_provider.tts(text, voice)
-            return send_file(audio_file, mimetype='audio/mpeg', as_attachment=True)
-        except Exception as e:
-            return render_template('index.html', error=str(e), voices=tts_provider.all_voices.keys())
-    return render_template('index.html', voices=tts_provider.all_voices.keys())
 if __name__ == "__main__":
     app.run(host='0.0.0.0', port=5000)

     # Split text into trimmed, non-empty pieces using self.SENTENCE_END
     # (defined outside this view; presumably a compiled sentence-boundary regex).
     def tokenize(self, text: str) -> List[str]:
         # None, empty, or whitespace-only input yields no sentences.
         if not text or not text.strip():
             return []
         sentences = self.SENTENCE_END.split(text.strip())
         # Drop fragments that are empty once surrounding whitespace is removed.
         return [s.strip() for s in sentences if s.strip()]
     # Set up the HTTP session, output directory, voice table and request defaults.
     def __init__(self):
         self.session = requests.Session()
         # Send a browser-like User-Agent on every request made through the session.
         self.session.headers.update({"User-Agent": "Mozilla/5.0"})
         # Output files are placed in the system temporary directory.
         self.cache_dir = Path(tempfile.gettempdir())
         # Voice display name -> identifier string
         # (presumably ElevenLabs voice IDs -- TODO confirm).
         self.all_voices = {
+            "Brian": "nPczCjzI2devNBz1zQrb", "Alice": "Xb7hH8MSUJpSbSDYk0k2",
+            "Bill": "pqHfZKP75CvOlQylNhV4", "Callum": "N2lVS1w4EtoT3dr4eOWO",
+            "Charlie": "IKne3meq5aSn9XLyUdCD", "Charlotte": "XB0fDUnXU5powFXDhCwa",
+            "Chris": "iP95p4xoKVk53GoZ742B", "Daniel": "onwK4e9ZLuTAKqWW03F9",
+            "Eric": "cjVigY5qzO86Huf0OWal", "George": "JBFqnCBsd6RMkjVDRZzb",
+            "Jessica": "cgSgspJ2msm6clMCkdW9", "Laura": "FGY2WhTYpPnrIDTdsKH5",
+            "Liam": "TX3LPaxmHKxFdv7VOQHJ", "Lily": "pFZP5JQG7iQjIQuC4Bku",
+            "Matilda": "XrExE9yKIg1WjnnlVkGX", "Sarah": "EXAVITQu4vr4xnSDxMaL",
+            "Will": "bIHbv24MWmeRgasZH58o", "Neal": "Zp1aWhL05Pi5BkhizFC3"
         }
         # NOTE(review): presumably sent as query parameters with each TTS request;
         # the request code is not visible in this view -- confirm.
         self.params = {'allow_unauthenticated': '1'}
         # Sample sentence that generate_preview() passes to tts().
+        self.preview_text = "Hello, this is a sample of my voice."
     def tts(self, text: str, voice: str = "Brian") -> str:
         if voice not in self.all_voices:
             raise ValueError(f"Voice '{voice}' not available")
+        filename = self.cache_dir / f"tts_{voice}_{int(time.time())}.mp3"
         sentences = split_sentences(text)
         audio_chunks = {}
             response.raise_for_status()
             audio_chunks[i] = response.content
         combined_audio = BytesIO()
         for i in sorted(audio_chunks.keys()):
             combined_audio.write(audio_chunks[i])
             f.write(combined_audio.getvalue())
         return filename.as_posix()
+    def generate_preview(self, voice: str) -> str:
+        preview_file = self.cache_dir / f"preview_{voice}.mp3"
+        if not preview_file.exists():
+            return self.tts(self.preview_text, voice)
+        return preview_file.as_posix()
 # Web Interface
 tts_provider = ElevenlabsTTS()
 # Main page: a POST carrying 'generate' returns synthesized audio as a download;
 # every other request renders the form together with a preview path per voice.
 @app.route('/', methods=['GET', 'POST'])
 def index():
     if request.method == 'POST':
+        if 'generate' in request.form:
+            text = request.form.get('text')
+            voice = request.form.get('voice', 'Brian')
+            try:
+                audio_file = tts_provider.tts(text, voice)
+                return send_file(audio_file, mimetype='audio/mpeg', as_attachment=True, download_name=f"{voice}_output.mp3")
+            except Exception as e:
                 # Any failure is shown on the form instead of propagating.
                 # NOTE(review): this render passes no `previews`, unlike the final render below.
+                return render_template('index.html', error=str(e), voices=tts_provider.all_voices.keys())
+    # Runs on every request that reaches this point (not only at startup): one generate_preview() call per voice.
+    previews = {voice: tts_provider.generate_preview(voice) for voice in tts_provider.all_voices.keys()}
+    return render_template('index.html', voices=tts_provider.all_voices.keys(), previews=previews)
# Serve the preview clip for one voice as audio/mpeg; any failure becomes a 500.
+@app.route('/preview/<voice>')
+def preview(voice):
+    try:
+        audio_file = tts_provider.generate_preview(voice)
+        return send_file(audio_file, mimetype='audio/mpeg')
+    except Exception as e:
         # The exception text is returned to the client verbatim as the response body.
+        return str(e), 500
 # Script entry point: start the app's built-in server on all interfaces (0.0.0.0), port 5000.
 if __name__ == "__main__":
     app.run(host='0.0.0.0', port=5000)