Spaces:

Yogya12
/

SpeakEasyAI

Running

App Files Files Community

Yogya12 committed on Jun 9

Commit

8d29d40

1 Parent(s): f647470

updated ui

Browse files

Files changed (1) hide show

app.py +50 -48

app.py CHANGED Viewed

@@ -8,7 +8,7 @@ from deep_translator import GoogleTranslator
 from transformers import BlenderbotTokenizer, BlenderbotForConditionalGeneration
 import torch
-# ===== TTS PART =====
 voice_characters = {
     "English - US": {
@@ -17,7 +17,8 @@ voice_characters = {
         "Guy": "en-US-GuyNeural",
     },
     "Hindi": {
-        "Swara": "hi-IN-SwaraNeural"  # Only one voice will be used for Hindi
     }
 }
@@ -33,37 +34,29 @@ def tts_wrapper(text, language, character, translation_direction):
     try:
         original_text = text.strip()
         if not original_text:
-            return "Input text is empty", None
         if translation_direction == "English to Hindi":
             text = GoogleTranslator(source='en', target='hi').translate(original_text)
         elif translation_direction == "Hindi to English":
             text = GoogleTranslator(source='hi', target='en').translate(original_text)
-        # Hindi uses fixed voice "Swara"
-        if language == "Hindi":
-            voice = voice_characters["Hindi"]["Swara"]
-        else:
-            voice = voice_characters.get(language, {}).get(character)
         if not voice:
-            return f"No voice found for selected language and character", None
         filename = asyncio.run(generate_tts(text, voice))
         return text, filename
     except Exception as e:
-        return f"Error: {str(e)}", None
 def get_characters(language):
-    if language == "Hindi":
-        return gr.update(choices=[], value=None, visible=False)
-    else:
-        chars = list(voice_characters.get(language, {}).keys())
-        default_char = chars[0] if chars else None
-        return gr.update(choices=chars, value=default_char, visible=True)
-# ===== CHATBOT PART USING BLENDERBOT =====
 model_name = "facebook/blenderbot-400M-distill"
 tokenizer = BlenderbotTokenizer.from_pretrained(model_name)
@@ -80,60 +73,69 @@ def chatbot_response(history, user_message):
     if history is None:
         history = []
-    history.append(("User", user_message))
     conversation_text = " ".join([msg for _, msg in history]) + " " + user_message
     inputs = tokenizer([conversation_text], return_tensors="pt").to(device)
     reply_ids = model.generate(**inputs, max_length=200)
     response = tokenizer.decode(reply_ids[0], skip_special_tokens=True)
-    history.append(("Bot", response))
-    chat_str = ""
-    for speaker, msg in history:
-        chat_str += f"{speaker}: {msg}\n"
     try:
         audio_path = asyncio.run(generate_bot_tts(response))
     except Exception as e:
         audio_path = None
-        print(f"TTS generation failed: {e}")
     return history, chat_str, audio_path
-# ===== GRADIO UI =====
 def create_app():
-    with gr.Blocks() as app:
-        gr.Markdown("## 🎙️ Multi-Voice AI TTS with Translation + 🤖 BlenderBot Chatbot")
-        with gr.Tab("TTS"):
-            text_input = gr.Textbox(label="Enter Text", placeholder="Type something...", lines=4)
-            language_dropdown = gr.Dropdown(choices=list(voice_characters.keys()), value="English - US", label="Language")
-            character_dropdown = gr.Dropdown(choices=list(voice_characters["English - US"].keys()), value="Aria", label="Voice Character", visible=True)
-            translation_dropdown = gr.Dropdown(choices=["None", "English to Hindi", "Hindi to English"], value="None", label="Translation Direction")
-            tts_button = gr.Button("🔊 Generate Voice")
-            output_text = gr.Textbox(label="Translated Text or Error")
-            output_audio = gr.Audio(label="Generated Voice")
             language_dropdown.change(fn=get_characters, inputs=language_dropdown, outputs=character_dropdown)
             tts_button.click(fn=tts_wrapper,
                              inputs=[text_input, language_dropdown, character_dropdown, translation_dropdown],
                              outputs=[output_text, output_audio])
-        with gr.Tab("Chatbot"):
-            chat_history = gr.State([])
-            user_input = gr.Textbox(label="Enter your message", lines=2, placeholder="Say something...")
-            chat_display = gr.Textbox(label="Chat History", interactive=False, lines=15)
-            audio_output = gr.Audio(label="Bot Voice Reply")
-            send_button = gr.Button("Send")
-            def respond(user_message, history):
-                return chatbot_response(history, user_message)
-            send_button.click(fn=respond, inputs=[user_input, chat_history], outputs=[chat_history, chat_display, audio_output])
-            user_input.submit(fn=respond, inputs=[user_input, chat_history], outputs=[chat_history, chat_display, audio_output])
     return app

 from transformers import BlenderbotTokenizer, BlenderbotForConditionalGeneration
 import torch
+# ===== TTS Setup =====
 voice_characters = {
     "English - US": {
         "Guy": "en-US-GuyNeural",
     },
     "Hindi": {
+        "Swara": "hi-IN-SwaraNeural",
+        "Madhur": "hi-IN-MadhurNeural"
     }
 }
     try:
         original_text = text.strip()
         if not original_text:
+            return "⚠️ Please enter some text.", None
         if translation_direction == "English to Hindi":
             text = GoogleTranslator(source='en', target='hi').translate(original_text)
         elif translation_direction == "Hindi to English":
             text = GoogleTranslator(source='hi', target='en').translate(original_text)
+        voice = voice_characters.get(language, {}).get(character)
         if not voice:
+            return f"⚠️ Voice '{character}' not available for '{language}'.", None
         filename = asyncio.run(generate_tts(text, voice))
         return text, filename
     except Exception as e:
+        return f"❌ Error: {str(e)}", None
 def get_characters(language):
+    chars = list(voice_characters.get(language, {}).keys())
+    default_char = chars[0] if chars else None
+    return gr.update(choices=chars, value=default_char)
+# ===== Chatbot Setup =====
 model_name = "facebook/blenderbot-400M-distill"
 tokenizer = BlenderbotTokenizer.from_pretrained(model_name)
     if history is None:
         history = []
+    history.append(("🧑", user_message))
     conversation_text = " ".join([msg for _, msg in history]) + " " + user_message
     inputs = tokenizer([conversation_text], return_tensors="pt").to(device)
     reply_ids = model.generate(**inputs, max_length=200)
     response = tokenizer.decode(reply_ids[0], skip_special_tokens=True)
+    history.append(("🤖", response))
+    chat_str = "\n".join([f"{speaker}: {msg}" for speaker, msg in history])
     try:
         audio_path = asyncio.run(generate_bot_tts(response))
     except Exception as e:
         audio_path = None
+        print(f"TTS failed: {e}")
     return history, chat_str, audio_path
+# ===== UI =====
 def create_app():
+    with gr.Blocks(css="footer {text-align: center; padding: 10px;}") as app:
+        gr.Markdown("""
+        # 🗣️ SpeakEasy AI
+        A simple and fun **Text-to-Speech + Translator + Chatbot** app!
+        """)
+        with gr.Tab("🎧 Text to Speech + Translator"):
+            with gr.Row():
+                with gr.Column(scale=2):
+                    text_input = gr.Textbox(label="💬 Your Text", placeholder="Enter text here...", lines=4)
+                    language_dropdown = gr.Dropdown(choices=list(voice_characters.keys()), value="English - US", label="🌐 Language")
+                    character_dropdown = gr.Dropdown(choices=list(voice_characters["English - US"].keys()), value="Aria", label="🧑‍🎤 Voice Character")
+                    with gr.Accordion("🔁 Translation Options", open=False):
+                        translation_dropdown = gr.Dropdown(choices=["None", "English to Hindi", "Hindi to English"],
+                                                           value="None", label="🔄 Translate Text")
+                    tts_button = gr.Button("🎙️ Generate Voice")
+                    output_text = gr.Textbox(label="📝 Final Output / Translation")
+                with gr.Column(scale=1):
+                    output_audio = gr.Audio(label="🔊 Listen Here", autoplay=True)
             language_dropdown.change(fn=get_characters, inputs=language_dropdown, outputs=character_dropdown)
             tts_button.click(fn=tts_wrapper,
                              inputs=[text_input, language_dropdown, character_dropdown, translation_dropdown],
                              outputs=[output_text, output_audio])
+        with gr.Tab("🤖 Chatbot"):
+            with gr.Row():
+                with gr.Column(scale=2):
+                    user_input = gr.Textbox(label="💬 Ask Anything", lines=2, placeholder="Try: What's your name?")
+                    chat_display = gr.Textbox(label="📜 Conversation", interactive=False, lines=15)
+                    send_button = gr.Button("📩 Send")
+                with gr.Column(scale=1):
+                    audio_output = gr.Audio(label="🔊 Bot's Voice Reply", autoplay=True)
+            chat_history = gr.State([])
+            send_button.click(fn=chatbot_response, inputs=[chat_history, user_input],
+                              outputs=[chat_history, chat_display, audio_output])
+            user_input.submit(fn=chatbot_response, inputs=[chat_history, user_input],
+                              outputs=[chat_history, chat_display, audio_output])
+        gr.HTML("<footer>🔧 Made by using Gradio, Edge TTS, and Hugging Face 🤗</footer>")
     return app