PeterPinetree commited on
Commit
f989e9b
Β·
verified Β·
1 Parent(s): ce209de

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +205 -117
app.py CHANGED
@@ -1,121 +1,209 @@
1
  import streamlit as st
2
- import requests
3
- import os
4
- os.environ["SDL_AUDIODRIVER"] = "alsa"
5
- os.environ["PULSE_SERVER"] = "127.0.0.1" # Ensures it looks for a PulseAudio server
6
- os.environ["PA_ALSA_PLUGHW"] = "1" # Ensures ALSA hardware compatibility
7
- import sounddevice as sd
8
- import base64
9
- import tempfile
10
- import io
11
  import numpy as np
12
- import librosa
13
- from scipy.io.wavfile import write
14
- from PIL import Image
15
-
16
- # Hugging Face API Keys
17
- HF_API_KEY = os.getenv("HF_API_KEY")
18
- HEADERS = {"Authorization": f"Bearer {HF_API_KEY}"}
19
-
20
- # Hugging Face API Endpoints
21
- HF_SPEECH_TO_TEXT_API = "https://api-inference.huggingface.co/models/openai/whisper-small"
22
- HF_CHATBOT_API = "https://api-inference.huggingface.co/models/mistralai/Mistral-7B-Instruct"
23
- HF_TEXT_TO_SPEECH_API = "https://api-inference.huggingface.co/models/facebook/mms-tts-eng"
24
-
25
- # Avatars and their personalities
26
- avatars = {
27
- "rat": {"desc": "Clever and resourceful. Loves puzzles and word games.", "voice": "Hello! Let's solve some fun puzzles together!"},
28
- "ox": {"desc": "Steady and dependable. Encourages patience in learning.", "voice": "Consistency is key! Let's learn step by step."},
29
- "tiger": {"desc": "Bold and adventurous. Loves dynamic conversations.", "voice": "Let's jump into an exciting conversation!"},
30
- "rabbit": {"desc": "Gentle and kind. A patient and encouraging teacher.", "voice": "Take your time. Learning should be fun!"},
31
- "dragon": {"desc": "Wise and powerful. Inspires confidence in learning.", "voice": "Believe in yourself! You can do this!"},
32
- "snake": {"desc": "Calm and analytical. Gives insightful explanations.", "voice": "Let's explore the beauty of language together."},
33
- "horse": {"desc": "Energetic and friendly. Encourages active learning.", "voice": "Let's have fun while we learn!"},
34
- "goat": {"desc": "Gentle and artistic. Uses creativity to teach.", "voice": "Imagine and express yourself freely!"},
35
- "monkey": {"desc": "Playful and clever. Loves challenges and fun exercises.", "voice": "I love games! Let's play with words!"},
36
- "rooster": {"desc": "Confident and expressive. Loves discussions.", "voice": "Speak up! Let's share ideas together."},
37
- "dog": {"desc": "Loyal and friendly. Encourages persistence.", "voice": "I'll always be here to help you practice!"},
38
- "pig": {"desc": "Warm and cheerful. Creates a positive learning atmosphere.", "voice": "Learning is fun! Let's enjoy this together!"},
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
39
  }
40
 
41
- # Function to process speech-to-text
42
- def speech_to_text(audio_bytes):
43
- files = {"file": ("audio.wav", audio_bytes, "audio/wav")}
44
- response = requests.post(HF_SPEECH_TO_TEXT_API, headers=HEADERS, files=files)
45
- text = response.json().get("text", "Sorry, could not transcribe audio.")
46
- return text
47
-
48
- # Function to get chatbot response
49
- def chatbot_response(user_input):
50
- payload = {"inputs": f"You are a friendly AI coach for English learners. Help them practice speaking naturally with supportive feedback.\nUser: {user_input}\nAI:"}
51
- response = requests.post(HF_CHATBOT_API, headers=HEADERS, json=payload)
52
- ai_reply = response.json().get("generated_text", "I'm here to help! Keep practicing.")
53
- return ai_reply
54
-
55
- # Function for text-to-speech
56
- def text_to_speech(text):
57
- payload = {"inputs": text}
58
- response = requests.post(HF_TEXT_TO_SPEECH_API, headers=HEADERS, json=payload)
59
- return response.content
60
-
61
- # Function to record audio using sounddevice
62
- def record_audio(duration=5, samplerate=16000):
63
- st.write("πŸŽ™οΈ Recording... Speak now!")
64
- audio_data = sd.rec(int(duration * samplerate), samplerate=samplerate, channels=1, dtype="float32")
65
- sd.wait()
66
- st.write("βœ… Recording finished!")
67
-
68
- # Convert to WAV format
69
- audio_data = (audio_data * 32767).astype(np.int16) # Convert to 16-bit PCM
70
-
71
- with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmpfile:
72
- write(tmpfile.name, samplerate, audio_data)
73
- tmpfile.seek(0)
74
- return tmpfile.read()
75
-
76
- # Streamlit UI
77
- st.title("πŸŽ™οΈ AI Speaking Pal")
78
- st.write("Press the button and chat with your pal!")
79
-
80
- # Start/Stop Conversation Button
81
- if "conversation_active" not in st.session_state:
82
- st.session_state.conversation_active = False
83
-
84
- def toggle_conversation():
85
- st.session_state.conversation_active = not st.session_state.conversation_active
86
-
87
- st.button("🎀 Start/Stop Conversation", on_click=toggle_conversation)
88
-
89
- # Conversation Text Box
90
- show_text = st.checkbox("Show conversation text")
91
- if show_text:
92
- conversation_box = st.text_area("Conversation:", height=200)
93
-
94
- # Handle microphone input
95
- if st.session_state.conversation_active:
96
- audio_bytes = record_audio(duration=5) # Record for 5 seconds
97
- user_text = speech_to_text(audio_bytes)
98
- st.write(f"**You:** {user_text}")
99
-
100
- ai_reply = chatbot_response(user_text)
101
- st.write(f"**AI:** {ai_reply}")
102
-
103
- speech_audio = text_to_speech(ai_reply)
104
- st.audio(io.BytesIO(speech_audio), format="audio/wav")
105
-
106
- # Swiper Carousel Component
107
- avatar_list = list(avatars.keys())
108
- selected_index = st.slider("Pick your pal:", 0, len(avatar_list) - 1, 0)
109
- selected_avatar = avatar_list[selected_index]
110
- avatar_info = avatars[selected_avatar]
111
-
112
- # Display Avatar Image
113
- avatar_img = Image.open(f"images/{selected_avatar}.png")
114
- st.image(avatar_img, caption=f"{selected_avatar.capitalize()} - {avatar_info['desc']}", use_column_width=True)
115
-
116
- # Play avatar's sample voice
117
- if st.button("Hear Sample"):
118
- audio_bytes = text_to_speech(avatar_info["voice"])
119
- st.audio(io.BytesIO(audio_bytes), format="audio/wav")
120
-
121
- st.write("Have fun learning English with your AI pal!")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  import streamlit as st
2
+ import torch
 
 
 
 
 
 
 
 
3
  import numpy as np
4
+ import re
5
+ from transformers import (
6
+ AutoModelForCausalLM,
7
+ AutoTokenizer,
8
+ AutoModelForSpeechSeq2Seq,
9
+ AutoProcessor
10
+ )
11
+ import speech_recognition as sr
12
+ import streamlit.components.v1 as components
13
+
14
+ # Avatar Personas (same as previous implementation)
15
+ AVATAR_PERSONAS = {
16
+ "Rat": {
17
+ "image": "rat.png",
18
+ "name": "Puzzle Master Rat",
19
+ "description": """
20
+ 🧩 Clever and curious, I turn language learning into an exciting puzzle!
21
+ I love breaking down complex ideas into fun, logical challenges.
22
+ My teaching style is all about critical thinking and playful problem-solving.
23
+ """,
24
+ "teaching_style": "Analytical and game-based learning",
25
+ "sample_phrase": "Let's solve this English mystery together!",
26
+ "voice_sample": "I love solving word puzzles and learning new things!"
27
+ },
28
+ "Ox": {
29
+ "image": "ox.png",
30
+ "name": "Professor Ox",
31
+ "description": """
32
+ πŸ“š Patient and methodical, I guide you through English step by step.
33
+ I break down grammar and vocabulary into clear, manageable segments.
34
+ Learning is a journey, and I'll be your steady companion.
35
+ """,
36
+ "teaching_style": "Structured and systematic approach",
37
+ "sample_phrase": "Let's learn English systematically!",
38
+ "voice_sample": "English learning is about understanding each concept carefully."
39
+ },
40
+ "Tiger": {
41
+ "image": "tiger.png",
42
+ "name": "Adventure Coach Tiger",
43
+ "description": """
44
+ πŸ† Energetic and brave, I make English learning an exciting adventure!
45
+ I turn every lesson into a challenge, motivating you to push your limits
46
+ and discover the joy of language learning.
47
+ """,
48
+ "teaching_style": "High-energy and challenge-driven",
49
+ "sample_phrase": "Are you ready to level up your English?",
50
+ "voice_sample": "Let's make learning English an exciting journey!"
51
+ }
52
  }
53
 
54
+ class AdvancedLanguageLearningAssistant:
55
+ def __init__(self, avatar_name):
56
+ # Existing implementation from previous version
57
+ self.avatar = AVATAR_PERSONAS[avatar_name]
58
+
59
+ # Simplified model loading for Hugging Face Spaces
60
+ try:
61
+ self.llm_model = AutoModelForCausalLM.from_pretrained("microsoft/DialoGPT-small")
62
+ self.llm_tokenizer = AutoTokenizer.from_pretrained("microsoft/DialoGPT-small")
63
+ except Exception as e:
64
+ st.error(f"Model loading error: {e}")
65
+ self.llm_model = None
66
+ self.llm_tokenizer = None
67
+
68
+ def generate_response(self, user_input):
69
+ if not self.llm_model:
70
+ return "Sorry, I'm having trouble generating a response."
71
+
72
+ # Incorporate avatar's unique personality
73
+ prompt = f"""
74
+ Avatar: {self.avatar['name']}
75
+ Teaching Style: {self.avatar['teaching_style']}
76
+ User Input: {user_input}
77
+
78
+ Generate a response that:
79
+ 1. Reflects the avatar's unique personality
80
+ 2. Provides encouraging language learning support
81
+ 3. Maintains an engaging tone
82
+ """
83
+
84
+ try:
85
+ inputs = self.llm_tokenizer.encode(prompt, return_tensors='pt')
86
+ outputs = self.llm_model.generate(
87
+ inputs,
88
+ max_length=150,
89
+ temperature=0.7
90
+ )
91
+
92
+ response = self.llm_tokenizer.decode(outputs[0], skip_special_tokens=True)
93
+ return response
94
+ except Exception as e:
95
+ return f"Sorry, I'm having trouble generating a response. Error: {e}"
96
+
97
+ def avatar_selection_page():
98
+ """
99
+ First stage: Avatar Selection
100
+ """
101
+ st.title("Choose Your Learning Companion")
102
+
103
+ # Custom CSS for avatar selection
104
+ st.markdown("""
105
+ <style>
106
+ .avatar-grid {
107
+ display: grid;
108
+ grid-template-columns: repeat(3, 1fr);
109
+ gap: 20px;
110
+ padding: 20px;
111
+ }
112
+ .avatar-card {
113
+ border: 2px solid #f0f0f0;
114
+ border-radius: 10px;
115
+ padding: 15px;
116
+ text-align: center;
117
+ transition: all 0.3s ease;
118
+ }
119
+ .avatar-card:hover {
120
+ transform: scale(1.05);
121
+ border-color: #4CAF50;
122
+ }
123
+ .avatar-image {
124
+ width: 200px;
125
+ height: 200px;
126
+ object-fit: cover;
127
+ border-radius: 50%;
128
+ }
129
+ </style>
130
+ """, unsafe_allow_html=True)
131
+
132
+ # Avatar Selection Grid
133
+ st.markdown('<div class="avatar-grid">', unsafe_allow_html=True)
134
+
135
+ for avatar_key, avatar_info in AVATAR_PERSONAS.items():
136
+ st.markdown(f'''
137
+ <div class="avatar-card">
138
+ <img src="images/{avatar_info['image']}" class="avatar-image" alt="{avatar_info['name']}">
139
+ <h3>{avatar_info['name']}</h3>
140
+ <p>{avatar_info['description']}</p>
141
+ <button onclick="selectAvatar('{avatar_key}')">Select {avatar_info['name']}</button>
142
+ </div>
143
+ ''', unsafe_allow_html=True)
144
+
145
+ st.markdown('</div>', unsafe_allow_html=True)
146
+
147
+ # JavaScript to handle avatar selection
148
+ st.markdown("""
149
+ <script>
150
+ function selectAvatar(avatarKey) {
151
+ window.parent.postMessage({type: 'avatarSelected', avatarKey: avatarKey}, '*');
152
+ }
153
+ </script>
154
+ """, unsafe_allow_html=True)
155
+
156
+ def conversation_page(selected_avatar):
157
+ """
158
+ Second stage: Conversation Interface
159
+ """
160
+ st.title(f"Learning English with {AVATAR_PERSONAS[selected_avatar]['name']}")
161
+
162
+ # Initialize Assistant
163
+ assistant = AdvancedLanguageLearningAssistant(selected_avatar)
164
+
165
+ # Conversation Interface
166
+ user_input = st.text_input("Type your message in English:")
167
+
168
+ if st.button("Send"):
169
+ if user_input:
170
+ response = assistant.generate_response(user_input)
171
+ st.write(f"πŸ€– {response}")
172
+
173
+ def main():
174
+ # Initialize session state for tracking app stage
175
+ if 'stage' not in st.session_state:
176
+ st.session_state.stage = 'avatar_selection'
177
+ if 'selected_avatar' not in st.session_state:
178
+ st.session_state.selected_avatar = None
179
+
180
+ # Handle avatar selection
181
+ components.html("""
182
+ <script>
183
+ window.addEventListener('message', function(event) {
184
+ if (event.data.type === 'avatarSelected') {
185
+ window.parent.postMessage({
186
+ type: 'streamlit:setComponentValue',
187
+ key: 'selected_avatar',
188
+ value: event.data.avatarKey
189
+ }, '*');
190
+ }
191
+ });
192
+ </script>
193
+ """, height=0)
194
+
195
+ # Retrieve selected avatar
196
+ selected_avatar = st.experimental_get_query_params().get('selected_avatar', [None])[0]
197
+
198
+ if selected_avatar:
199
+ st.session_state.selected_avatar = selected_avatar
200
+ st.session_state.stage = 'conversation'
201
+
202
+ # Render appropriate page based on stage
203
+ if st.session_state.stage == 'avatar_selection':
204
+ avatar_selection_page()
205
+ elif st.session_state.stage == 'conversation':
206
+ conversation_page(st.session_state.selected_avatar)
207
+
208
+ if __name__ == "__main__":
209
+ main()