Update app.py
app.py CHANGED
@@ -55,9 +55,8 @@ st.set_page_config(
 
 
 
-
 def create_speech_component():
-    """Create a
+    """Create a speech recognition component compatible with basic Streamlit HTML."""
 
     speech_recognition_html = """
     <!DOCTYPE html>
@@ -65,7 +64,36 @@ def create_speech_component():
     <head>
         <title>Continuous Speech Demo</title>
         <style>
-
+            body {
+                font-family: sans-serif;
+                padding: 20px;
+                max-width: 800px;
+                margin: 0 auto;
+            }
+            button {
+                padding: 10px 20px;
+                margin: 10px 5px;
+                font-size: 16px;
+            }
+            #status {
+                margin: 10px 0;
+                padding: 10px;
+                background: #e8f5e9;
+                border-radius: 4px;
+            }
+            #output {
+                white-space: pre-wrap;
+                padding: 15px;
+                background: #f5f5f5;
+                border-radius: 4px;
+                margin: 10px 0;
+                min-height: 100px;
+                max-height: 400px;
+                overflow-y: auto;
+            }
+            .controls {
+                margin: 10px 0;
+            }
         </style>
     </head>
     <body>
@@ -78,14 +106,6 @@ def create_speech_component():
         <div id="output"></div>
 
         <script>
-            // Function to send data back to Streamlit
-            function sendToStreamlit(data) {
-                window.parent.postMessage({
-                    type: 'streamlit:setComponentValue',
-                    value: data
-                }, '*');
-            }
-
             if (!('webkitSpeechRecognition' in window)) {
                 alert('Speech recognition not supported');
             } else {
@@ -97,7 +117,6 @@ def create_speech_component():
                 const output = document.getElementById('output');
                 let fullTranscript = '';
 
-                // Configure recognition
                 recognition.continuous = true;
                 recognition.interimResults = true;
 
@@ -113,14 +132,17 @@ def create_speech_component():
                     status.textContent = 'Stopped';
                     startButton.disabled = false;
                     stopButton.disabled = true;
-                    // Send final transcript to Streamlit
-                    sendToStreamlit(fullTranscript);
                 };
 
                 clearButton.onclick = () => {
                     fullTranscript = '';
                     output.textContent = '';
-
+                    if (window.parent.document) {
+                        const event = new CustomEvent('transcript-update', {
+                            detail: { transcript: '' }
+                        });
+                        window.parent.document.dispatchEvent(event);
+                    }
                 };
 
                 recognition.onresult = (event) => {
@@ -132,8 +154,6 @@ def create_speech_component():
                         if (event.results[i].isFinal) {
                             finalTranscript += transcript + '\\n';
                             fullTranscript += transcript + '\\n';
-                            // Send update to Streamlit
-                            sendToStreamlit(fullTranscript);
                         } else {
                             interimTranscript += transcript;
                         }
@@ -141,6 +161,13 @@ def create_speech_component():
 
                     output.textContent = fullTranscript + (interimTranscript ? '... ' + interimTranscript : '');
                     output.scrollTop = output.scrollHeight;
+
+                    // Update hidden input with the current transcript
+                    const hiddenInput = document.createElement('input');
+                    hiddenInput.type = 'hidden';
+                    hiddenInput.value = fullTranscript;
+                    hiddenInput.id = 'transcript-value';
+                    document.body.appendChild(hiddenInput);
                 };
 
                 recognition.onend = () => {
@@ -161,14 +188,8 @@ def create_speech_component():
     </html>
     """
 
-    # Create the component
-    component_value = components.html(
-        speech_recognition_html,
-        height=400,
-        key="speech_recognition"
-    )
-
-    return component_value
+    # Create the component without a key
+    return components.html(speech_recognition_html, height=400)
 
 def integrate_speech_component():
     """Integrate the speech component into the main app."""
@@ -178,13 +199,7 @@ def integrate_speech_component():
     # Get the transcript from the component
     transcript = create_speech_component()
 
-    # Update session state if there's new data
-    if transcript is not None and transcript != "":
-        st.session_state.voice_transcript = transcript
-
     return st.session_state.voice_transcript
-
-
 
 
 
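For context on the last two hunks: streamlit.components.v1.html() is render-only. It accepts no key argument and always returns None, so the old components.html(..., key="speech_recognition") call would fail, which is presumably why this commit drops the key and why integrate_speech_component() now simply returns whatever is already in st.session_state.voice_transcript. The hidden transcript-value input and the transcript-update CustomEvent added here live in the component iframe's DOM and do not reach the Python side by themselves. If the transcript must flow back to Python, Streamlit's value-returning pattern needs a declared bidirectional component instead. A minimal sketch, assuming the HTML above is saved as index.html in a hypothetical frontend/ directory whose script loads the Streamlit component lib and calls Streamlit.setComponentValue(fullTranscript) in place of the hidden input:

    import streamlit as st
    import streamlit.components.v1 as components

    # declare_component() wires the iframe into the Streamlit component
    # protocol, so Streamlit.setComponentValue() calls made in the frontend
    # arrive here as the component's return value.
    # "speech_to_text" and the frontend/ path are illustrative names.
    speech_to_text = components.declare_component("speech_to_text", path="frontend")

    def create_speech_component():
        # Returns "" until the frontend sends its first transcript value.
        return speech_to_text(default="", key="speech_recognition")

With such a component, the session-state update removed in the final hunk (if transcript is not None and transcript != "") would behave as originally intended.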