Update app.py
Gopikanth123 committed
app.py CHANGED
@@ -1,67 +1,36 @@
 import streamlit as st
-[old lines 2-23: the opening of the embedded speech-recognition HTML/JS was not preserved in this diff view]
-            document.getElementById('output').textContent = transcript;
-            // Send transcript back to Streamlit using postMessage
-            window.parent.postMessage({func: 'update_output', transcript: transcript}, '*');
-        };
-
-        recognition.onerror = function(event) {
-            console.error("Speech recognition error", event.error);
-            document.getElementById('output').textContent = "Error in recognition";
-        };
-
-        function startRecognition() {
-            recognition.start();
-        }
-    </script>
-</body>
-</html>
-"""
+from transformers import pipeline
+from streamlit_webrtc import webrtc_streamer, WebRtcMode
+import av
+import numpy as np
+import threading
+
+# ASR Model
+pipe = pipeline("automatic-speech-recognition", model="facebook/s2t-medium-mustc-multilingual-st")
+
+# Frame callbacks run on a worker thread where st.session_state is not
+# available, so the audio is buffered in module-level state behind a lock.
+buffer_lock = threading.Lock()
+audio_buffer = bytearray()
+
+# Function to process audio frames: down-mix to mono int16 and buffer the bytes
+def audio_callback(frame: av.AudioFrame) -> av.AudioFrame:
+    pcm = frame.to_ndarray()  # int16 samples, interleaved across channels
+    mono = pcm.reshape(-1, len(frame.layout.channels)).mean(axis=1).astype(np.int16)
+    with buffer_lock:
+        audio_buffer.extend(mono.tobytes())
+    return frame
+
+# Transcribe audio buffer
+def transcribe_audio():
+    with buffer_lock:
+        pcm = np.frombuffer(bytes(audio_buffer), dtype=np.int16)
+    if pcm.size == 0:
+        st.write("No audio captured yet.")
+        return
+    audio = pcm.astype(np.float32) / 32768.0  # int16 -> float32 in [-1, 1]
+    result = pipe({"raw": audio, "sampling_rate": 48000})  # WebRTC audio is typically 48 kHz
+    st.write("Transcription:", result["text"])

 # Streamlit UI
-st.title("
-st.write("Click the button below and start speaking. The recognized text will be shown here:")
-
-# Display the HTML with the embedded speech recognition
-components.html(speech_recognition_html, height=200)
-
-# Output area where the recognized speech will be displayed
-output = st.empty()
+st.title("Voice Recognition App")

-    <script>
-        window.addEventListener('message', function(event) {
-            if (event.data.func === 'update_output') {
-                document.getElementById('output').textContent = event.data.transcript;
-                // Update the Streamlit text area with the transcript
-                window.parent.postMessage({func: 'update_text_area', text: event.data.transcript}, '*');
-            }
-        });
-    </script>
-    """, height=0)
+webrtc_streamer(
+    key="audio",
+    mode=WebRtcMode.SENDRECV,
+    audio_frame_callback=audio_callback,  # called once per incoming audio frame
+    media_stream_constraints={"audio": True, "video": False},
+)

+if st.button("Transcribe Audio"):
+    transcribe_audio()
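streamlit_webrtc also offers a class-based alternative to the plain audio_frame_callback: audio_processor_factory expects a class (not a bare function) whose recv() method is invoked once per frame, so per-stream state can live on the instance instead of at module level. A minimal sketch, assuming streamlit_webrtc's AudioProcessorBase and the context's audio_processor attribute; BufferingAudioProcessor is a hypothetical name:

import av
import streamlit as st
from streamlit_webrtc import AudioProcessorBase, WebRtcMode, webrtc_streamer

class BufferingAudioProcessor(AudioProcessorBase):
    def __init__(self) -> None:
        self.frames: list[av.AudioFrame] = []

    def recv(self, frame: av.AudioFrame) -> av.AudioFrame:
        self.frames.append(frame)  # keep the frame for later transcription
        return frame               # pass the audio through unchanged

ctx = webrtc_streamer(
    key="audio-class-based",
    mode=WebRtcMode.SENDRECV,
    audio_processor_factory=BufferingAudioProcessor,
    media_stream_constraints={"audio": True, "video": False},
)

# The live processor instance is reachable from the script thread via the context:
if ctx.audio_processor:
    st.caption(f"{len(ctx.audio_processor.frames)} audio frames buffered")

The context also exposes ctx.state.playing, which can gate the "Transcribe Audio" button so it is only active while the stream is running.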
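The transcription call in app.py hard-codes 48 kHz, the usual WebRTC capture rate, but the rate is not guaranteed. A more defensive sketch reads it from the frames themselves (frame.sample_rate is PyAV's per-frame rate) and passes it to the pipeline; in my understanding the transformers ASR pipeline resamples a raw/sampling_rate input to the model's expected rate (16 kHz for the S2T models), though that behavior and its torchaudio dependency are worth verifying. The lock from app.py is omitted here to keep the sketch short.

import av
import numpy as np
from transformers import pipeline

pipe = pipeline("automatic-speech-recognition",
                model="facebook/s2t-medium-mustc-multilingual-st")

state = {"rate": 48000, "pcm": bytearray()}  # fallback rate until a frame arrives

def audio_callback(frame: av.AudioFrame) -> av.AudioFrame:
    state["rate"] = frame.sample_rate  # actual capture rate reported by PyAV
    mono = (frame.to_ndarray()
            .reshape(-1, len(frame.layout.channels))
            .mean(axis=1)
            .astype(np.int16))
    state["pcm"].extend(mono.tobytes())
    return frame

def transcribe() -> str:
    audio = np.frombuffer(bytes(state["pcm"]), dtype=np.int16).astype(np.float32) / 32768.0
    # Passing the true rate lets the pipeline resample to the model's expected rate.
    return pipe({"raw": audio, "sampling_rate": state["rate"]})["text"]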