Spaces:

TruthLens
/

sAIvahini

Sleeping

App Files Community

TruthLens committed on Mar 18

Commit

48d87a8

verified ·

1 Parent(s): 314672c

Update app.py

Browse files

Files changed (1) hide show

app.py +67 -58

app.py CHANGED Viewed

@@ -1,9 +1,7 @@
 import streamlit as st
 import requests
-import numpy as np
-import sounddevice as sd
-import wave
 import io
 # ✅ Set Streamlit Page Config
 st.set_page_config(page_title="Sai Vahini AI Assistant", layout="centered")
@@ -14,70 +12,81 @@ RENDER_API_URL = "https://saivahini.onrender.com/process_audio"
 # ✅ UI Header
 st.markdown("<h1 style='text-align: center; color: #ff5733;'>Sai Vahini AI Voice Assistant 🕉️</h1>", unsafe_allow_html=True)
-# ✅ Audio recording parameters
-DURATION = 5  # Recording duration in seconds
-SAMPLE_RATE = 16000
-# ✅ Function to record audio
-def record_audio():
-    """Records live audio and saves it as a WAV file"""
-    st.info("🎤 Recording... Speak now!")
-    audio = sd.rec(int(DURATION * SAMPLE_RATE), samplerate=SAMPLE_RATE, channels=1, dtype=np.int16)
-    sd.wait()  # Wait until recording is finished
-    st.success("✅ Recording completed!")
-    # ✅ Save the audio as a WAV file
-    audio_bytes = io.BytesIO()
-    with wave.open(audio_bytes, "wb") as wf:
-        wf.setnchannels(1)
-        wf.setsampwidth(2)
-        wf.setframerate(SAMPLE_RATE)
-        wf.writeframes(audio.tobytes())
-    audio_bytes.seek(0)
-    return audio_bytes
-# ✅ Record button
-if st.button("🎤 Record Live Audio"):
-    audio_file = record_audio()
-    st.session_state["audio_data"] = audio_file
-# ✅ Play recorded audio before sending
-if "audio_data" in st.session_state:
-    st.audio(st.session_state["audio_data"], format="audio/wav")
 # ✅ Process Button
 if st.button("✅ Process Recorded Audio"):
-    if "audio_data" in st.session_state:
-        with st.spinner("🔄 Sending audio to AI model..."):
-            try:
-                # ✅ Send recorded audio to Render API
-                response = requests.post(RENDER_API_URL, files={"file": ("audio.wav", st.session_state["audio_data"], "audio/wav")})
-                # ✅ Handle API response
-                if response.status_code == 200:
-                    result = response.json()
-                    st.success("✅ AI Response:")
-                    st.write("📝 **Transcription:**", result.get("transcription", "No transcription"))
-                    st.write("🤖 **Answer:**", result.get("response", "No response found."))
-                    # ✅ Fetch and play AI-generated voice response
-                    audio_response_url = result.get("audio")
-                    if audio_response_url:
-                        st.write("🔊 **AI-generated voice response:**")
-                        audio_response = requests.get(audio_response_url)
-                        if audio_response.status_code == 200:
-                            st.audio(audio_response.content, format="audio/wav")
-                        else:
-                            st.error(f"❌ Failed to load AI audio ({audio_response.status_code})")
-                    else:
-                        st.warning("⚠️ No audio response received from API.")
                 else:
-                    st.error(f"❌ API Error: {response.status_code} - {response.text}")
-            except requests.exceptions.RequestException as e:
-                st.error(f"❌ Failed to connect to API: {str(e)}")
-    else:
-        st.error("⚠️ No audio recorded. Click 'Record Live Audio' first!")

 import streamlit as st
 import requests
 import io
+import base64
 # ✅ Set Streamlit Page Config
 st.set_page_config(page_title="Sai Vahini AI Assistant", layout="centered")
 # ✅ UI Header
 st.markdown("<h1 style='text-align: center; color: #ff5733;'>Sai Vahini AI Voice Assistant 🕉️</h1>", unsafe_allow_html=True)
+# ✅ HTML5 Audio Recorder (JavaScript + Streamlit)
+audio_recorder_html = """
+    <script>
+        let mediaRecorder;
+        let audioChunks = [];
+        function startRecording() {
+            navigator.mediaDevices.getUserMedia({ audio: true }).then(stream => {
+                mediaRecorder = new MediaRecorder(stream);
+                mediaRecorder.start();
+                mediaRecorder.ondataavailable = event => {
+                    audioChunks.push(event.data);
+                };
+                mediaRecorder.onstop = () => {
+                    const audioBlob = new Blob(audioChunks, { type: 'audio/wav' });
+                    const reader = new FileReader();
+                    reader.readAsDataURL(audioBlob);
+                    reader.onloadend = () => {
+                        fetch("/upload_audio", {
+                            method: "POST",
+                            headers: { "Content-Type": "application/json" },
+                            body: JSON.stringify({ audio: reader.result })
+                        }).then(response => response.json()).then(data => {
+                            document.getElementById("audio_url").value = data.audio_url;
+                        });
+                    };
+                };
+            });
+        }
+        function stopRecording() {
+            mediaRecorder.stop();
+        }
+    </script>
+    <button onclick="startRecording()">🎤 Start Recording</button>
+    <button onclick="stopRecording()">⏹ Stop Recording</button>
+    <input type="hidden" id="audio_url">
+"""
+# ✅ Display HTML5 Recorder
+st.components.v1.html(audio_recorder_html, height=150)
 # ✅ Process Button
 if st.button("✅ Process Recorded Audio"):
+    with st.spinner("🔄 Sending audio to AI model..."):
+        audio_url = st.session_state.get("audio_url", None)
+        if audio_url:
+            # Decode the Base64 payload after the comma (data-URL style) into raw bytes; no WAV conversion is performed
+            audio_data = base64.b64decode(audio_url.split(",")[1])
+            audio_bytes = io.BytesIO(audio_data)
+            # ✅ Send recorded audio to Render API
+            response = requests.post(RENDER_API_URL, files={"file": ("audio.wav", audio_bytes, "audio/wav")})
+            # ✅ Handle API response
+            if response.status_code == 200:
+                result = response.json()
+                st.success("✅ AI Response:")
+                st.write("📝 **Transcription:**", result.get("transcription", "No transcription"))
+                st.write("🤖 **Answer:**", result.get("response", "No response found."))
+                # ✅ Fetch and play AI-generated voice response
+                audio_response_url = result.get("audio")
+                if audio_response_url:
+                    st.write("🔊 **AI-generated voice response:**")
+                    audio_response = requests.get(audio_response_url)
+                    if audio_response.status_code == 200:
+                        st.audio(audio_response.content, format="audio/wav")
+                    else:
+                        st.error(f"❌ Failed to load AI audio ({audio_response.status_code})")
                 else:
+                    st.warning("⚠️ No audio response received from API.")
+            else:
+                st.error(f"❌ API Error: {response.status_code} - {response.text}")
+        else:
+            st.error("⚠️ No audio recorded. Please record first!")