Spaces:

TruthLens
/

sAIvahini

Sleeping

App Files Files Community

TruthLens committed on Mar 18

Commit

88ba4c2

verified ·

1 Parent(s): f170e39

Update app.py

Browse files

Files changed (1) hide show

app.py +32 -22

app.py CHANGED Viewed

@@ -4,23 +4,28 @@ import av
 import wave
 import requests
 import io
-st.title("Sai Vahini AI Voice Assistant 🕉️")
-# ✅ Render API URL (Make sure this matches your deployed API on Render)
-RENDER_API_URL = "https://saivahini.onrender.com/process_audio"  # Update if needed
 # ✅ WebRTC audio processing
 def audio_frame_callback(frame):
     audio = frame.to_ndarray(format="s16le")
     audio_bytes = audio.tobytes()
     st.session_state.frames.append(audio_bytes)
     return av.AudioFrame.from_ndarray(audio, format="s16", layout="mono")
-if "frames" not in st.session_state:
-    st.session_state.frames = []
-# ✅ WebRTC streamer for automatic audio capture
 webrtc_streamer(
     key="audio-recorder",
     mode=WebRtcMode.SENDRECV,
@@ -28,34 +33,39 @@ webrtc_streamer(
     media_stream_constraints={"audio": True, "video": False},
 )
 if st.button("✅ Process Recorded Audio"):
-    if st.session_state.frames:
         with st.spinner("🔄 Processing your voice..."):
-            # ✅ Convert recorded audio frames into WAV format
-            audio_bytes = io.BytesIO()
-            with wave.open(audio_bytes, "wb") as wf:
-                wf.setnchannels(1)
-                wf.setsampwidth(2)
-                wf.setframerate(16000)
-                wf.writeframes(b''.join(st.session_state.frames))
-            audio_bytes.seek(0)
-            # ✅ Send recorded audio to Render API
-            try:
                 response = requests.post(RENDER_API_URL, files={"file": ("audio.wav", audio_bytes, "audio/wav")})
                 # ✅ Handle API response
                 if response.status_code == 200:
                     result = response.json()
                     st.success("✅ AI Response:")
-                    st.write("**Transcription:**", result.get("transcription", "No transcription"))
-                    st.write("**Answer:**", result.get("response", "No response found."))
-                    # ✅ Fetch and play AI-generated audio response
                     audio_response_url = result.get("audio")
                     if audio_response_url:
-                        st.write(f"🔊 Fetching AI-generated voice from: {audio_response_url}")
                         audio_response = requests.get(audio_response_url)
                         if audio_response.status_code == 200:
                             st.audio(audio_response.content, format="audio/wav")

 import wave
 import requests
 import io
+import numpy as np
+st.set_page_config(page_title="Sai Vahini AI Assistant", layout="centered")
+# ✅ Render API URL (Ensure this matches your deployed API on Render)
+RENDER_API_URL = "https://saivahini.onrender.com/process_audio"
+# ✅ UI Header
+st.markdown("<h1 style='text-align: center; color: #ff5733;'>Sai Vahini AI Voice Assistant 🕉️</h1>", unsafe_allow_html=True)
 # ✅ WebRTC audio processing
 def audio_frame_callback(frame):
+    """Handles incoming audio frames from WebRTC"""
     audio = frame.to_ndarray(format="s16le")
     audio_bytes = audio.tobytes()
+    if "frames" not in st.session_state:
+        st.session_state.frames = []
     st.session_state.frames.append(audio_bytes)
     return av.AudioFrame.from_ndarray(audio, format="s16", layout="mono")
+# ✅ WebRTC Streamer for recording
+st.write("🎤 **Click below to start speaking...**")
 webrtc_streamer(
     key="audio-recorder",
     mode=WebRtcMode.SENDRECV,
     media_stream_constraints={"audio": True, "video": False},
 )
+# ✅ Check if audio frames exist
+if "frames" not in st.session_state or not st.session_state.frames:
+    st.warning("⚠️ No audio recorded. Click the button above to start recording.")
+# ✅ Process Button
 if st.button("✅ Process Recorded Audio"):
+    if "frames" in st.session_state and st.session_state.frames:
         with st.spinner("🔄 Processing your voice..."):
+            try:
+                # ✅ Convert recorded audio frames into WAV format
+                audio_bytes = io.BytesIO()
+                with wave.open(audio_bytes, "wb") as wf:
+                    wf.setnchannels(1)
+                    wf.setsampwidth(2)
+                    wf.setframerate(16000)
+                    wf.writeframes(b''.join(st.session_state.frames))
+                audio_bytes.seek(0)  # Reset buffer pointer
+                # ✅ Send recorded audio to Render API
                 response = requests.post(RENDER_API_URL, files={"file": ("audio.wav", audio_bytes, "audio/wav")})
                 # ✅ Handle API response
                 if response.status_code == 200:
                     result = response.json()
                     st.success("✅ AI Response:")
+                    st.write("📝 **Transcription:**", result.get("transcription", "No transcription"))
+                    st.write("🤖 **Answer:**", result.get("response", "No response found."))
+                    # ✅ Fetch and play AI-generated voice response
                     audio_response_url = result.get("audio")
                     if audio_response_url:
+                        st.write(f"🔊 **AI-generated voice response:**")
                         audio_response = requests.get(audio_response_url)
                         if audio_response.status_code == 200:
                             st.audio(audio_response.content, format="audio/wav")