meraj12 committed
Commit b2cade9 · verified · 1 Parent(s): c22cdba

Update app.py

Files changed (1)
  1. app.py +63 -36
app.py CHANGED
@@ -13,50 +13,77 @@ whisper_model = whisper.load_model("tiny")
 groq_client = Groq(api_key=os.environ.get("GROQ_API_KEY"))
 
 st.set_page_config(page_title="Voice Chat", layout="centered")
-st.title("🎤 Voice Chat using Your Cloned Voice")
+st.title("🎤💬 Voice & Text Chat using Your Cloned Voice")
 
 # Store cloned voice path
 if "clone_path" not in st.session_state:
     st.session_state.clone_path = None
 
-st.sidebar.header("Setup Your Clone Voice")
-voice_option = st.sidebar.radio("Choose how to provide clone voice", ["Upload Voice", "Record Voice"])
+st.sidebar.header("🧬 Setup Your Clone Voice")
+voice_option = st.sidebar.radio("Choose how to provide clone voice", ["Upload Voice"])
 
 if voice_option == "Upload Voice":
     uploaded = st.sidebar.file_uploader("Upload a voice sample", type=["wav", "mp3", "m4a", "flac", "ogg"])
     if uploaded:
         path = save_uploaded_audio(uploaded, "reference_voice.wav")
         st.session_state.clone_path = path
-        st.success("Voice uploaded and saved as your clone voice.")
-
-# --- Main conversation section ---
-st.subheader("🗣️ Ask something using your voice")
-
-user_voice = st.file_uploader("Upload your voice question", type=["wav", "mp3", "m4a", "flac", "ogg"])
-
-if user_voice:
-    user_voice_path = save_uploaded_audio(user_voice, "user_question.wav")
-    st.audio(user_voice_path)
-
-    # Step 1: Transcribe
-    st.info("Transcribing...")
-    result = whisper_model.transcribe(user_voice_path)
-    user_text = result["text"]
-    st.success(f"📝 You said: {user_text}")
-
-    # Step 2: Generate LLM response
-    st.info("Thinking...")
-    response = groq_client.chat.completions.create(
-        model="llama3-8b-8192",
-        messages=[{"role": "user", "content": user_text}]
-    )
-    reply = response.choices[0].message.content
-    st.success(f"🤖 AI says: {reply}")
-
-    # Step 3: Speak back in your clone voice
-    if st.session_state.clone_path:
-        st.info("Generating voice reply using your cloned voice...")
-        voice_output_path = clone_and_generate_text(reply, st.session_state.clone_path)
-        st.audio(voice_output_path)
-    else:
-        st.warning("Please upload your clone voice first in the sidebar.")
+        st.success("✅ Voice uploaded and saved as your clone voice.")
+
+# --- Conversation section ---
+st.subheader("🗣️ Ask with voice or type text below")
+
+tab1, tab2 = st.tabs(["🎤 Voice Input", "💬 Text Input"])
+
+# --- VOICE INPUT TAB ---
+with tab1:
+    user_voice = st.file_uploader("Upload your voice question", type=["wav", "mp3", "m4a", "flac", "ogg"])
+    if user_voice:
+        user_voice_path = save_uploaded_audio(user_voice, "user_question.wav")
+        st.audio(user_voice_path)
+
+        # Step 1: Transcribe voice
+        st.info("Transcribing...")
+        result = whisper_model.transcribe(user_voice_path)
+        user_text = result["text"]
+        st.success(f"📝 You said: {user_text}")
+
+        # Step 2: Get LLM response
+        st.info("Thinking...")
+        response = groq_client.chat.completions.create(
+            model="llama3-8b-8192",
+            messages=[{"role": "user", "content": user_text}]
+        )
+        reply = response.choices[0].message.content
+        st.success(f"🤖 AI says: {reply}")
+
+        # Step 3: Voice reply
+        if st.session_state.clone_path:
+            st.info("Cloning voice reply...")
+            voice_output_path = clone_and_generate_text(reply, st.session_state.clone_path)
+            st.audio(voice_output_path)
+        else:
+            st.warning("Upload your voice clone first in the sidebar.")
+
+# --- TEXT INPUT TAB ---
+with tab2:
+    user_input = st.text_input("Type your question here:")
+    if st.button("Send Text"):
+        if user_input.strip() == "":
+            st.warning("Please enter a message.")
+        else:
+            # Step 1: Get LLM response
+            st.info("Thinking...")
+            response = groq_client.chat.completions.create(
+                model="llama3-8b-8192",
+                messages=[{"role": "user", "content": user_input}]
+            )
+            reply = response.choices[0].message.content
+            st.success(f"🤖 AI says: {reply}")
+
+            # Step 2: Voice reply
+            if st.session_state.clone_path:
+                st.info("Cloning voice reply...")
+                voice_output_path = clone_and_generate_text(reply, st.session_state.clone_path)
+                st.audio(voice_output_path)
+            else:
+                st.warning("Upload your voice clone first in the sidebar.")
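
Note: the hunk starts at line 13 of app.py, so the imports and the two helpers the snippet calls (save_uploaded_audio and clone_and_generate_text) are defined above the visible diff and are unchanged by this commit. The following is only a minimal sketch of what such helpers could look like, assuming Coqui TTS (XTTS v2) as the voice-cloning backend; the Space's actual implementation may differ.

import os

import streamlit as st
import whisper
from groq import Groq
from TTS.api import TTS  # assumption: Coqui TTS (XTTS v2) used for cloning

# Hypothetical stand-in: write the uploaded audio to disk and return its path.
def save_uploaded_audio(uploaded_file, filename):
    with open(filename, "wb") as f:
        f.write(uploaded_file.read())
    return filename

# Hypothetical stand-in: synthesize `text` in the voice of `speaker_wav`
# and return the path of the generated audio file.
_tts = TTS("tts_models/multilingual/multi-dataset/xtts_v2")

def clone_and_generate_text(text, speaker_wav):
    out_path = "cloned_reply.wav"
    _tts.tts_to_file(text=text, speaker_wav=speaker_wav,
                     language="en", file_path=out_path)
    return out_path

whisper_model = whisper.load_model("tiny")

Treat the above only as a sketch of the expected signatures (path in, path out); the real helpers may use a different TTS model, output directory, or audio format.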