Update app.py
app.py CHANGED
```diff
@@ -21,7 +21,7 @@ if not os.path.exists(MODEL_PATH):
                 f.write(chunk)
         st.success("Model downloaded successfully!")
     except requests.exceptions.HTTPError as e:
-        st.error(
+        st.error("🚨 Model download failed. Please try again later.")
         st.stop()
 
 # ✅ Load optimized model with reduced context length
@@ -34,33 +34,30 @@ try:
         numa=True,
         n_batch=64  # ✅ Faster token processing
     )
-    st.write("✅ Model loaded successfully!")
 except Exception as e:
-    st.error(
+    st.error("🚨 Error loading model. Please restart the application.")
     st.stop()
 
-#
+# 💬 User-Friendly Chat Interface
 st.title("🤖 Phi-3 Mini Chatbot")
-st.markdown("
+st.markdown("### Ask me anything and I'll provide helpful responses!")
 
 # Chat history
 if "messages" not in st.session_state:
     st.session_state["messages"] = []
 
 # Display chat history
-for message in st.session_state["messages"]:
-    role, text = message
-    if role == "user":
-        st.chat_message("user").write(text)
-    else:
-        st.chat_message("assistant").write(text)
+for role, text in st.session_state["messages"]:
+    with st.chat_message(role):
+        st.write(text)
 
 # Input field for user message
 user_input = st.text_input("Your Message:", "", key="user_input")
 if st.button("Send") and user_input:
     # Add user input to chat history
     st.session_state["messages"].append(("user", user_input))
-    st.chat_message("user")
+    with st.chat_message("user"):
+        st.write(user_input)
 
     # ✅ Use a minimal prompt format (no system message)
     formatted_messages = [{"role": "user", "content": user_input}]
@@ -68,24 +65,24 @@ if st.button("Send") and user_input:
     # ✅ Speed improvements: Increase max_tokens for full responses & ensure proper stopping
     response_data = st.session_state["model"].create_chat_completion(
         messages=formatted_messages,
-        max_tokens=
+        max_tokens=96, temperature=0.5, top_p=0.8,
         stop=["\n", "<|endoftext|>"],  # ✅ Ensures responses end properly
-        stream=False
+        stream=False
     )
 
-    # ✅
-    st.write("🔍 Debug: Raw Model Response:", response_data)
-
+    # ✅ Extract and display response
     if "choices" in response_data and len(response_data["choices"]) > 0:
         choice = response_data["choices"][0]
         if "message" in choice and "content" in choice["message"]:
             response_text = choice["message"]["content"].strip()
             st.session_state["messages"].append(("assistant", response_text))
-            st.chat_message("assistant")
+            with st.chat_message("assistant"):
+                st.write(response_text)
         else:
-            st.error("⚠️
+            st.error("⚠️ Unable to generate a response. Please try again.")
     else:
-        st.error("⚠️
+        st.error("⚠️ No response received. Please ask again.")
+
```
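The hunks above show only fragments of the surrounding file. For context, here is a minimal self-contained sketch of the download and model-setup blocks the new version implies, assuming the llama-cpp-python `Llama` class; `MODEL_URL`, the chunk size, `n_ctx=512`, `n_threads=4`, and the `if "model" not in st.session_state` guard are illustrative assumptions that are not visible in the diff:

```python
import os

import requests
import streamlit as st
from llama_cpp import Llama

MODEL_PATH = "phi-3-mini.gguf"                     # assumed local filename
MODEL_URL = "https://example.com/phi-3-mini.gguf"  # placeholder URL

# Download the GGUF weights once, streaming to disk chunk by chunk.
if not os.path.exists(MODEL_PATH):
    try:
        with requests.get(MODEL_URL, stream=True, timeout=60) as r:
            r.raise_for_status()  # raises requests.exceptions.HTTPError on 4xx/5xx
            with open(MODEL_PATH, "wb") as f:
                for chunk in r.iter_content(chunk_size=8192):
                    f.write(chunk)
        st.success("Model downloaded successfully!")
    except requests.exceptions.HTTPError:
        st.error("🚨 Model download failed. Please try again later.")
        st.stop()

# ✅ Load optimized model with reduced context length, kept in session_state
# so Streamlit's script re-runs don't reload the weights on every interaction.
if "model" not in st.session_state:
    try:
        st.session_state["model"] = Llama(
            model_path=MODEL_PATH,
            n_ctx=512,     # assumed "reduced context length"
            n_threads=4,   # assumed thread count
            numa=True,
            n_batch=64,    # ✅ Faster token processing
        )
    except Exception:
        st.error("🚨 Error loading model. Please restart the application.")
        st.stop()
```

Storing the `Llama` instance in `st.session_state` is what lets the later `st.session_state["model"].create_chat_completion(...)` call in the diff work across re-runs.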
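And a matching sketch of the send-and-respond path after this change, using the generation parameters from the `+` lines. The chat widgets are standard Streamlit (`st.chat_message` works as a context manager); the flat `.get()`-based extraction is a defensive variant of the diff's nested `if` checks, with its two error branches merged here:

```python
st.title("🤖 Phi-3 Mini Chatbot")

if "messages" not in st.session_state:
    st.session_state["messages"] = []

# Replay the chat history on every re-run.
for role, text in st.session_state["messages"]:
    with st.chat_message(role):
        st.write(text)

user_input = st.text_input("Your Message:", "", key="user_input")
if st.button("Send") and user_input:
    st.session_state["messages"].append(("user", user_input))
    with st.chat_message("user"):
        st.write(user_input)

    # Minimal prompt format, as in the diff: one user message, no system prompt.
    response_data = st.session_state["model"].create_chat_completion(
        messages=[{"role": "user", "content": user_input}],
        max_tokens=96,
        temperature=0.5,
        top_p=0.8,
        stop=["\n", "<|endoftext|>"],  # generation halts at the first newline
        stream=False,
    )

    # llama-cpp-python returns an OpenAI-style dict:
    # {"choices": [{"message": {"content": ...}}], ...}
    choices = response_data.get("choices") or []
    message = choices[0].get("message", {}) if choices else {}
    if "content" in message:
        response_text = message["content"].strip()
        st.session_state["messages"].append(("assistant", response_text))
        with st.chat_message("assistant"):
            st.write(response_text)
    else:
        st.error("⚠️ Unable to generate a response. Please try again.")
```

One consequence of the chosen stop list: because `"\n"` is a stop token, generation ends at the first newline, so every reply is a single line; dropping `"\n"` would allow multi-line answers at the cost of longer generations.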