CamiloVega committed on
Commit 89bb689 · verified · 1 Parent(s): f3affeb

Update app.py

Files changed (1)
  1. app.py +4 -28
app.py CHANGED
@@ -94,12 +94,9 @@ def generate_response(user_input, chat_history):
         conversation_history = ""
         if chat_history:
             for message in chat_history:
-                # Remove any [INST] tags from the history
-                user_msg = message[0].replace("[INST]", "").replace("[/INST]", "").strip()
-                assistant_msg = message[1].replace("[INST]", "").replace("[/INST]", "").strip()
-                conversation_history += f"[INST] {user_msg} [/INST] {assistant_msg} "
+                conversation_history += f"{message[0]} {message[1]} "
 
-        prompt = f"<s>[INST] {system_message}\n\n{conversation_history}[INST] {user_input} [/INST]"
+        prompt = f"[INST] {system_message}\n\n{conversation_history}{user_input}"
 
         logger.info("Generating model response...")
         outputs = model_gen(
@@ -107,38 +104,16 @@ def generate_response(user_input, chat_history):
             max_new_tokens=256,
             return_full_text=False,
             pad_token_id=tokenizer.eos_token_id,
-            do_sample=True,
-            temperature=0.7,
-            top_p=0.9,
-            repetition_penalty=1.1
         )
         logger.info("Model response generated successfully")
 
-        # Clean up the response by removing any [INST] tags and trimming
         assistant_response = outputs[0]['generated_text'].strip()
-        assistant_response = assistant_response.replace("[INST]", "").replace("[/INST]", "").strip()
-
-        # If the response is too short, try to generate a more detailed one
-        if len(assistant_response.split()) < 10:
-            prompt += "\nPlease provide a more detailed answer with context and explanation."
-            outputs = model_gen(
-                prompt,
-                max_new_tokens=256,
-                return_full_text=False,
-                pad_token_id=tokenizer.eos_token_id,
-                do_sample=True,
-                temperature=0.7,
-                top_p=0.9,
-                repetition_penalty=1.1
-            )
-            assistant_response = outputs[0]['generated_text'].strip()
-            assistant_response = assistant_response.replace("[INST]", "").replace("[/INST]", "").strip()
 
         # Calculate water consumption for output
         output_water_consumption = calculate_water_consumption(assistant_response, False)
         total_water_consumption += output_water_consumption
 
-        # Update chat history with the cleaned messages
+        # Update chat history with the new formatted messages
        chat_history.append([user_input, assistant_response])
 
         # Prepare water consumption message
@@ -163,6 +138,7 @@ def generate_response(user_input, chat_history):
         error_message = f"An error occurred: {str(e)}"
         chat_history.append([user_input, error_message])
         return chat_history, show_water
+
 
 # Constants for water consumption calculation
 WATER_PER_TOKEN = {
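
For context, a minimal, self-contained sketch of the prompt flow the updated code uses. This is an illustration only: the model name, system message, and sample history below are placeholder assumptions, not values from the repository, and app.py builds its own model_gen pipeline and tokenizer elsewhere.

# Standalone sketch (assumed setup; only the prompt-building and the
# model_gen call mirror the diff above).
from transformers import AutoTokenizer, pipeline

model_name = "mistralai/Mistral-7B-Instruct-v0.2"  # hypothetical model choice
tokenizer = AutoTokenizer.from_pretrained(model_name)
model_gen = pipeline("text-generation", model=model_name, tokenizer=tokenizer)

system_message = "You are a helpful assistant."        # placeholder
chat_history = [["Hello", "Hi! How can I help you?"]]  # [user, assistant] pairs
user_input = "Tell me about water use in AI."          # placeholder question

# Flatten the history by plain concatenation, with no per-turn [INST] tags
# and no tag stripping afterwards.
conversation_history = ""
for message in chat_history:
    conversation_history += f"{message[0]} {message[1]} "

# Single [INST] prefix for the whole prompt.
prompt = f"[INST] {system_message}\n\n{conversation_history}{user_input}"

# Generation with library defaults for decoding (no sampling arguments).
outputs = model_gen(
    prompt,
    max_new_tokens=256,
    return_full_text=False,
    pad_token_id=tokenizer.eos_token_id,
)
assistant_response = outputs[0]["generated_text"].strip()
print(assistant_response)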