Update app.py
Browse files
app.py
CHANGED
@@ -121,9 +121,11 @@ def generate_response_stream(prompt, history, max_length, temperature, top_p, to
|
|
121 |
|
122 |
params = og.GeneratorParams(model)
|
123 |
params.set_search_options(**search_options)
|
124 |
-
|
|
|
125 |
|
126 |
start_time = time.time()
|
|
|
127 |
generator = og.Generator(model, params)
|
128 |
model_status = "Generating..." # Update status indicator
|
129 |
logging.info("Streaming response...")
|
@@ -157,6 +159,11 @@ def generate_response_stream(prompt, history, max_length, temperature, top_p, to
|
|
157 |
logging.info(f"Generation complete. Tokens: {token_count}, Total Time: {total_time:.2f}s, TTFT: {ttft:.2f}ms, TPS: {tps:.2f}")
|
158 |
model_status = f"Model Ready ({EXECUTION_PROVIDER.upper()} / {model_variant_name})" # Reset status
|
159 |
|
|
|
|
|
|
|
|
|
|
|
160 |
except Exception as e:
|
161 |
logging.error(f"Error during generation: {e}", exc_info=True)
|
162 |
model_status = f"Error during generation: {e}"
|
|
|
121 |
|
122 |
params = og.GeneratorParams(model)
|
123 |
params.set_search_options(**search_options)
|
124 |
+
# FIX: Use the set_input_ids method instead of direct attribute assignment
|
125 |
+
params.set_input_ids(input_tokens)
|
126 |
|
127 |
start_time = time.time()
|
128 |
+
# Create generator AFTER setting parameters including input_ids
|
129 |
generator = og.Generator(model, params)
|
130 |
model_status = "Generating..." # Update status indicator
|
131 |
logging.info("Streaming response...")
|
|
|
159 |
logging.info(f"Generation complete. Tokens: {token_count}, Total Time: {total_time:.2f}s, TTFT: {ttft:.2f}ms, TPS: {tps:.2f}")
|
160 |
model_status = f"Model Ready ({EXECUTION_PROVIDER.upper()} / {model_variant_name})" # Reset status
|
161 |
|
162 |
+
except AttributeError as ae:
|
163 |
+
# Catch potential future API changes or issues during generation setup
|
164 |
+
logging.error(f"AttributeError during generation setup: {ae}", exc_info=True)
|
165 |
+
model_status = f"Generation Setup Error: {ae}"
|
166 |
+
yield f"\n\nSorry, an error occurred setting up generation: {ae}"
|
167 |
except Exception as e:
|
168 |
logging.error(f"Error during generation: {e}", exc_info=True)
|
169 |
model_status = f"Error during generation: {e}"
|