Spaces:
Sleeping
Sleeping
reduction
Browse files
app.py
CHANGED
@@ -47,14 +47,14 @@ def generate_response(user_input, history):
|
|
47 |
])
|
48 |
messages += f"\n<|user|>:{user_input}\n<|assistant|>:"
|
49 |
model_inputs = tokenizer([messages], return_tensors="pt").to(device)
|
50 |
-
streamer = TextIteratorStreamer(tokenizer, timeout=[...]
|
51 |
generate_kwargs = dict(
|
52 |
**model_inputs,
|
53 |
streamer=streamer,
|
54 |
-
max_new_tokens=[...]
|
55 |
do_sample=True,
|
56 |
-
top_p=0.[...]
|
57 |
-
top_k=[...]
|
58 |
temperature=0.7,
|
59 |
num_beams=1,
|
60 |
stopping_criteria=StoppingCriteriaList([stop])
|
|
|
47 |
])
|
48 |
messages += f"\n<|user|>:{user_input}\n<|assistant|>:"
|
49 |
model_inputs = tokenizer([messages], return_tensors="pt").to(device)
|
50 |
+
streamer = TextIteratorStreamer(tokenizer, timeout=5.0, skip_prompt=True, skip_special_tokens=True)
|
51 |
generate_kwargs = dict(
|
52 |
**model_inputs,
|
53 |
streamer=streamer,
|
54 |
+
max_new_tokens=256,
|
55 |
do_sample=True,
|
56 |
+
top_p=0.9,
|
57 |
+
top_k=12,
|
58 |
temperature=0.7,
|
59 |
num_beams=1,
|
60 |
stopping_criteria=StoppingCriteriaList([stop])
|