KraTUZen committed on
Commit
d8c974e
·
1 Parent(s): 4dbff1b
Files changed (1) hide show
  1. app.py +4 -4
app.py CHANGED
@@ -47,14 +47,14 @@ def generate_response(user_input, history):
47
  ])
48
  messages += f"\n<|user|>:{user_input}\n<|assistant|>:"
49
  model_inputs = tokenizer([messages], return_tensors="pt").to(device)
50
- streamer = TextIteratorStreamer(tokenizer, timeout=10.0, skip_prompt=True, skip_special_tokens=True)
51
  generate_kwargs = dict(
52
  **model_inputs,
53
  streamer=streamer,
54
- max_new_tokens=1024,
55
  do_sample=True,
56
- top_p=0.95,
57
- top_k=50,
58
  temperature=0.7,
59
  num_beams=1,
60
  stopping_criteria=StoppingCriteriaList([stop])
 
47
  ])
48
  messages += f"\n<|user|>:{user_input}\n<|assistant|>:"
49
  model_inputs = tokenizer([messages], return_tensors="pt").to(device)
50
+ streamer = TextIteratorStreamer(tokenizer, timeout=5.0, skip_prompt=True, skip_special_tokens=True)
51
  generate_kwargs = dict(
52
  **model_inputs,
53
  streamer=streamer,
54
+ max_new_tokens=256,
55
  do_sample=True,
56
+ top_p=0.9,
57
+ top_k=12,
58
  temperature=0.7,
59
  num_beams=1,
60
  stopping_criteria=StoppingCriteriaList([stop])