Changed temperature to 0.5 for more focused responses
Browse files
app.py
CHANGED
@@ -44,7 +44,7 @@ def llama_generation(input_text: str,
|
|
44 |
# llama generation looks for the numeric vectors not the tensors so there is no need for **input_ids rather just input_ids
|
45 |
output_ids = llama_model.generate(input_ids=input_ids,
|
46 |
max_new_tokens=256,
|
47 |
-
temperature=0.
|
48 |
top_p=0.9,
|
49 |
repetition_penalty=2.0)
|
50 |
|
|
|
44 |
# llama generation looks for the numeric vectors not the tensors so there is no need for **input_ids rather just input_ids
|
45 |
output_ids = llama_model.generate(input_ids=input_ids,
|
46 |
max_new_tokens=256,
|
47 |
+
temperature=0.5,
|
48 |
top_p=0.9,
|
49 |
repetition_penalty=2.0)
|
50 |
|