max new tokens on generation 256
app.py
@@ -42,7 +42,8 @@ def llama_generation(input_text: str,
                                   return_tensors='pt').to('cuda')
 
     # llama generation looks for the numeric vectors not the tensors so there is no need for **input_ids rather just input_ids
-    output_ids = llama_model.generate(input_ids=input_ids)
+    output_ids = llama_model.generate(input_ids=input_ids,
+                                      max_new_tokens=256)
 
     # Decode
     output_text = llama_tokenizer.decode(output_ids[0],
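For context, here is a minimal sketch of the generation path this diff touches, assuming a standard transformers setup. The model id, the single-argument llama_generation signature, and the skip_special_tokens flag are assumptions; the diff only shows a few lines of app.py. The motivation for the change: without max_new_tokens, generate() falls back to the model's GenerationConfig, whose default max_length is 20 total tokens, so any non-trivial prompt leaves almost no room for a reply.

import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

# Hypothetical checkpoint; the actual model loaded by app.py is not shown in the diff.
MODEL_ID = "meta-llama/Llama-2-7b-chat-hf"

llama_tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
llama_model = AutoModelForCausalLM.from_pretrained(
    MODEL_ID, torch_dtype=torch.float16).to('cuda')

def llama_generation(input_text: str) -> str:
    # Tokenize the prompt into a tensor of token ids on the GPU.
    # .input_ids pulls the id tensor out of the BatchEncoding, since
    # generate() expects the tensor itself, passed as input_ids=...
    # rather than unpacked with **inputs.
    input_ids = llama_tokenizer(input_text,
                                return_tensors='pt').to('cuda').input_ids

    # Cap the response at 256 newly generated tokens, the change this
    # commit makes; max_new_tokens counts only the reply, independent
    # of prompt length.
    output_ids = llama_model.generate(input_ids=input_ids,
                                      max_new_tokens=256)

    # Decode the generated ids back to text.
    output_text = llama_tokenizer.decode(output_ids[0],
                                         skip_special_tokens=True)
    return output_text

max_new_tokens is generally preferable to max_length here because it bounds the reply itself; max_length counts prompt plus reply, so a long prompt can silently consume the whole budget.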