Spaces:

sandz7
/

loki

Runtime error

sandz7 committed on May 23, 2024

Commit

c6e3099

1 Parent(s): ec72fe8

added another argument in output_ids

Files changed (1) hide show

app.py CHANGED Viewed

@@ -37,10 +37,11 @@ def llama_generation(input_text):
                                        return_tensors='pt').to('cuda')
     # llama generation looks for the numeric vectors not the tensors so there is no need for **input_ids rather just input_ids
-    output_ids = llama_model.generate(input_ids=input_ids)
     # Decode
-    output_text = llama_tokenizer.decode(output_ids,
                                          skip_special_tokens=True)
     return output_text

                                        return_tensors='pt').to('cuda')
     # llama generation looks for the numeric vectors not the tensors so there is no need for **input_ids rather just input_ids
+    output_ids = llama_model.generate(input_ids=input_ids,
+                                      max_new_tokens=400)
     # Decode
+    output_text = llama_tokenizer.decode(output_ids[0],
                                          skip_special_tokens=True)
     return output_text