Spaces:

Heit39
/

iris

Sleeping

IST199655 committed on Dec 2, 2024

Commit

4acb7f4

1 Parent(s): d44f7f3

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -4,7 +4,7 @@ from huggingface_hub import InferenceClient
 """
 Copied from inference in colab notebook
 """
-from unsloth.chat_templates import get_chat_template
 from unsloth import FastLanguageModel
 # IMPORTING MODEL AND TOKENIZER ————————
@@ -20,10 +20,10 @@ model, tokenizer = FastLanguageModel.from_pretrained(
     load_in_4bit = load_in_4bit,
 )
-tokenizer = get_chat_template(
-    tokenizer,
-    chat_template = "llama-3.1",
-)
 FastLanguageModel.for_inference(model) # Enable native 2x faster inference
 # RUNNING INFERENCE ————————————————————————

 """
 Copied from inference in colab notebook
 """
+# from unsloth.chat_templates import get_chat_template
 from unsloth import FastLanguageModel
 # IMPORTING MODEL AND TOKENIZER ————————
     load_in_4bit = load_in_4bit,
 )
+# tokenizer = get_chat_template(
+#     tokenizer,
+#     chat_template = "llama-3.1",
+# )
 FastLanguageModel.for_inference(model) # Enable native 2x faster inference
 # RUNNING INFERENCE ————————————————————————