nanoLLaVA

Runtime error

qnguyen3 committed on Apr 19

Commit

13b8f1b

verified ·

1 Parent(s): a2b8740

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -21,7 +21,8 @@ model = LlavaQwen2ForCausalLM.from_pretrained(
     'qnguyen3/nanoLLaVA-1.5',
     torch_dtype=torch.float16,
     attn_implementation="flash_attention_2",
-    trust_remote_code=True)
 class KeywordsStoppingCriteria(StoppingCriteria):
     def __init__(self, keywords, tokenizer, input_ids):

     'qnguyen3/nanoLLaVA-1.5',
     torch_dtype=torch.float16,
     attn_implementation="flash_attention_2",
+    trust_remote_code=True,
+    device_map='cpu')
 class KeywordsStoppingCriteria(StoppingCriteria):
     def __init__(self, keywords, tokenizer, input_ids):