Spaces:
Running
Running
Commit
·
1eb2d22
1
Parent(s):
4c090d8
Niente
Browse files
app.py
CHANGED
@@ -55,8 +55,8 @@ def load_model():
|
|
55 |
device_map="auto",
|
56 |
torch_dtype=torch.float16,
|
57 |
# quantization_config=quantization_config,
|
58 |
-
|
59 |
-
|
60 |
)
|
61 |
# model.to("cpu")
|
62 |
return tokenizer, model
|
|
|
55 |
device_map="auto",
|
56 |
torch_dtype=torch.float16,
|
57 |
# quantization_config=quantization_config,
|
58 |
+
# attn_implementation="flash_attention_2",
|
59 |
+
trust_remote_code = True
|
60 |
)
|
61 |
# model.to("cpu")
|
62 |
return tokenizer, model
|