davidizzle committed on
Commit
1eb2d22
·
1 Parent(s): 4c090d8
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -55,8 +55,8 @@ def load_model():
55
  device_map="auto",
56
  torch_dtype=torch.float16,
57
  # quantization_config=quantization_config,
58
- trust_remote_code = True,
59
- attn_implementation="flash_attention_2"
60
  )
61
  # model.to("cpu")
62
  return tokenizer, model
 
55
  device_map="auto",
56
  torch_dtype=torch.float16,
57
  # quantization_config=quantization_config,
58
+ # attn_implementation="flash_attention_2",
59
+ trust_remote_code = True
60
  )
61
  # model.to("cpu")
62
  return tokenizer, model