simonzhang5429 committed on
Commit
e376e0f
·
verified ·
1 Parent(s): c86f33b

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -0
app.py CHANGED
@@ -9,6 +9,7 @@ model = AutoModelForCausalLM.from_pretrained(
9
  device_map="auto",
10
  local_files_only=True,
11
  torch_dtype=torch.bfloat16,
 
12
  )
13
 
14
 
 
9
  device_map="auto",
10
  local_files_only=True,
11
  torch_dtype=torch.bfloat16,
12
+ attn_implementation="flash_attention_2"
13
  )
14
 
15