Yoxas committed on
Commit
e81f48e
·
verified ·
1 Parent(s): bce5d54

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -37,7 +37,7 @@ model_id = "meta-llama/Meta-Llama-3-8B-Instruct"
37
 
38
  # use quantization to lower GPU usage
39
  bnb_config = BitsAndBytesConfig(
40
- load_in 4bit=True, bnb_4bit_use_double_quant=True, bnb_4bit_quant_type="nf4", bnb_4bit_compute_dtype=torch.bfloat16
41
  )
42
 
43
  tokenizer = AutoTokenizer.from_pretrained(model_id, token=token)
 
37
 
38
  # use quantization to lower GPU usage
39
  bnb_config = BitsAndBytesConfig(
40
+ load_in_4bit=True, bnb_4bit_use_double_quant=True, bnb_4bit_quant_type="nf4", bnb_4bit_compute_dtype=torch.bfloat16
41
  )
42
 
43
  tokenizer = AutoTokenizer.from_pretrained(model_id, token=token)