Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -37,7 +37,7 @@ model_id = "meta-llama/Meta-Llama-3-8B-Instruct"
|
|
37 |
|
38 |
# use quantization to lower GPU usage
|
39 |
bnb_config = BitsAndBytesConfig(
|
40 |
-
|
41 |
)
|
42 |
|
43 |
tokenizer = AutoTokenizer.from_pretrained(model_id, token=token)
|
|
|
37 |
|
38 |
# use quantization to lower GPU usage
|
39 |
bnb_config = BitsAndBytesConfig(
|
40 |
+
load_in_4bit=True, bnb_4bit_use_double_quant=True, bnb_4bit_quant_type="nf4", bnb_4bit_compute_dtype=torch.bfloat16
|
41 |
)
|
42 |
|
43 |
tokenizer = AutoTokenizer.from_pretrained(model_id, token=token)
|