Mohinikathro committed on
Commit
d45cf6b
·
verified ·
1 Parent(s): 5f41070

changes made to app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -2
app.py CHANGED
@@ -23,9 +23,12 @@ model.to(device)
23
  # ===============================
24
  # Load Evaluation Model (QwQ)
25
  # ===============================
 
26
  bnb_config = BitsAndBytesConfig(
27
- load_in_8bit=True,
28
- llm_int8_enable_fp32_cpu_offload=True,
 
 
29
  )
30
 
31
  qwq_model_id = "unsloth/QwQ-32B-unsloth-bnb-4bit"
 
23
  # ===============================
24
  # Load Evaluation Model (QwQ)
25
  # ===============================
26
+ # Set 4-bit quantization configuration
27
  bnb_config = BitsAndBytesConfig(
28
+ load_in_4bit=True,
29
+ bnb_4bit_compute_dtype=torch.bfloat16,
30
+ bnb_4bit_use_double_quant=True,
31
+ bnb_4bit_quant_type="nf4"
32
  )
33
 
34
  qwq_model_id = "unsloth/QwQ-32B-unsloth-bnb-4bit"