Mohinikathro committed on
Commit
dba1b37
·
verified ·
1 Parent(s): d45cf6b

Changes made in app.py: replace the 4-bit NF4 BitsAndBytesConfig settings with 8-bit loading and fp32 CPU offload

Browse files
Files changed (1) hide show
  1. app.py +2 -5
app.py CHANGED
@@ -23,12 +23,9 @@ model.to(device)
23
  # ===============================
24
  # Load Evaluation Model (QwQ)
25
  # ===============================
26
- # Set 4-bit quantization configuration
27
  bnb_config = BitsAndBytesConfig(
28
- load_in_4bit=True,
29
- bnb_4bit_compute_dtype=torch.bfloat16,
30
- bnb_4bit_use_double_quant=True,
31
- bnb_4bit_quant_type="nf4"
32
  )
33
 
34
  qwq_model_id = "unsloth/QwQ-32B-unsloth-bnb-4bit"
 
23
  # ===============================
24
  # Load Evaluation Model (QwQ)
25
  # ===============================
 
26
  bnb_config = BitsAndBytesConfig(
27
+ load_in_8bit=True,
28
+ llm_int8_enable_fp32_cpu_offload=True,
 
 
29
  )
30
 
31
  qwq_model_id = "unsloth/QwQ-32B-unsloth-bnb-4bit"