pmelnechuk committed on
Commit
df93760
·
verified ·
1 Parent(s): 097094f

Update src/model_load.py

Browse files
Files changed (1) hide show
  1. src/model_load.py +1 -1
src/model_load.py CHANGED
@@ -14,7 +14,7 @@ def load_model():
14
  tokenizer = AutoTokenizer.from_pretrained(model_name)
15
  model = AutoModelForCausalLM.from_pretrained(model_name,
16
  device_map="auto",
17
- quantization_config=BitsAndBytesConfig(load_in_4bit=True),
18
  torch_dtype=torch.float16,
19
  max_memory=max_memory)
20
 
 
14
  tokenizer = AutoTokenizer.from_pretrained(model_name)
15
  model = AutoModelForCausalLM.from_pretrained(model_name,
16
  device_map="auto",
17
+ quantization_config=BitsAndBytesConfig(load_in_8bit=True),
18
  torch_dtype=torch.float16,
19
  max_memory=max_memory)
20