Spaces:

pmelnechuk
/

MathQA

Running

pmelnechuk committed on Feb 20

Commit

896b328

verified ·

1 Parent(s): 3f9f23a

Update src/model_load.py

Files changed (1) hide show

src/model_load.py CHANGED Viewed

@@ -14,10 +14,7 @@ def load_model():
     tokenizer = AutoTokenizer.from_pretrained(model_name)
     model = AutoModelForCausalLM.from_pretrained(model_name,
                                                  torch_dtype=torch.float16,
-                                                 device_map={
-                                                     "transformer.h.0": "cpu",  # Por ejemplo, mover ciertas capas al CPU
-                                                     "transformer.h.1": "cuda",  # Mantener otras capas en la GPU
-                                                 },
                                                  quantization_config=BitsAndBytesConfig(load_in_8bit=True),
                                                  llm_int8_enable_fp32_cpu_offload=True)

     tokenizer = AutoTokenizer.from_pretrained(model_name)
     model = AutoModelForCausalLM.from_pretrained(model_name,
                                                  torch_dtype=torch.float16,
+                                                 device_map="auto",
                                                  quantization_config=BitsAndBytesConfig(load_in_8bit=True),
                                                  llm_int8_enable_fp32_cpu_offload=True)