Spaces:

pmelnechuk
/

MathQA

Running

pmelnechuk committed on Feb 20

Commit

3749dd3

verified ·

1 Parent(s): 926b261

prueba modificando la distribución del modelo

Files changed (1) hide show

src/model_load.py CHANGED Viewed

@@ -14,7 +14,10 @@ def load_model():
     tokenizer = AutoTokenizer.from_pretrained(model_name)
     model = AutoModelForCausalLM.from_pretrained(model_name,
                                                  torch_dtype=torch.float16,
-                                                 device_map="auto",
                                                  quantization_config=BitsAndBytesConfig(load_in_8bit=True))
     # Crear pipeline de generación de texto

     tokenizer = AutoTokenizer.from_pretrained(model_name)
     model = AutoModelForCausalLM.from_pretrained(model_name,
                                                  torch_dtype=torch.float16,
+                                                 device_map={
+                                                     "transformer.h.0": "cpu",  # Por ejemplo, mover ciertas capas al CPU
+                                                     "transformer.h.1": "cuda",  # Mantener otras capas en la GPU
+                                                 },
                                                  quantization_config=BitsAndBytesConfig(load_in_8bit=True))
     # Crear pipeline de generación de texto