Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -13,9 +13,17 @@ offload_dir = "./offload"
|
|
13 |
tokenizer = AutoTokenizer.from_pretrained(model_dir)
|
14 |
|
15 |
# Load the base model with offloading support.
|
|
|
|
|
|
|
|
|
|
|
|
|
16 |
base_model = AutoModelForCausalLM.from_pretrained(
|
17 |
model_dir,
|
18 |
-
device_map="auto", # Automatically use available devices (GPU/CPU).
|
|
|
|
|
19 |
offload_folder=offload_dir # Directory to offload layers (for larger models).
|
20 |
)
|
21 |
|
|
|
13 |
tokenizer = AutoTokenizer.from_pretrained(model_dir)
|
14 |
|
15 |
# Load the base model with offloading support.
|
16 |
+
# base_model = AutoModelForCausalLM.from_pretrained(
|
17 |
+
# model_dir,
|
18 |
+
# device_map="auto", # Automatically use available devices (GPU/CPU).
|
19 |
+
# offload_folder=offload_dir # Directory to offload layers (for larger models).
|
20 |
+
# )
|
21 |
+
|
22 |
base_model = AutoModelForCausalLM.from_pretrained(
|
23 |
model_dir,
|
24 |
+
device_map="cpu", # Force CPU usage
|
25 |
+
torch_dtype=torch.float32, # Use float32 for CPU
|
26 |
+
trust_remote_code=True,
|
27 |
offload_folder=offload_dir # Directory to offload layers (for larger models).
|
28 |
)
|
29 |
|