ericwithpy committed on
Commit
7e55c71
·
verified ·
1 Parent(s): 911b23c

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +8 -1
app.py CHANGED
@@ -4,7 +4,14 @@ from transformers import AutoModelForCausalLM, AutoTokenizer
4
  device = "cuda" if torch.cuda.is_available() else "cpu" # Automatically detect GPU or CPU
5
  model_name = "tanusrich/Mental_Health_Chatbot"
6
 
7
- model = AutoModelForCausalLM.from_pretrained(model_name)
 
 
 
 
 
 
 
8
 
9
  tokenizer = AutoTokenizer.from_pretrained(model_name)
10
  '''
 
4
  device = "cuda" if torch.cuda.is_available() else "cpu" # Automatically detect GPU or CPU
5
  model_name = "tanusrich/Mental_Health_Chatbot"
6
 
7
+ model = AutoModelForCausalLM.from_pretrained(
8
+ model_name,
9
+ torch_dtype=torch.float16, # Reduce memory usage
10
+ device_map="auto", # Automatically assigns to GPU if available
11
+ low_cpu_mem_usage=True,
12
+ max_memory={0: "4GiB", "cpu": "6GiB"}, # Optimize CPU memory
13
+ offload_folder=None
14
+ )
15
 
16
  tokenizer = AutoTokenizer.from_pretrained(model_name)
17
  '''