Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -11,13 +11,13 @@ class RAGChatbot:
|
|
11 |
embedding_model="all-MiniLM-L6-v2"):
|
12 |
# Initialize tokenizer and model
|
13 |
self.tokenizer = AutoTokenizer.from_pretrained(model_name)
|
14 |
-
self.bnb_config = BitsAndBytesConfig(
|
15 |
-
|
16 |
-
|
17 |
-
|
18 |
self.model = AutoModelForCausalLM.from_pretrained(
|
19 |
model_name,
|
20 |
-
|
21 |
device_map="auto"
|
22 |
)
|
23 |
|
|
|
11 |
embedding_model="all-MiniLM-L6-v2"):
|
12 |
# Initialize tokenizer and model
|
13 |
self.tokenizer = AutoTokenizer.from_pretrained(model_name)
|
14 |
+
# self.bnb_config = BitsAndBytesConfig(
|
15 |
+
# load_in_8bit=True, # Enable 8-bit loading
|
16 |
+
# llm_int8_threshold=6.0, # Threshold for mixed-precision computation
|
17 |
+
# )
|
18 |
self.model = AutoModelForCausalLM.from_pretrained(
|
19 |
model_name,
|
20 |
+
torch_dtype=torch.bfloat16,
|
21 |
device_map="auto"
|
22 |
)
|
23 |
|