Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
Update app.py
Browse files
app.py
CHANGED
@@ -11,9 +11,16 @@ from torch import cuda
|
|
11 |
import json
|
12 |
from datetime import datetime
|
13 |
|
14 |
-
|
|
|
|
|
15 |
###########
|
16 |
# ToDo move to functions
|
|
|
|
|
|
|
|
|
|
|
17 |
|
18 |
def get_rag_answer(query, top_results):
|
19 |
"""
|
|
|
11 |
import json
|
12 |
from datetime import datetime
|
13 |
|
14 |
+
|
15 |
+
|
16 |
+
#model_config = getconfig("model_params.cfg")
|
17 |
###########
|
18 |
# ToDo move to functions
|
19 |
+
# Configuration for the dedicated model
|
20 |
+
DEDICATED_MODEL = "meta-llama/Llama-3.1-8B-Instruct"
|
21 |
+
DEDICATED_ENDPOINT = "https://qu2d8m6dmsollhly.us-east-1.aws.endpoints.huggingface.cloud"
|
22 |
+
# Write access token from the settings
|
23 |
+
WRITE_ACCESS_TOKEN = st.secrets["Llama_3_1"]
|
24 |
|
25 |
def get_rag_answer(query, top_results):
|
26 |
"""
|