Update app.py
app.py
CHANGED
@@ -16,7 +16,8 @@ else:
     raise ValueError("HF_TOKEN environment variable not set. Please add it as a secret in your Hugging Face Space.")
 
 # model = ollama.pull('llama3.2')
-
+model_name = 'hf.co/bartowski/Llama-3.2-3B-Instruct-GGUF:Q4_K_M'
+model = ollama.pull(model_name)
 
 class ChatRequest(BaseModel):
     message: str
@@ -35,8 +36,13 @@ async def chat(request: ChatRequest):
     try:
         start_time = time.time()  # Start measuring time
 
+        messages = [
+            {'role': 'system', 'content': request.system_message},
+            {'role': 'user', 'content': request.message}
+        ]
+
         # Simulate getting the response from the model
-        response = ollama.chat(model=
+        response = ollama.chat(model=model_name, messages=messages)
         # response = "pending"
         response = str(response)
 
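For context, here is a minimal sketch of how the changed region could fit into a runnable app.py. Only the diffed lines come from this commit; the imports, the FastAPI app object, the /chat route, the system_message field on ChatRequest, the timing use, and the return value are assumptions filled in for illustration.

# Minimal sketch around the diffed lines; everything marked "assumed"
# is not shown in this commit.
import os
import time

import ollama
from fastapi import FastAPI
from pydantic import BaseModel

hf_token = os.getenv("HF_TOKEN")  # assumed variable name
if hf_token is None:
    raise ValueError("HF_TOKEN environment variable not set. Please add it as a secret in your Hugging Face Space.")

# Pull a GGUF build of Llama 3.2 3B Instruct from the Hugging Face Hub via Ollama
model_name = 'hf.co/bartowski/Llama-3.2-3B-Instruct-GGUF:Q4_K_M'
model = ollama.pull(model_name)

app = FastAPI()  # assumed; not shown in the diff

class ChatRequest(BaseModel):
    message: str
    system_message: str = "You are a helpful assistant."  # assumed field; the handler reads request.system_message

@app.post("/chat")  # assumed route; the diff shows only the handler body
async def chat(request: ChatRequest):
    try:
        start_time = time.time()  # Start measuring time

        messages = [
            {'role': 'system', 'content': request.system_message},
            {'role': 'user', 'content': request.message}
        ]

        response = ollama.chat(model=model_name, messages=messages)
        response = str(response)

        elapsed = time.time() - start_time  # assumed use of the timer
        return {"response": response, "elapsed_seconds": elapsed}
    except Exception as exc:  # assumed error handling; not shown in the diff
        return {"error": str(exc)}

This sketch assumes an Ollama server is reachable (the ollama Python client talks to a local daemon by default). Assuming the route is mounted at /chat, the endpoint could be exercised with:

curl -X POST http://localhost:8000/chat -H 'Content-Type: application/json' -d '{"message": "Hello", "system_message": "You are a helpful assistant."}'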