Petro committed on
Commit
dd25592
·
1 Parent(s): 6d588fe

Fix bug with weights.

Browse files
Files changed (1) hide show
  1. main.py +9 -7
main.py CHANGED
@@ -2,17 +2,18 @@ from ctransformers import AutoModelForCausalLM
2
  from fastapi import FastAPI
3
  from pydantic import BaseModel
4
 
5
-
6
- llm = AutoModelForCausalLM.from_pretrained("zephyr-7b-beta.Q4_K_S.gguf",
7
- model_type='mistral',
8
- max_new_tokens = 1096,
9
- threads = 3,
10
- )
11
 
12
  #Pydantic object
13
  class validation(BaseModel):
14
  prompt: str
15
  #Fast API
 
16
  app = FastAPI()
17
 
18
  @app.post("/llm_on_cpu")
@@ -21,4 +22,5 @@ async def stream(item: validation):
21
  E_INST = "</s>"
22
  user, assistant = "<|user|>", "<|assistant|>"
23
  prompt = f"{system_prompt}{E_INST}\n{user}\n{item.prompt}{E_INST}\n{assistant}\n"
24
- return llm(prompt)
 
 
2
  from fastapi import FastAPI
3
  from pydantic import BaseModel
4
 
5
+ #
6
+ # llm = AutoModelForCausalLM.from_pretrained("zephyr-7b-beta.Q4_K_S.gguf",
7
+ # model_type='mistral',
8
+ # max_new_tokens = 1096,
9
+ # threads = 3,
10
+ # )
11
 
12
  #Pydantic object
13
  class validation(BaseModel):
14
  prompt: str
15
  #Fast API
16
+
17
  app = FastAPI()
18
 
19
  @app.post("/llm_on_cpu")
 
22
  E_INST = "</s>"
23
  user, assistant = "<|user|>", "<|assistant|>"
24
  prompt = f"{system_prompt}{E_INST}\n{user}\n{item.prompt}{E_INST}\n{assistant}\n"
25
+ # return llm(prompt)
26
+ return prompt