darshan8950 committed on
Commit
644bd56
·
verified ·
1 Parent(s): 357cb8c

Update main.py

Browse files
Files changed (1) hide show
  1. main.py +1 -3
main.py CHANGED
@@ -5,9 +5,7 @@ device = "cuda" # the device to load the model onto
5
 
6
  from ctransformers import AutoModelForCausalLM
7
 
8
- llm = AutoModelForCausalLM.from_pretrained("TheBloke/Llama-2-7b-Chat-GGUF", model_file="llama-2-7b-chat.q4_K_M.gguf", model_type="llama", gpu_layers=0)
9
-
10
-
11
 
12
 
13
  @app.route('/recommend', methods=['POST'])
 
5
 
6
  from ctransformers import AutoModelForCausalLM
7
 
8
+ llm = AutoModelForCausalLM.from_pretrained("TheBloke/Mistral-7B-v0.1-GGUF", model_file="mistral-7b-v0.1.Q4_K_M.gguf", model_type="mistral", gpu_layers=0)
 
 
9
 
10
 
11
  @app.route('/recommend', methods=['POST'])