cortexso
/

tinyllama

jan-hq committed on Oct 7, 2024

Commit

7e59e04

verified ·

1 Parent(s): 5bb58f2

Upload folder using huggingface_hub

Files changed (1) hide show

model.yml CHANGED Viewed

@@ -1,4 +1,4 @@
-name: tinyllama 1B
 model: tinyllama:1B
 version: 1
@@ -15,5 +15,6 @@ stream: true # true | false
 # Engine / Model Settings
 ngl: 33 # Infer from base config.json -> num_attention_heads
 ctx_len: 4096 # Infer from base config.json -> max_position_embeddings
-engine: cortex.llamacpp
-prompt_template: "\n\n<|system|>\n{system_message}</s>\n\n\n\n\n<|user|>\n{prompt}</s>\n\n\n<|assistant|>\n\n"

+name: tinyllama:1b-gguf-q5-km
 model: tinyllama:1B
 version: 1
 # Engine / Model Settings
 ngl: 33 # Infer from base config.json -> num_attention_heads
 ctx_len: 4096 # Infer from base config.json -> max_position_embeddings
+engine: llama-cpp
+prompt_template: "\n\n<|system|>\n{system_message}</s>\n\n\n\n\n<|user|>\n{prompt}</s>\n\
+  \n\n<|assistant|>\n\n"