Upload folder using huggingface_hub
Browse files
model.yml
CHANGED
@@ -1,4 +1,4 @@
|
|
1 |
-
name: tinyllama
|
2 |
model: tinyllama:1B
|
3 |
version: 1
|
4 |
|
@@ -15,5 +15,6 @@ stream: true # true | false
|
|
15 |
# Engine / Model Settings
|
16 |
ngl: 33 # Infer from base config.json -> num_attention_heads
|
17 |
ctx_len: 4096 # Infer from base config.json -> max_position_embeddings
|
18 |
-
engine:
|
19 |
-
prompt_template: "\n\n<|system|>\n{system_message}</s>\n\n\n\n\n<|user|>\n{prompt}</s>\n\
|
|
|
|
1 |
+
name: tinyllama:1b-gguf-q5-km
|
2 |
model: tinyllama:1B
|
3 |
version: 1
|
4 |
|
|
|
15 |
# Engine / Model Settings
|
16 |
ngl: 33 # Infer from base config.json -> num_attention_heads
|
17 |
ctx_len: 4096 # Infer from base config.json -> max_position_embeddings
|
18 |
+
engine: llama-cpp
|
19 |
+
prompt_template: "\n\n<|system|>\n{system_message}</s>\n\n\n\n\n<|user|>\n{prompt}</s>\n\
|
20 |
+
\n\n<|assistant|>\n\n"
|