update tokenizer_config.json
Browse files- tokenizer_config.json +2 -10
tokenizer_config.json
CHANGED
@@ -236,17 +236,9 @@
|
|
236 |
"special": true
|
237 |
}
|
238 |
},
|
239 |
-
"additional_special_tokens":
|
240 |
-
"[AVAILABLE_TOOLS]",
|
241 |
-
"[/AVAILABLE_TOOLS]",
|
242 |
-
"[INST]",
|
243 |
-
"[/INST]",
|
244 |
-
"[TOOL_CALLS]",
|
245 |
-
"[TOOL_RESULTS]",
|
246 |
-
"[/TOOL_RESULTS]"
|
247 |
-
],
|
248 |
"bos_token": "<|begin▁of▁sentence|>",
|
249 |
-
"chat_template": "{% if
|
250 |
"clean_up_tokenization_spaces": false,
|
251 |
"eos_token": "<|end▁of▁sentence|>",
|
252 |
"legacy": true,
|
|
|
236 |
"special": true
|
237 |
}
|
238 |
},
|
239 |
+
"additional_special_tokens": null,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
240 |
"bos_token": "<|begin▁of▁sentence|>",
|
241 |
+
"chat_template": "\n{%- if not tools is defined %}\n {%- set tools = none %}\n{%- endif %}\n{%- set user_messages = messages | selectattr(\"role\", \"equalto\", \"user\") | list %}\n\n{%- for message in lmessages | rejectattr(\"role\", \"equalto\", \"tool\") | rejectattr(\"role\", \"equalto\", \"tool_results\") | selectattr(\"tool_calls\", \"undefined\") %}\n {%- if (message[\"role\"] == \"user\") != (loop.index0 % 2 == 0) %}\n {{- raise_exception(\"Conversation roles must alternate user/assistant/user/assistant/...\") }}\n {%- endif %}\n{%- endfor %}\n\n{{- bos_token }}\n{%- for message in messages %}\n {%- if message[\"role\"] == \"user\" %}\n {{- \"[INST] \" }}\n {%- if tools is not none and (message == user_messages[-1]) %}\n {{- \"[AVAILABLE_TOOLS] [\" }}\n {%- for tool in tools %}\n {%- set tool = tool.function %}\n {{- '{\"type\": \"function\", \"function\": {' }}\n {%- for key, val in tool.items() if key != \"return\" %}\n {%- if val is string %}\n {{- '\"' + key + '\": \"' + val + '\"' }}\n {%- else %}\n {{- '\"' + key + '\": ' + val|tojson }}\n {%- endif %}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- endif %}\n {%- endfor %}\n {{- \"}}\" }}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- else %}\n {{- \"]\" }}\n {%- endif %}\n {%- endfor %}\n {{- \"[/AVAILABLE_TOOLS]\" }}\n {%- endif %}\n {{- message[\"content\"] + \"[/INST]\" }}\n {%- elif message[\"role\"] == \"tool_calls\" or message.tool_calls is defined %}\n {%- if message.tool_calls is defined %}\n {%- set tool_calls = message.tool_calls %}\n {%- else %}\n {%- set tool_calls = message.content %}\n {%- endif %}\n {{- \"[TOOL_CALLS] [\" }}\n {%- for tool_call in tool_calls %}\n {%- set out = tool_call.function|tojson %}\n {{- out }}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- else %}\n {{- \"]\" }}\n {%- endif %}\n {%- endfor %}\n {%- elif message[\"role\"] == \"assistant\" %}\n {{- \" \" + message[\"content\"] }}\n {%- elif message[\"role\"] == \"tool_results\" or message[\"role\"] == \"tool\" %}\n {%- if message.content is defined and message.content.content is defined %}\n {%- set content = message.content.content %}\n {%- else %}\n {%- set content = message.content %}\n {%- endif %}\n {{- '[TOOL_RESULTS] {\"content\": ' + content|string + \"}[/TOOL_RESULTS]\" }}\n {%- else %}\n {{- raise_exception(\"Only user and assistant roles are supported, with the exception of an initial optional system message!\") }}\n {%- endif %}\n{%- endfor %}\n",
|
242 |
"clean_up_tokenization_spaces": false,
|
243 |
"eos_token": "<|end▁of▁sentence|>",
|
244 |
"legacy": true,
|