Update tokenizer_config.json
Browse files
- tokenizer_config.json +1 -1
tokenizer_config.json
CHANGED
@@ -315,7 +315,7 @@
|
|
315 |
],
|
316 |
"clean_up_tokenization_spaces": false,
|
317 |
"do_lower_case": false,
|
318 |
-
"chat_template": "
|
319 |
"eos_token": "<|endoftext|>",
|
320 |
"extra_special_tokens": {},
|
321 |
"model_max_length": 128000,
|
|
|
315 |
],
|
316 |
"clean_up_tokenization_spaces": false,
|
317 |
"do_lower_case": false,
|
318 |
+
"chat_template": "[gMASK]<sop>\n{%- macro visible_text(content) -%}\n{%- if content is string -%}\n{{- content }}\n{%- elif content is iterable and content is not mapping -%}\n{%- for item in content -%}\n{%- if item is mapping and item.type == 'text' -%}\n{{- item.text }}\n{%- elif item is string -%}\n{{- item }}\n{%- endif -%}\n{%- endfor -%}\n{%- else -%}\n{{- content }}\n{%- endif -%}\n{%- endmacro -%}\n{%- set today = strftime_now(\"%Y-%m-%d\") -%}\n{%- set default_system_message = \"You are a helpful AI assistant without a name or creator. The current date is \" + today + \".\" -%}\n{%- set sys = namespace(msg=default_system_message) -%}\n{%- for _m in messages -%}{%- if _m.role == 'system' -%}{% set sys.msg = visible_text(_m.content) %}{%- endif -%}{%- endfor -%}\n<|system|>\n{{ sys.msg }}\n{%- if tools -%}\n\n# Tools\n\nYou may call one or more functions to assist with the user query.\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>\n{% for tool in tools %}\n{{ tool | tojson(ensure_ascii=False) }}\n{% endfor %}\n</tools>\n\nFor each function call, output the function name and arguments within the following XML format:\n<tool_call>{function-name}\n<arg_key>{arg-key-1}</arg_key>\n<arg_value>{arg-value-1}</arg_value>\n<arg_key>{arg-key-2}</arg_key>\n<arg_value>{arg-value-2}</arg_value>\n...\n</tool_call>\n{%- endif -%}\n{%- set ns = namespace(last_user_index=-1) %}\n{%- for m in messages %}\n{%- if m.role == 'user' %}\n{% set ns.last_user_index = loop.index0 -%}\n{%- endif %}\n{%- endfor %}\n{% for m in messages %}\n{%- if m.role == 'user' -%}<|user|>\n{{ visible_text(m.content) }}\n{{- '/nothink' if (enable_thinking is defined and not enable_thinking and not visible_text(m.content).endswith(\"/nothink\")) else '' -}}\n{%- elif m.role == 'assistant' -%}\n<|assistant|>\n{%- set reasoning_content = '' %}\n{%- set content = visible_text(m.content) %}\n{%- if m.reasoning_content is string %}\n{%- set reasoning_content = m.reasoning_content %}\n{%- else -%}\n{%- if '</think>' in content %}\n{%- set reasoning_content = content.split('</think>')[0].rstrip('\\n').split('<think>')[-1].lstrip('\\n') %}\n{%- set content = content.split('</think>')[-1].lstrip('\\n') %}\n{%- endif %}\n{%- endif %}\n{%- if loop.index0 > ns.last_user_index and reasoning_content -%}\n{{ '\\n<think>' + reasoning_content.strip() + '</think>'}}\n{%- else -%}\n{{ '\\n<think></think>' }}\n{%- endif -%}\n{%- if content.strip() -%}\n{{ '\\n' + content.strip() }}\n{%- endif -%}\n{% if m.tool_calls %}\n{% for tc in m.tool_calls %}\n{%- if tc.function %}\n{%- set tc = tc.function %}\n{%- endif %}\n{{ '\\n<tool_call>' + tc.name }}\n{% set _args = tc.arguments %}\n{% for k, v in _args.items() %}\n<arg_key>{{ k }}</arg_key>\n<arg_value>{{ v | tojson(ensure_ascii=False) if v is not string else v }}</arg_value>\n{% endfor %}\n</tool_call>{% endfor %}\n{% endif %}\n{%- elif m.role == 'tool' -%}\n{%- if m.content is string -%}\n{%- if loop.first or (messages[loop.index0 - 1].role != \"tool\") %}\n{{- '<|observation|>' }}\n{%- endif %}\n{{- '\\n<tool_response>\\n' }}\n{{- m.content }}\n{{- '\\n</tool_response>' }}\n{%- else -%}\n<|observation|>{% for tr in m.content %}\n<tool_response>\n{{ tr.output if tr.output is defined else tr }}\n</tool_response>{% endfor -%}\n{% endif -%}\n{%- endif -%}\n{%- endfor -%}\n{%- if add_generation_prompt is not defined or add_generation_prompt -%}\n<|assistant|>{{ '\\n<think></think>\\n' if (enable_thinking is defined and not enable_thinking) else '\\n' }}\n{%- endif -%}",
|
319 |
"eos_token": "<|endoftext|>",
|
320 |
"extra_special_tokens": {},
|
321 |
"model_max_length": 128000,
|