xu-song commited on
Commit
e584a13
·
1 Parent(s): d3ba21b
doc/chat-template/DeepSeek-R1/chat_template.jinja ADDED
@@ -0,0 +1 @@
 
 
1
+ {% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% set ns = namespace(is_first=false, is_tool=false, is_output_first=true, system_prompt='', is_first_sp=true) %}{%- for message in messages %}{%- if message['role'] == 'system' %}{%- if ns.is_first_sp %}{% set ns.system_prompt = ns.system_prompt + message['content'] %}{% set ns.is_first_sp = false %}{%- else %}{% set ns.system_prompt = ns.system_prompt + '\n\n' + message['content'] %}{%- endif %}{%- endif %}{%- endfor %}{{ bos_token }}{{ ns.system_prompt }}{%- for message in messages %}{%- if message['role'] == 'user' %}{%- set ns.is_tool = false -%}{{'<|User|>' + message['content']}}{%- endif %}{%- if message['role'] == 'assistant' and 'tool_calls' in message %}{%- set ns.is_tool = false -%}{%- for tool in message['tool_calls'] %}{%- if not ns.is_first %}{%- if message['content'] is none %}{{'<|Assistant|><|tool▁calls▁begin|><|tool▁call▁begin|>' + tool['type'] + '<|tool▁sep|>' + tool['function']['name'] + '\n' + '```json' + '\n' + tool['function']['arguments'] + '\n' + '```' + '<|tool▁call▁end|>'}}{%- else %}{{'<|Assistant|>' + message['content'] + '<|tool▁calls▁begin|><|tool▁call▁begin|>' + tool['type'] + '<|tool▁sep|>' + tool['function']['name'] + '\n' + '```json' + '\n' + tool['function']['arguments'] + '\n' + '```' + '<|tool▁call▁end|>'}}{%- endif %}{%- set ns.is_first = true -%}{%- else %}{{'\n' + '<|tool▁call▁begin|>' + tool['type'] + '<|tool▁sep|>' + tool['function']['name'] + '\n' + '```json' + '\n' + tool['function']['arguments'] + '\n' + '```' + '<|tool▁call▁end|>'}}{%- endif %}{%- endfor %}{{'<|tool▁calls▁end|><|end▁of▁sentence|>'}}{%- endif %}{%- if message['role'] == 'assistant' and 'tool_calls' not in message %}{%- if ns.is_tool %}{{'<|tool▁outputs▁end|>' + message['content'] + '<|end▁of▁sentence|>'}}{%- set ns.is_tool = false -%}{%- else %}{% set content = message['content'] %}{% if '</think>' in content %}{% set content = content.split('</think>')[-1] 
%}{% endif %}{{'<|Assistant|>' + content + '<|end▁of▁sentence|>'}}{%- endif %}{%- endif %}{%- if message['role'] == 'tool' %}{%- set ns.is_tool = true -%}{%- if ns.is_output_first %}{{'<|tool▁outputs▁begin|><|tool▁output▁begin|>' + message['content'] + '<|tool▁output▁end|>'}}{%- set ns.is_output_first = false %}{%- else %}{{'<|tool▁output▁begin|>' + message['content'] + '<|tool▁output▁end|>'}}{%- endif %}{%- endif %}{%- endfor -%}{% if ns.is_tool %}{{'<|tool▁outputs▁end|>'}}{% endif %}{% if add_generation_prompt and not ns.is_tool %}{{'<|Assistant|><think>\n'}}{% endif %}
doc/chat-template/export_chat_template.py CHANGED
@@ -15,6 +15,8 @@ MODEL_PATH = "NousResearch/Hermes-3-Llama-3.1-405B" # messages里不支持tool_
15
  # MODEL_PATH = "mistralai/Ministral-8B-Instruct-2410" # 支持 tools, 支持tool_calls(必须要有id), 格式非主流
16
  MODEL_PATH = "deepseek-ai/DeepSeek-R1"
17
  # MODEL_PATH = "deepseek-ai/DeepSeek-R1-0528"
 
 
18
  tokenizer = AutoTokenizer.from_pretrained(MODEL_PATH)
19
  chat_template = tokenizer.chat_template
20
 
 
15
  # MODEL_PATH = "mistralai/Ministral-8B-Instruct-2410" # 支持 tools, 支持tool_calls(必须要有id), 格式非主流
16
  MODEL_PATH = "deepseek-ai/DeepSeek-R1"
17
  # MODEL_PATH = "deepseek-ai/DeepSeek-R1-0528"
18
+ MODEL_PATH = "google/gemma-3-27b-it"
19
+
20
  tokenizer = AutoTokenizer.from_pretrained(MODEL_PATH)
21
  chat_template = tokenizer.chat_template
22
 
doc/chat-template/gemma-3-27b-it/chat_template.jinja ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {{ bos_token }}
2
+ {%- if messages[0]['role'] == 'system' -%}
3
+ {%- if messages[0]['content'] is string -%}
4
+ {%- set first_user_prefix = messages[0]['content'] + '
5
+
6
+ ' -%}
7
+ {%- else -%}
8
+ {%- set first_user_prefix = messages[0]['content'][0]['text'] + '
9
+
10
+ ' -%}
11
+ {%- endif -%}
12
+ {%- set loop_messages = messages[1:] -%}
13
+ {%- else -%}
14
+ {%- set first_user_prefix = "" -%}
15
+ {%- set loop_messages = messages -%}
16
+ {%- endif -%}
17
+ {%- for message in loop_messages -%}
18
+ {%- if (message['role'] == 'user') != (loop.index0 % 2 == 0) -%}
19
+ {{ raise_exception("Conversation roles must alternate user/assistant/user/assistant/...") }}
20
+ {%- endif -%}
21
+ {%- if (message['role'] == 'assistant') -%}
22
+ {%- set role = "model" -%}
23
+ {%- else -%}
24
+ {%- set role = message['role'] -%}
25
+ {%- endif -%}
26
+ {{ '<start_of_turn>' + role + '
27
+ ' + (first_user_prefix if loop.first else "") }}
28
+ {%- if message['content'] is string -%}
29
+ {{ message['content'] | trim }}
30
+ {%- elif message['content'] is iterable -%}
31
+ {%- for item in message['content'] -%}
32
+ {%- if item['type'] == 'image' -%}
33
+ {{ '<start_of_image>' }}
34
+ {%- elif item['type'] == 'text' -%}
35
+ {{ item['text'] | trim }}
36
+ {%- endif -%}
37
+ {%- endfor -%}
38
+ {%- else -%}
39
+ {{ raise_exception("Invalid content type") }}
40
+ {%- endif -%}
41
+ {{ '<end_of_turn>
42
+ ' }}
43
+ {%- endfor -%}
44
+ {%- if add_generation_prompt -%}
45
+ {{'<start_of_turn>model
46
+ '}}
47
+ {%- endif -%}
doc/chat-template/tool_demo.py CHANGED
@@ -23,6 +23,9 @@ from transformers.utils import get_json_schema
23
  MODEL_PATH = "Qwen/Qwen3-235B-A22B-Instruct-2507"
24
  # MODEL_PATH = "mistralai/Mistral-7B-Instruct-v0.1" # messages里不支持tool_calls,不支持 role=tool,不支持 tools
25
  # MODEL_PATH = "mistralai/Ministral-8B-Instruct-2410" # 支持 tools, 支持tool_calls(必须要有id), 格式非主流
 
 
 
26
  tokenizer = AutoTokenizer.from_pretrained(MODEL_PATH)
27
 
28
  # First, define a tool
@@ -41,8 +44,8 @@ def get_current_temperature(location: str) -> float:
41
  messages = [
42
  {"role": "system", "content": "You are a bot that responds to weather queries."},
43
  {"role": "user", "content": "Hey, what's the temperature in Paris right now?"},
44
- {"role": "assitant", "content": "test1"},
45
- {"role": "user", "content": "test2"},
46
  ]
47
 
48
  # step1:
@@ -59,6 +62,7 @@ print(json.dumps(json_schema, ensure_ascii=False, indent=2))
59
  # step2: 调用 LLM,以下是LLM的返回
60
  tool_call = {"name": "get_current_temperature", "arguments": {"location": "Paris, France"}}
61
  messages.append({"role": "assistant", "tool_calls": [{"type": "function", "function": tool_call}]})
 
62
  # messages.append({"role": "assistant", "tool_calls": [{"id": "123456789", "type": "function", "function": tool_call}]}) # Ministral-8B-Instruct-2410 仍然报错
63
 
64
  # step3: 调用tool,以下是 tool 的返回
 
23
  MODEL_PATH = "Qwen/Qwen3-235B-A22B-Instruct-2507"
24
  # MODEL_PATH = "mistralai/Mistral-7B-Instruct-v0.1" # messages里不支持tool_calls,不支持 role=tool,不支持 tools
25
  # MODEL_PATH = "mistralai/Ministral-8B-Instruct-2410" # 支持 tools, 支持tool_calls(必须要有id), 格式非主流
26
+ # MODEL_PATH = "deepseek-ai/DeepSeek-R1" # 不支持tools,tool_calls也有问题
27
+ # MODEL_PATH = "google/gemma-3-27b-it" # 不支持任何tool
28
+ MODEL_PATH = "moonshotai/Kimi-K2-Instruct"
29
  tokenizer = AutoTokenizer.from_pretrained(MODEL_PATH)
30
 
31
  # First, define a tool
 
44
  messages = [
45
  {"role": "system", "content": "You are a bot that responds to weather queries."},
46
  {"role": "user", "content": "Hey, what's the temperature in Paris right now?"},
47
+ # {"role": "assitant", "content": "test1"},
48
+ # {"role": "user", "content": "test2"},
49
  ]
50
 
51
  # step1:
 
62
  # step2: 调用 LLM,以下是LLM的返回
63
  tool_call = {"name": "get_current_temperature", "arguments": {"location": "Paris, France"}}
64
  messages.append({"role": "assistant", "tool_calls": [{"type": "function", "function": tool_call}]})
65
+ # messages.append({"role": "assistant", "tool_calls": [{"type": "function", "function": tool_call}], "content": ""})
66
  # messages.append({"role": "assistant", "tool_calls": [{"id": "123456789", "type": "function", "function": tool_call}]}) # Ministral-8B-Instruct-2410 仍然报错
67
 
68
  # step3: 调用tool,以下是 tool 的返回
doc/chat-template/tools_and_llm_response.md CHANGED
@@ -241,3 +241,6 @@ Hey, what's the temperature in Paris right now?<|im_end|>
241
  - **tools在prompt中的位置**: 拼接到原始`system`的结尾。
242
  - **出参**: 返回的`response` 要求是 `<tool_call>` 包裹的json
243
  `return a json object with function name and arguments within <tool_call></tool_call> XML tags:\n<tool_call>\n{"name": <function-name>, "arguments": <args-json-object>}\n</tool_call>`
 
 
 
 
241
  - **tools在prompt中的位置**: 拼接到原始`system`的结尾。
242
  - **出参**: 返回的`response` 要求是 `<tool_call>` 包裹的json
243
  `return a json object with function name and arguments within <tool_call></tool_call> XML tags:\n<tool_call>\n{"name": <function-name>, "arguments": <args-json-object>}\n</tool_call>`
244
+
245
+
246
+ ##