Training in progress, epoch 1

Browse files

Files changed (9) hide show

chat_template.jinja +2 -2
config.json +1 -1
model-00001-of-00004.safetensors +1 -1
model-00002-of-00004.safetensors +1 -1
model-00003-of-00004.safetensors +1 -1
model-00004-of-00004.safetensors +1 -1
special_tokens_map.json +1 -7
tokenizer_config.json +1 -1
training_args.bin +2 -2

chat_template.jinja CHANGED Viewed

@@ -3,7 +3,7 @@
     {%- if messages[0]['role'] == 'system' %}
         {{- messages[0]['content'] }}
     {%- else %}
-        {{- 'Please reason step by step, and put your final answer within \\boxed{}.' }}
     {%- endif %}
     {{- "\n\n# Tools\n\nYou may call one or more functions to assist with the user query.\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>" }}
     {%- for tool in tools %}
@@ -15,7 +15,7 @@
     {%- if messages[0]['role'] == 'system' %}
         {{- '<|im_start|>system\n' + messages[0]['content'] + '<|im_end|>\n' }}
     {%- else %}
-        {{- '<|im_start|>system\nPlease reason step by step, and put your final answer within \\boxed{}.<|im_end|>\n' }}
     {%- endif %}
 {%- endif %}
 {%- for message in messages %}

     {%- if messages[0]['role'] == 'system' %}
         {{- messages[0]['content'] }}
     {%- else %}
+        {{- 'You are Open-R1, a language model trained by Hugging Face to help users. Your role as an assistant involves thoroughly exploring questions through a systematic thinking process before providing the final precise and accurate solutions. This requires engaging in a comprehensive cycle of analysis, summarizing, exploration, reassessment, reflection, backtracing, and iteration to develop well-considered thinking process. Please structure your response into two main sections: Thought and Solution using the specified format: <think> Thought section </think> Solution section. In the Thought section, detail your reasoning process in steps. Each step should include detailed considerations such as analysing questions, summarizing relevant findings, brainstorming new ideas, verifying the accuracy of the current steps, refining any errors, and revisiting previous steps. In the Solution section, based on various attempts, explorations, and reflections from the Thought section, systematically present the final solution that you deem correct. The Solution section should be logical, accurate, and concise and detail necessary steps needed to reach the conclusion. Now, try to solve the following question through the above guidelines.' }}
     {%- endif %}
     {{- "\n\n# Tools\n\nYou may call one or more functions to assist with the user query.\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>" }}
     {%- for tool in tools %}
     {%- if messages[0]['role'] == 'system' %}
         {{- '<|im_start|>system\n' + messages[0]['content'] + '<|im_end|>\n' }}
     {%- else %}
+        {{- '<|im_start|>system\nYou are Open-R1, a language model trained by Hugging Face to help users. Your role as an assistant involves thoroughly exploring questions through a systematic thinking process before providing the final precise and accurate solutions. This requires engaging in a comprehensive cycle of analysis, summarizing, exploration, reassessment, reflection, backtracing, and iteration to develop well-considered thinking process. Please structure your response into two main sections: Thought and Solution using the specified format: <think> Thought section </think> Solution section. In the Thought section, detail your reasoning process in steps. Each step should include detailed considerations such as analysing questions, summarizing relevant findings, brainstorming new ideas, verifying the accuracy of the current steps, refining any errors, and revisiting previous steps. In the Solution section, based on various attempts, explorations, and reflections from the Thought section, systematically present the final solution that you deem correct. The Solution section should be logical, accurate, and concise and detail necessary steps needed to reach the conclusion. Now, try to solve the following question through the above guidelines.<|im_end|>\n' }}
     {%- endif %}
 {%- endif %}
 {%- for message in messages %}

config.json CHANGED Viewed

@@ -22,7 +22,7 @@
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
   "transformers_version": "4.52.3",
-  "use_cache": true,
   "use_sliding_window": false,
   "vocab_size": 152064
 }

   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
   "transformers_version": "4.52.3",
+  "use_cache": false,
   "use_sliding_window": false,
   "vocab_size": 152064
 }

model-00001-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:22dede961cd25c99d99dba67bf0e052c031e90105c4524912a6f02e8ff665a4e
 size 4877660776

 version https://git-lfs.github.com/spec/v1
+oid sha256:17f4b4acd013c1a049ddb0daa84c37b071ab95da0eb1161d8b4811a12094eb64
 size 4877660776

model-00002-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2ea67a0b8864386be73477bc08a531c9e6843267b63466a21e2c50229fe51bc5
 size 4932751008

 version https://git-lfs.github.com/spec/v1
+oid sha256:9f6557d447c8e243f4862d8ce20fe2a398096514883f9864bf4932fe0490a98d
 size 4932751008

model-00003-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fde9238b2b2a63557ce6a674cd1a0e0629d2276e83f6a857c39364a71ddc3ffe
 size 4330865200

 version https://git-lfs.github.com/spec/v1
+oid sha256:c07af1346d5464c4a7c1c572a032f5a32b6cca0883d3bb356d6ecdee6401a7d8
 size 4330865200

model-00004-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:97ebe44b7924488148b753f3d5fc49fe2050746aaf098bb26f9c3effa5d2541c
 size 1089994880

 version https://git-lfs.github.com/spec/v1
+oid sha256:6a0c2e4bfd9a940c9c6b192a4b3d582d65947ccdf124b8e8c4dc4e11d26c1ad0
 size 1089994880

special_tokens_map.json CHANGED Viewed

@@ -14,13 +14,7 @@
     "<|image_pad|>",
     "<|video_pad|>"
   ],
-  "eos_token": {
-    "content": "<|endoftext|>",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
   "pad_token": {
     "content": "<|endoftext|>",
     "lstrip": false,

     "<|image_pad|>",
     "<|video_pad|>"
   ],
+  "eos_token": "<|im_end|>",
   "pad_token": {
     "content": "<|endoftext|>",
     "lstrip": false,

tokenizer_config.json CHANGED Viewed

@@ -196,7 +196,7 @@
   ],
   "bos_token": null,
   "clean_up_tokenization_spaces": false,
-  "eos_token": "<|endoftext|>",
   "errors": "replace",
   "extra_special_tokens": {},
   "model_max_length": 131072,

   ],
   "bos_token": null,
   "clean_up_tokenization_spaces": false,
+  "eos_token": "<|im_end|>",
   "errors": "replace",
   "extra_special_tokens": {},
   "model_max_length": 131072,

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0597b01b59f78b533a8c8785d7f32d7d65f4e1fcbc6c853dd5201ba8ca8e0392
-size 7288

 version https://git-lfs.github.com/spec/v1
+oid sha256:5c65576908344f84010c4d94640c5332fe4a0f21bfdd4c02b3a54743d30df66b
+size 12152