yanTemp commited on
Commit
da770c1
·
verified ·
1 Parent(s): 6678aaf

Training in progress, epoch 1

Browse files
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f7803832bbb135b2e0f33dec6f9c991f5885e75a2deedd28a6ee7c8fcbea2ba2
3
  size 10108960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36368dfd8991de06598b374b05f2982e3aefedbe4aeac760b8d6b8026242b0de
3
  size 10108960
trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "best_global_step": 14,
3
- "best_metric": 7.821501731872559,
4
  "best_model_checkpoint": "qwen2.5-7b-instruct-sft/checkpoint-14",
5
  "epoch": 2.0,
6
  "eval_steps": 8,
@@ -11,36 +11,36 @@
11
  "log_history": [
12
  {
13
  "epoch": 1.0,
14
- "eval_accuracy": 0.010252904989747097,
15
- "eval_entropy": 2.023237184474343,
16
- "eval_loss": 8.50821304321289,
17
- "eval_mean_token_accuracy": 0.33141817387781647,
18
- "eval_num_tokens": 10134.0,
19
- "eval_runtime": 5.8055,
20
- "eval_samples_per_second": 3.273,
21
- "eval_steps_per_second": 3.273,
22
  "step": 7
23
  },
24
  {
25
  "epoch": 2.0,
26
- "eval_accuracy": 0.011847801321485534,
27
- "eval_entropy": 2.32025314632215,
28
- "eval_loss": 7.821501731872559,
29
- "eval_mean_token_accuracy": 0.3833909505291989,
30
- "eval_num_tokens": 20268.0,
31
- "eval_runtime": 5.4711,
32
- "eval_samples_per_second": 3.473,
33
- "eval_steps_per_second": 3.473,
34
  "step": 14
35
  },
36
  {
37
  "epoch": 2.0,
38
  "step": 14,
39
- "total_flos": 942424595324928.0,
40
- "train_loss": 9.187333243233818,
41
- "train_runtime": 63.3043,
42
- "train_samples_per_second": 1.58,
43
- "train_steps_per_second": 0.221
44
  }
45
  ],
46
  "logging_steps": 20,
@@ -60,7 +60,7 @@
60
  "attributes": {}
61
  }
62
  },
63
- "total_flos": 942424595324928.0,
64
  "train_batch_size": 1,
65
  "trial_name": null,
66
  "trial_params": null
 
1
  {
2
  "best_global_step": 14,
3
+ "best_metric": 7.935835361480713,
4
  "best_model_checkpoint": "qwen2.5-7b-instruct-sft/checkpoint-14",
5
  "epoch": 2.0,
6
  "eval_steps": 8,
 
11
  "log_history": [
12
  {
13
  "epoch": 1.0,
14
+ "eval_accuracy": 0.014050964515360804,
15
+ "eval_entropy": 2.0623741275385807,
16
+ "eval_loss": 8.619595527648926,
17
+ "eval_mean_token_accuracy": 0.318189589600814,
18
+ "eval_num_tokens": 10278.0,
19
+ "eval_runtime": 5.6586,
20
+ "eval_samples_per_second": 3.358,
21
+ "eval_steps_per_second": 3.358,
22
  "step": 7
23
  },
24
  {
25
  "epoch": 2.0,
26
+ "eval_accuracy": 0.01476542033817576,
27
+ "eval_entropy": 2.3609655405345715,
28
+ "eval_loss": 7.935835361480713,
29
+ "eval_mean_token_accuracy": 0.3734086673510702,
30
+ "eval_num_tokens": 20556.0,
31
+ "eval_runtime": 5.4063,
32
+ "eval_samples_per_second": 3.514,
33
+ "eval_steps_per_second": 3.514,
34
  "step": 14
35
  },
36
  {
37
  "epoch": 2.0,
38
  "step": 14,
39
+ "total_flos": 955816063819776.0,
40
+ "train_loss": 9.08677237374442,
41
+ "train_runtime": 64.7345,
42
+ "train_samples_per_second": 1.545,
43
+ "train_steps_per_second": 0.216
44
  }
45
  ],
46
  "logging_steps": 20,
 
60
  "attributes": {}
61
  }
62
  },
63
+ "total_flos": 955816063819776.0,
64
  "train_batch_size": 1,
65
  "trial_name": null,
66
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:28a2a2a99dd14f22869563a396717cc0f93677e1ec5284c6dc50ac20ea7c9d57
3
  size 5752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5060514daa07d2cc108c95569ab29dbd15d3bf97638012471eb97161866abd71
3
  size 5752