yanTemp committed on
Commit
7fce770
·
verified ·
1 Parent(s): 6eecd0d

Training in progress, epoch 1

Browse files
adapter_config.json CHANGED
@@ -25,8 +25,8 @@
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
28
- "v_proj",
29
- "q_proj"
30
  ],
31
  "target_parameters": null,
32
  "task_type": "CAUSAL_LM",
 
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
28
+ "q_proj",
29
+ "v_proj"
30
  ],
31
  "target_parameters": null,
32
  "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:52af2eba14357a8295689f041a36970347582ae25a07ec15f22b392c70a32ac0
3
  size 10108960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ad7cbf60dd99c739ae3769da5ab6dec2e4deefdf61e7ddea03b005f20466e20
3
  size 10108960
trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "best_global_step": 14,
3
- "best_metric": 7.769174098968506,
4
  "best_model_checkpoint": "qwen2.5-7b-instruct-sft/checkpoint-14",
5
  "epoch": 2.0,
6
  "eval_steps": 8,
@@ -11,36 +11,36 @@
11
  "log_history": [
12
  {
13
  "epoch": 1.0,
14
- "eval_accuracy": 0.011311172668513388,
15
- "eval_entropy": 1.995360060742027,
16
- "eval_loss": 8.486817359924316,
17
- "eval_mean_token_accuracy": 0.3320777494656412,
18
- "eval_num_tokens": 10173.0,
19
- "eval_runtime": 5.7445,
20
- "eval_samples_per_second": 3.308,
21
- "eval_steps_per_second": 3.308,
22
  "step": 7
23
  },
24
  {
25
  "epoch": 2.0,
26
- "eval_accuracy": 0.012003693444136657,
27
- "eval_entropy": 2.3059515451130115,
28
- "eval_loss": 7.769174098968506,
29
- "eval_mean_token_accuracy": 0.3835462488626179,
30
- "eval_num_tokens": 20346.0,
31
- "eval_runtime": 5.4565,
32
- "eval_samples_per_second": 3.482,
33
- "eval_steps_per_second": 3.482,
34
  "step": 14
35
  },
36
  {
37
  "epoch": 2.0,
38
  "step": 14,
39
- "total_flos": 946051451375616.0,
40
- "train_loss": 9.178882053920201,
41
- "train_runtime": 64.9953,
42
- "train_samples_per_second": 1.539,
43
- "train_steps_per_second": 0.215
44
  }
45
  ],
46
  "logging_steps": 20,
@@ -60,7 +60,7 @@
60
  "attributes": {}
61
  }
62
  },
63
- "total_flos": 946051451375616.0,
64
  "train_batch_size": 1,
65
  "trial_name": null,
66
  "trial_params": null
 
1
  {
2
  "best_global_step": 14,
3
+ "best_metric": 7.774374485015869,
4
  "best_model_checkpoint": "qwen2.5-7b-instruct-sft/checkpoint-14",
5
  "epoch": 2.0,
6
  "eval_steps": 8,
 
11
  "log_history": [
12
  {
13
  "epoch": 1.0,
14
+ "eval_accuracy": 0.009382151029748284,
15
+ "eval_entropy": 1.9991131769983392,
16
+ "eval_loss": 8.462516784667969,
17
+ "eval_mean_token_accuracy": 0.3313447864432084,
18
+ "eval_num_tokens": 10200.0,
19
+ "eval_runtime": 5.9276,
20
+ "eval_samples_per_second": 3.205,
21
+ "eval_steps_per_second": 3.205,
22
  "step": 7
23
  },
24
  {
25
  "epoch": 2.0,
26
+ "eval_accuracy": 0.009382151029748282,
27
+ "eval_entropy": 2.2881032667661967,
28
+ "eval_loss": 7.774374485015869,
29
+ "eval_mean_token_accuracy": 0.38798953043787104,
30
+ "eval_num_tokens": 20400.0,
31
+ "eval_runtime": 5.6575,
32
+ "eval_samples_per_second": 3.358,
33
+ "eval_steps_per_second": 3.358,
34
  "step": 14
35
  },
36
  {
37
  "epoch": 2.0,
38
  "step": 14,
39
+ "total_flos": 948562351718400.0,
40
+ "train_loss": 9.186460222516741,
41
+ "train_runtime": 63.5624,
42
+ "train_samples_per_second": 1.573,
43
+ "train_steps_per_second": 0.22
44
  }
45
  ],
46
  "logging_steps": 20,
 
60
  "attributes": {}
61
  }
62
  },
63
+ "total_flos": 948562351718400.0,
64
  "train_batch_size": 1,
65
  "trial_name": null,
66
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:94d8482c3d536c482f9ff6dc3cc5cf37c97b34842af3ea1abd2e8a6ce1ad5ccc
3
  size 5752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17d8fae980fd538a4af1f30218f3a02c9953cd57289afafef173d0fa6bca5dfc
3
  size 5752