KevinKibe commited on
Commit
76ab158
·
verified ·
1 Parent(s): e000775

Training in progress, step 500, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1,5 +1,5 @@
1
  ---
2
- base_model: KevinKibe/whisper-medium-finetuned
3
  library_name: peft
4
  ---
5
 
 
1
  ---
2
+ base_model: openai/whisper-medium
3
  library_name: peft
4
  ---
5
 
last-checkpoint/adapter_config.json CHANGED
@@ -4,7 +4,7 @@
4
  "base_model_class": "WhisperForConditionalGeneration",
5
  "parent_library": "transformers.models.whisper.modeling_whisper"
6
  },
7
- "base_model_name_or_path": "KevinKibe/whisper-medium-finetuned",
8
  "bias": "none",
9
  "fan_in_fan_out": false,
10
  "inference_mode": true,
@@ -23,8 +23,8 @@
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
- "v_proj",
27
- "q_proj"
28
  ],
29
  "task_type": null,
30
  "use_dora": false,
 
4
  "base_model_class": "WhisperForConditionalGeneration",
5
  "parent_library": "transformers.models.whisper.modeling_whisper"
6
  },
7
+ "base_model_name_or_path": "openai/whisper-medium",
8
  "bias": "none",
9
  "fan_in_fan_out": false,
10
  "inference_mode": true,
 
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
+ "q_proj",
27
+ "v_proj"
28
  ],
29
  "task_type": null,
30
  "use_dora": false,
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dad58bb931d9189bca63983c26d895b242c8ed4b633805e855e35ae2505f1a1b
3
  size 37789960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91bfd41a240d5f46e27df0fa8eaa4cba9b7ea12286c752f0cde6a821798de512
3
  size 37789960
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:638b41e99e1609cbcbab8219d0535a4ebcbc92a4099f06b7a52ef07f8639253d
3
- size 12832890
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c4726a0216e59e43ea0e92156c263db32490a1766082e0377e6be629da197ae
3
+ size 12833082
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:98263ac62587796252c94311cc839dccae0b0ac4d75cd2ea9c2be57da9a15122
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b755517c5034c242c5d4f4c35049633483be35422a424d0ef852154ccb995195
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1986de5c7599722c0bc658aca1f6e53d646d865cffaac945a2d942205bc9fb1a
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:301b42e14f9709962c5351dead598e91b2add26553420de0920fa3b6e19b882a
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,85 +1,49 @@
1
  {
2
- "best_metric": 77.23864137626819,
3
- "best_model_checkpoint": "../KevinKibe/whisper-medium-finetuned-finetuned/checkpoint-100",
4
- "epoch": 1.37,
5
- "eval_steps": 25,
6
- "global_step": 100,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.25,
13
- "grad_norm": 1.408146858215332,
14
- "learning_rate": 7.7e-05,
15
- "loss": 3.9076,
16
- "step": 25
17
  },
18
  {
19
  "epoch": 0.25,
20
- "eval_loss": 3.914597749710083,
21
- "eval_runtime": 411.8208,
22
- "eval_samples_per_second": 0.607,
23
- "eval_steps_per_second": 0.039,
24
- "eval_wer": 106.30789589766212,
25
- "step": 25
26
- },
27
- {
28
- "epoch": 0.5,
29
- "grad_norm": 2.0066428184509277,
30
- "learning_rate": 5.2000000000000004e-05,
31
- "loss": 2.8203,
32
- "step": 50
33
- },
34
- {
35
- "epoch": 0.5,
36
- "eval_loss": 3.4905786514282227,
37
- "eval_runtime": 441.2692,
38
- "eval_samples_per_second": 0.567,
39
- "eval_steps_per_second": 0.036,
40
- "eval_wer": 84.11998235553595,
41
- "step": 50
42
- },
43
- {
44
- "epoch": 1.12,
45
- "grad_norm": 2.804873466491699,
46
- "learning_rate": 2.7000000000000002e-05,
47
- "loss": 2.5457,
48
- "step": 75
49
- },
50
- {
51
- "epoch": 1.12,
52
- "eval_loss": 3.293093204498291,
53
- "eval_runtime": 380.5263,
54
- "eval_samples_per_second": 0.657,
55
- "eval_steps_per_second": 0.042,
56
- "eval_wer": 77.63564181737979,
57
- "step": 75
58
- },
59
- {
60
- "epoch": 1.37,
61
- "grad_norm": 1.4536932706832886,
62
- "learning_rate": 2.0000000000000003e-06,
63
- "loss": 2.7631,
64
- "step": 100
65
- },
66
- {
67
- "epoch": 1.37,
68
- "eval_loss": 3.177401065826416,
69
- "eval_runtime": 382.2171,
70
- "eval_samples_per_second": 0.654,
71
- "eval_steps_per_second": 0.042,
72
- "eval_wer": 77.23864137626819,
73
- "step": 100
74
  }
75
  ],
76
- "logging_steps": 25,
77
- "max_steps": 100,
78
  "num_input_tokens_seen": 0,
79
  "num_train_epochs": 9223372036854775807,
80
- "save_steps": 25,
81
- "total_flos": 1.64643756834816e+18,
82
- "train_batch_size": 16,
 
 
 
 
 
 
 
 
 
 
 
 
83
  "trial_name": null,
84
  "trial_params": null
85
  }
 
1
  {
2
+ "best_metric": 103.4838076545633,
3
+ "best_model_checkpoint": "../KevinKibe/whisper-medium-finetuned-finetuned/checkpoint-500",
4
+ "epoch": 0.25,
5
+ "eval_steps": 500,
6
+ "global_step": 500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.25,
13
+ "grad_norm": 1.5150429010391235,
14
+ "learning_rate": 0.0007601010101010101,
15
+ "loss": 5.7804,
16
+ "step": 500
17
  },
18
  {
19
  "epoch": 0.25,
20
+ "eval_loss": 5.4739532470703125,
21
+ "eval_runtime": 542.8842,
22
+ "eval_samples_per_second": 0.461,
23
+ "eval_steps_per_second": 0.059,
24
+ "eval_wer": 103.4838076545633,
25
+ "step": 500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
26
  }
27
  ],
28
+ "logging_steps": 500,
29
+ "max_steps": 2000,
30
  "num_input_tokens_seen": 0,
31
  "num_train_epochs": 9223372036854775807,
32
+ "save_steps": 500,
33
+ "stateful_callbacks": {
34
+ "TrainerControl": {
35
+ "args": {
36
+ "should_epoch_stop": false,
37
+ "should_evaluate": false,
38
+ "should_log": false,
39
+ "should_save": true,
40
+ "should_training_stop": false
41
+ },
42
+ "attributes": {}
43
+ }
44
+ },
45
+ "total_flos": 1.654711123968e+19,
46
+ "train_batch_size": 32,
47
  "trial_name": null,
48
  "trial_params": null
49
  }
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:70f645ad7125d347ac1e93f576f3d767a1196ab723edf8df4c89a0728bf7d029
3
- size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2da8df2c4627709c71886adfa00d7303e0de97e4f21a222bec7b34d9a9d527d
3
+ size 5368