cantillation committed on
Commit
c28657a
·
verified ·
1 Parent(s): 827824d

End of training

Browse files
README.md CHANGED
@@ -22,19 +22,19 @@ should probably proofread and complete it, then remove this comment. -->
22
 
23
  This model is a fine-tuned version of [openai/whisper-medium](https://huggingface.co/openai/whisper-medium) on an unknown dataset.
24
  It achieves the following results on the evaluation set:
25
- - Loss: 1.1249
26
- - Precision: 0.2559
27
- - Recall: 0.2742
28
- - F1: 0.2642
29
- - Precision Median: 0.25
30
- - Recall Median: 0.2727
31
- - F1 Median: 0.2609
32
- - Precision Max: 0.4211
33
- - Recall Max: 0.4706
34
- - F1 Max: 0.4444
35
- - Precision Min: 0.0526
36
- - Recall Min: 0.05
37
- - F1 Min: 0.0513
38
 
39
  ## Model description
40
 
@@ -53,25 +53,24 @@ More information needed
53
  ### Training hyperparameters
54
 
55
  The following hyperparameters were used during training:
56
- - learning_rate: 8e-05
57
- - train_batch_size: 12
58
  - eval_batch_size: 8
59
  - seed: 42
60
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
61
  - lr_scheduler_type: linear
62
- - lr_scheduler_warmup_steps: 20
63
- - training_steps: 25
64
  - mixed_precision_training: Native AMP
65
 
66
  ### Training results
67
 
68
  | Training Loss | Epoch | Step | Validation Loss | Precision | Recall | F1 | Precision Median | Recall Median | F1 Median | Precision Max | Recall Max | F1 Max | Precision Min | Recall Min | F1 Min |
69
  |:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:------:|:----------------:|:-------------:|:---------:|:-------------:|:----------:|:------:|:-------------:|:----------:|:------:|
70
- | No log | 0.0 | 5 | 5.8029 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0 | 0 | 0 | 0 | 0 | 0 |
71
- | No log | 0.01 | 10 | 2.9216 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0 | 0 | 0 | 0 | 0 | 0 |
72
- | No log | 0.01 | 15 | 2.1863 | 0.0540 | 0.0710 | 0.0609 | 0.0476 | 0.0769 | 0.0541 | 0.2 | 0.2353 | 0.2162 | 0.0 | 0.0 | 0.0 |
73
- | No log | 0.01 | 20 | 1.1833 | 0.3468 | 0.3692 | 0.3565 | 0.4118 | 0.4286 | 0.4242 | 0.8 | 0.8 | 0.8000 | 0.0 | 0.0 | 0.0 |
74
- | 3.5014 | 0.01 | 25 | 1.1249 | 0.2559 | 0.2742 | 0.2642 | 0.25 | 0.2727 | 0.2609 | 0.4211 | 0.4706 | 0.4444 | 0.0526 | 0.05 | 0.0513 |
75
 
76
 
77
  ### Framework versions
 
22
 
23
  This model is a fine-tuned version of [openai/whisper-medium](https://huggingface.co/openai/whisper-medium) on an unknown dataset.
24
  It achieves the following results on the evaluation set:
25
+ - Loss: 1.3168
26
+ - Precision: 0.1010
27
+ - Recall: 0.1098
28
+ - F1: 0.1051
29
+ - Precision Median: 0.0
30
+ - Recall Median: 0.0
31
+ - F1 Median: 0.0
32
+ - Precision Max: 0.5
33
+ - Recall Max: 0.5333
34
+ - F1 Max: 0.5161
35
+ - Precision Min: 0.0
36
+ - Recall Min: 0.0
37
+ - F1 Min: 0.0
38
 
39
  ## Model description
40
 
 
53
  ### Training hyperparameters
54
 
55
  The following hyperparameters were used during training:
56
+ - learning_rate: 1e-06
57
+ - train_batch_size: 32
58
  - eval_batch_size: 8
59
  - seed: 42
60
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
61
  - lr_scheduler_type: linear
62
+ - lr_scheduler_warmup_steps: 200
63
+ - training_steps: 800
64
  - mixed_precision_training: Native AMP
65
 
66
  ### Training results
67
 
68
  | Training Loss | Epoch | Step | Validation Loss | Precision | Recall | F1 | Precision Median | Recall Median | F1 Median | Precision Max | Recall Max | F1 Max | Precision Min | Recall Min | F1 Min |
69
  |:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:------:|:----------------:|:-------------:|:---------:|:-------------:|:----------:|:------:|:-------------:|:----------:|:------:|
70
+ | 3.5705 | 0.32 | 200 | 2.7306 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0 | 0 | 0 | 0 | 0 | 0 |
71
+ | 2.0183 | 0.63 | 400 | 1.6209 | 0.0341 | 0.0373 | 0.0356 | 0.0 | 0.0 | 0.0 | 0.4375 | 0.4667 | 0.4516 | 0.0 | 0.0 | 0.0 |
72
+ | 1.6646 | 0.95 | 600 | 1.3710 | 0.1062 | 0.1151 | 0.1103 | 0.0 | 0.0 | 0.0 | 0.5 | 0.5333 | 0.5161 | 0.0 | 0.0 | 0.0 |
73
+ | 1.6004 | 1.27 | 800 | 1.3168 | 0.1010 | 0.1098 | 0.1051 | 0.0 | 0.0 | 0.0 | 0.5 | 0.5333 | 0.5161 | 0.0 | 0.0 | 0.0 |
 
74
 
75
 
76
  ### Framework versions
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "openai/whisper-medium",
3
  "activation_dropout": 0.1,
4
  "activation_function": "gelu",
5
  "apply_spec_augment": false,
@@ -13,18 +13,18 @@
13
  ],
14
  "bos_token_id": 50257,
15
  "classifier_proj_size": 256,
16
- "d_model": 1024,
17
- "decoder_attention_heads": 16,
18
- "decoder_ffn_dim": 4096,
19
  "decoder_input_ids": null,
20
  "decoder_layerdrop": 0.0,
21
- "decoder_layers": 24,
22
  "decoder_start_token_id": 50258,
23
  "dropout": 0.1,
24
- "encoder_attention_heads": 16,
25
- "encoder_ffn_dim": 4096,
26
  "encoder_layerdrop": 0.0,
27
- "encoder_layers": 24,
28
  "eos_token_id": 50257,
29
  "forced_decoder_ids": null,
30
  "init_std": 0.02,
@@ -40,7 +40,7 @@
40
  "max_target_positions": 448,
41
  "median_filter_width": 7,
42
  "model_type": "whisper",
43
- "num_hidden_layers": 24,
44
  "num_mel_bins": 80,
45
  "pad_token_id": 50257,
46
  "scale_embedding": false,
 
1
  {
2
+ "_name_or_path": "openai/whisper-tiny",
3
  "activation_dropout": 0.1,
4
  "activation_function": "gelu",
5
  "apply_spec_augment": false,
 
13
  ],
14
  "bos_token_id": 50257,
15
  "classifier_proj_size": 256,
16
+ "d_model": 384,
17
+ "decoder_attention_heads": 6,
18
+ "decoder_ffn_dim": 1536,
19
  "decoder_input_ids": null,
20
  "decoder_layerdrop": 0.0,
21
+ "decoder_layers": 4,
22
  "decoder_start_token_id": 50258,
23
  "dropout": 0.1,
24
+ "encoder_attention_heads": 6,
25
+ "encoder_ffn_dim": 1536,
26
  "encoder_layerdrop": 0.0,
27
+ "encoder_layers": 4,
28
  "eos_token_id": 50257,
29
  "forced_decoder_ids": null,
30
  "init_std": 0.02,
 
40
  "max_target_positions": 448,
41
  "median_filter_width": 7,
42
  "model_type": "whisper",
43
+ "num_hidden_layers": 4,
44
  "num_mel_bins": 80,
45
  "pad_token_id": 50257,
46
  "scale_embedding": false,
generation_config.json CHANGED
@@ -1,28 +1,28 @@
1
  {
2
  "alignment_heads": [
3
  [
4
- 13,
5
- 15
6
  ],
7
  [
8
- 15,
9
- 4
10
  ],
11
  [
12
- 15,
13
- 15
14
  ],
15
  [
16
- 16,
17
- 1
18
  ],
19
  [
20
- 20,
21
- 0
22
  ],
23
  [
24
- 23,
25
- 4
26
  ]
27
  ],
28
  "begin_suppress_tokens": [
 
1
  {
2
  "alignment_heads": [
3
  [
4
+ 2,
5
+ 2
6
  ],
7
  [
8
+ 3,
9
+ 0
10
  ],
11
  [
12
+ 3,
13
+ 2
14
  ],
15
  [
16
+ 3,
17
+ 3
18
  ],
19
  [
20
+ 3,
21
+ 4
22
  ],
23
  [
24
+ 3,
25
+ 5
26
  ]
27
  ],
28
  "begin_suppress_tokens": [
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f54d42f49d8b09dd8b31b9c978a06fcf8845df57976a09f0a437e88625dc530e
3
- size 3055671280
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a58cfd5695b6da2e034f88595f4d5b0a2e8aac9f0a8d9dd68227f5d70451656
3
+ size 151109288
runs/Feb15_06-05-10_sipl-7542-ct/events.out.tfevents.1707977115.sipl-7542-ct.1319778.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ab9bff1cf65c72f5ffe5cb8b214ed46e7a7c3834633412b5be2e9bf9cf8ac651
3
- size 21504
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f4d87b8c190c180e9249887a9b57e46ec838dd420c3a1a830b4400edd3703fc
3
+ size 35073
runs/Feb15_09-46-30_sipl-7542-ct/events.out.tfevents.1707990393.sipl-7542-ct.1389393.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8258ec2b78bf46bc2d7a862d79fd276c0cda3e16529c7a50066675415d80c1a7
3
+ size 32996
runs/Feb15_09-56-22_sipl-7542-ct/events.out.tfevents.1707990986.sipl-7542-ct.1389393.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f54339a7fe03aff2d8a32382960ea502bb100b8776bb1f84d28f90f42ad51309
3
+ size 15061
runs/Feb15_10-14-35_sipl-7542-ct/events.out.tfevents.1707992078.sipl-7542-ct.1398486.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02b06356517f3d1ca7c488f2af5ffefb093e196a1f9e632497cef97521a8b691
3
+ size 14312
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:72d81e4dee5fa4935124c935ad0735bba7504a6a2a97c04edab02cab35debb0d
3
  size 4475
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43481db32632992ddb738a945c08f45b8e22b8750f821072e117f72577ebc501
3
  size 4475