Theoreticallyhugo committed on
Commit
5cca7b7
·
verified ·
1 Parent(s): 412d7a4

Training in progress, epoch 1, checkpoint

Browse files
checkpoint-41/config.json CHANGED
@@ -55,7 +55,7 @@
55
  "pad_token_id": 1,
56
  "sep_token_id": 2,
57
  "torch_dtype": "float32",
58
- "transformers_version": "4.37.2",
59
  "type_vocab_size": 1,
60
  "vocab_size": 50265
61
  }
 
55
  "pad_token_id": 1,
56
  "sep_token_id": 2,
57
  "torch_dtype": "float32",
58
+ "transformers_version": "4.45.2",
59
  "type_vocab_size": 1,
60
  "vocab_size": 50265
61
  }
checkpoint-41/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4cde84e40589a581099de6ffd2b1dfb10787b5c8d90d303ed810a70a33697cd5
3
  size 592330980
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f14b7db205675e39b7bd2b7766040d5767ef618a5de3d85f933fd230453ae8bd
3
  size 592330980
checkpoint-41/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5f651f65956ed08780348bf8bfcaac2b4e5a12648ffed35bb061a6ba26807bf7
3
  size 1014670074
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8084d789f6d3e39dd190d98c0ab12ad0a6482fc011929fa0f34d81d7f752888
3
  size 1014670074
checkpoint-41/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4a939982f711c8a91f0893b4f281f0db4fd89d7ca52de2aed82098ef9ff76ea2
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:890a72e183ff8476ed86066068429358f1f4dfcd3a6900ecfd020262ecca5acf
3
  size 14244
checkpoint-41/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2edfde65f52fe0fcbc13f549dfed4fa891e3eb1476a6c03774294faa3865fa33
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea37e94b47f3f494a56a7641c427579f080658979e969fdceddf122598ddd745
3
  size 1064
checkpoint-41/tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
checkpoint-41/tokenizer_config.json CHANGED
@@ -43,12 +43,12 @@
43
  }
44
  },
45
  "bos_token": "<s>",
46
- "clean_up_tokenization_spaces": true,
47
  "cls_token": "<s>",
48
  "eos_token": "</s>",
49
  "errors": "replace",
50
  "mask_token": "<mask>",
51
- "model_max_length": 4096,
52
  "pad_token": "<pad>",
53
  "sep_token": "</s>",
54
  "tokenizer_class": "LongformerTokenizer",
 
43
  }
44
  },
45
  "bos_token": "<s>",
46
+ "clean_up_tokenization_spaces": false,
47
  "cls_token": "<s>",
48
  "eos_token": "</s>",
49
  "errors": "replace",
50
  "mask_token": "<mask>",
51
+ "model_max_length": 1000000000000000019884624838656,
52
  "pad_token": "<pad>",
53
  "sep_token": "</s>",
54
  "tokenizer_class": "LongformerTokenizer",
checkpoint-41/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
  "epoch": 1.0,
5
  "eval_steps": 500,
6
  "global_step": 41,
@@ -14,69 +14,81 @@
14
  "f1-score": 0.0,
15
  "precision": 0.0,
16
  "recall": 0.0,
17
- "support": 271.0
18
  },
19
  "eval_B-MajorClaim": {
20
  "f1-score": 0.0,
21
  "precision": 0.0,
22
  "recall": 0.0,
23
- "support": 139.0
24
  },
25
  "eval_B-Premise": {
26
- "f1-score": 0.778263585259213,
27
- "precision": 0.643595041322314,
28
- "recall": 0.9842022116903634,
29
- "support": 633.0
30
  },
31
  "eval_I-Claim": {
32
- "f1-score": 0.5213290460878884,
33
- "precision": 0.4563708012760368,
34
- "recall": 0.6078480379905024,
35
- "support": 4001.0
36
  },
37
  "eval_I-MajorClaim": {
38
- "f1-score": 0.520462355513902,
39
- "precision": 0.7011784511784511,
40
- "recall": 0.4138102334823646,
41
- "support": 2013.0
42
  },
43
  "eval_I-Premise": {
44
- "f1-score": 0.8648793805666204,
45
- "precision": 0.8778050331607159,
46
- "recall": 0.8523288637967537,
47
- "support": 11336.0
48
  },
49
  "eval_O": {
50
- "f1-score": 0.9947169811320755,
51
- "precision": 0.9991081780076697,
52
- "recall": 0.9903642149929278,
53
- "support": 11312.0
54
  },
55
- "eval_accuracy": 0.8332940582393537,
56
- "eval_loss": 0.4083092212677002,
57
  "eval_macro avg": {
58
- "f1-score": 0.5256644783656713,
59
- "precision": 0.5254367864207411,
60
- "recall": 0.5497933659932731,
61
- "support": 29705.0
62
  },
63
- "eval_runtime": 1.4074,
64
- "eval_samples_per_second": 56.843,
65
- "eval_steps_per_second": 7.105,
66
  "eval_weighted avg": {
67
- "f1-score": 0.830926787853407,
68
- "precision": 0.8381591322948091,
69
- "recall": 0.8332940582393537,
70
- "support": 29705.0
71
  },
72
  "step": 41
73
  }
74
  ],
75
  "logging_steps": 500,
76
- "max_steps": 656,
77
  "num_input_tokens_seen": 0,
78
- "num_train_epochs": 16,
79
  "save_steps": 500,
 
 
 
 
 
 
 
 
 
 
 
 
80
  "total_flos": 143790812718000.0,
81
  "train_batch_size": 8,
82
  "trial_name": null,
 
1
  {
2
+ "best_metric": 0.44872575998306274,
3
+ "best_model_checkpoint": "longformer-sep_tok_full_labels/checkpoint-41",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
6
  "global_step": 41,
 
14
  "f1-score": 0.0,
15
  "precision": 0.0,
16
  "recall": 0.0,
17
+ "support": 284.0
18
  },
19
  "eval_B-MajorClaim": {
20
  "f1-score": 0.0,
21
  "precision": 0.0,
22
  "recall": 0.0,
23
+ "support": 141.0
24
  },
25
  "eval_B-Premise": {
26
+ "f1-score": 0.8161057692307693,
27
+ "precision": 0.7102510460251046,
28
+ "recall": 0.9590395480225988,
29
+ "support": 708.0
30
  },
31
  "eval_I-Claim": {
32
+ "f1-score": 0.1270623933244832,
33
+ "precision": 0.5242566510172144,
34
+ "recall": 0.0722917565817868,
35
+ "support": 4634.0
36
  },
37
  "eval_I-MajorClaim": {
38
+ "f1-score": 0.6541305725755335,
39
+ "precision": 0.635728952772074,
40
+ "recall": 0.6736292428198434,
41
+ "support": 2298.0
42
  },
43
  "eval_I-Premise": {
44
+ "f1-score": 0.8604508262992788,
45
+ "precision": 0.7685153090699018,
46
+ "recall": 0.9773712438468886,
47
+ "support": 13611.0
48
  },
49
  "eval_O": {
50
+ "f1-score": 0.9838489353153878,
51
+ "precision": 0.9707444699912788,
52
+ "recall": 0.9973120469169993,
53
+ "support": 12277.0
54
  },
55
+ "eval_accuracy": 0.827879716078108,
56
+ "eval_loss": 0.44872575998306274,
57
  "eval_macro avg": {
58
+ "f1-score": 0.49165692810649325,
59
+ "precision": 0.5156423469822248,
60
+ "recall": 0.5256634054554452,
61
+ "support": 33953.0
62
  },
63
+ "eval_runtime": 1.5094,
64
+ "eval_samples_per_second": 53.001,
65
+ "eval_steps_per_second": 6.625,
66
  "eval_weighted avg": {
67
+ "f1-score": 0.7793158674251499,
68
+ "precision": 0.7884799553707518,
69
+ "recall": 0.827879716078108,
70
+ "support": 33953.0
71
  },
72
  "step": 41
73
  }
74
  ],
75
  "logging_steps": 500,
76
+ "max_steps": 205,
77
  "num_input_tokens_seen": 0,
78
+ "num_train_epochs": 5,
79
  "save_steps": 500,
80
+ "stateful_callbacks": {
81
+ "TrainerControl": {
82
+ "args": {
83
+ "should_epoch_stop": false,
84
+ "should_evaluate": false,
85
+ "should_log": false,
86
+ "should_save": true,
87
+ "should_training_stop": false
88
+ },
89
+ "attributes": {}
90
+ }
91
+ },
92
  "total_flos": 143790812718000.0,
93
  "train_batch_size": 8,
94
  "trial_name": null,
checkpoint-41/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e06f6b44c30fa94c6272333e445e6562930fffeb3ba856f3a9330b45193b951f
3
- size 4728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6bd9d9433178bb46233a14964dd91f951626a7f2358aaa46af2107a2de9fad4
3
+ size 5240