Theoreticallyhugo commited on
Commit
964a551
1 Parent(s): 5922793

Training in progress, epoch 1, checkpoint

Browse files
checkpoint-81/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5c387a25e4b00bd8cd7fa816321356f94c130c150563bb32e5f173abfddbaa7e
3
  size 592318676
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:081c2ef41ab09e428be3abf42fe6b940422819d1de460da39cf13185ce13fd5c
3
  size 592318676
checkpoint-81/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:be01019aa5d358abf203d5f0c0ad0ce50e7a0f3e182476dd5c4a75be9820c050
3
  size 1014645498
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04be85650238dc1a273e204437d4286ace2eadafbdc6fe6d813f47f51409f779
3
  size 1014645498
checkpoint-81/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:153cfd77c5ddcff6dcd449eda1e20921f085ad496090dd7960aa7943b2fa3326
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a10709715b57c56c4e889a17baa14c8e503a7581e52966680626f29eada9d5ae
3
  size 1064
checkpoint-81/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
  "epoch": 1.0,
5
  "eval_steps": 500,
6
  "global_step": 81,
@@ -11,47 +11,47 @@
11
  {
12
  "epoch": 1.0,
13
  "eval_B": {
14
- "f1-score": 0.8331822302810515,
15
- "precision": 0.7901977644024075,
16
- "recall": 0.8811121764141898,
17
- "support": 1043.0
18
  },
19
  "eval_I": {
20
- "f1-score": 0.9471294753175105,
21
- "precision": 0.9443616777446711,
22
- "recall": 0.9499135446685879,
23
- "support": 17350.0
24
  },
25
  "eval_O": {
26
- "f1-score": 0.8992868897421833,
27
- "precision": 0.9103731674811195,
28
- "recall": 0.8884673748103187,
29
- "support": 9226.0
30
  },
31
- "eval_accuracy": 0.9267895289474637,
32
- "eval_loss": 0.20478281378746033,
33
  "eval_macro avg": {
34
- "f1-score": 0.8931995317802484,
35
- "precision": 0.8816442032093993,
36
- "recall": 0.9064976986310321,
37
- "support": 27619.0
38
  },
39
- "eval_runtime": 4.6128,
40
- "eval_samples_per_second": 17.343,
41
- "eval_steps_per_second": 2.168,
42
  "eval_weighted avg": {
43
- "f1-score": 0.9268447919078652,
44
- "precision": 0.9271861479533134,
45
- "recall": 0.9267895289474637,
46
- "support": 27619.0
47
  },
48
  "step": 81
49
  }
50
  ],
51
  "logging_steps": 500,
52
- "max_steps": 4050,
53
  "num_input_tokens_seen": 0,
54
- "num_train_epochs": 50,
55
  "save_steps": 500,
56
  "total_flos": 143786652735600.0,
57
  "train_batch_size": 4,
 
1
  {
2
+ "best_metric": 0.2619660496711731,
3
+ "best_model_checkpoint": "longformer-spans/checkpoint-81",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
6
  "global_step": 81,
 
11
  {
12
  "epoch": 1.0,
13
  "eval_B": {
14
+ "f1-score": 0.816,
15
+ "precision": 0.7461594732991953,
16
+ "recall": 0.9002647837599294,
17
+ "support": 1133.0
18
  },
19
  "eval_I": {
20
+ "f1-score": 0.9321376763813793,
21
+ "precision": 0.9024103768767235,
22
+ "recall": 0.9638902525500463,
23
+ "support": 18333.0
24
  },
25
  "eval_O": {
26
+ "f1-score": 0.8560784528570645,
27
+ "precision": 0.931782945736434,
28
+ "recall": 0.7917511147142278,
29
+ "support": 9868.0
30
  },
31
+ "eval_accuracy": 0.9035249198881844,
32
+ "eval_loss": 0.2619660496711731,
33
  "eval_macro avg": {
34
+ "f1-score": 0.8680720430794812,
35
+ "precision": 0.860117598637451,
36
+ "recall": 0.8853020503414012,
37
+ "support": 29334.0
38
  },
39
+ "eval_runtime": 5.5032,
40
+ "eval_samples_per_second": 14.537,
41
+ "eval_steps_per_second": 1.817,
42
  "eval_weighted avg": {
43
+ "f1-score": 0.9020655278480035,
44
+ "precision": 0.9062562975065145,
45
+ "recall": 0.9035249198881844,
46
+ "support": 29334.0
47
  },
48
  "step": 81
49
  }
50
  ],
51
  "logging_steps": 500,
52
+ "max_steps": 1620,
53
  "num_input_tokens_seen": 0,
54
+ "num_train_epochs": 20,
55
  "save_steps": 500,
56
  "total_flos": 143786652735600.0,
57
  "train_batch_size": 4,
checkpoint-81/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:821ca433db9ddb761291ab61fc06d651ad248cd9d560cdb25f7f905e5aaff14e
3
  size 4856
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1094850123635c13193a80398a7bb1e351dd871416d3ce265431b259bf603290
3
  size 4856