File size: 2,718 Bytes
fed6441
 
 
 
 
 
 
 
 
 
 
 
 
c432d27
 
 
 
fed6441
 
c432d27
 
 
 
fed6441
 
c432d27
 
 
 
fed6441
c432d27
 
fed6441
c432d27
 
 
 
fed6441
c432d27
 
 
fed6441
c432d27
 
 
 
fed6441
 
 
 
 
 
c432d27
 
 
 
fed6441
 
c432d27
 
 
 
fed6441
 
c432d27
 
 
 
fed6441
c432d27
 
fed6441
c432d27
 
 
 
fed6441
c432d27
 
 
fed6441
c432d27
 
 
 
fed6441
 
 
 
 
 
 
 
 
c432d27
fed6441
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
{
  "best_metric": null,
  "best_model_checkpoint": null,
  "epoch": 2.0,
  "eval_steps": 500,
  "global_step": 162,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 1.0,
      "eval_B": {
        "f1-score": 0.8331822302810515,
        "precision": 0.7901977644024075,
        "recall": 0.8811121764141898,
        "support": 1043.0
      },
      "eval_I": {
        "f1-score": 0.9471294753175105,
        "precision": 0.9443616777446711,
        "recall": 0.9499135446685879,
        "support": 17350.0
      },
      "eval_O": {
        "f1-score": 0.8992868897421833,
        "precision": 0.9103731674811195,
        "recall": 0.8884673748103187,
        "support": 9226.0
      },
      "eval_accuracy": 0.9267895289474637,
      "eval_loss": 0.20478281378746033,
      "eval_macro avg": {
        "f1-score": 0.8931995317802484,
        "precision": 0.8816442032093993,
        "recall": 0.9064976986310321,
        "support": 27619.0
      },
      "eval_runtime": 4.6128,
      "eval_samples_per_second": 17.343,
      "eval_steps_per_second": 2.168,
      "eval_weighted avg": {
        "f1-score": 0.9268447919078652,
        "precision": 0.9271861479533134,
        "recall": 0.9267895289474637,
        "support": 27619.0
      },
      "step": 81
    },
    {
      "epoch": 2.0,
      "eval_B": {
        "f1-score": 0.8682547399124939,
        "precision": 0.8806706114398422,
        "recall": 0.8561840843720039,
        "support": 1043.0
      },
      "eval_I": {
        "f1-score": 0.9590983771942466,
        "precision": 0.9592919333448654,
        "recall": 0.9589048991354466,
        "support": 17350.0
      },
      "eval_O": {
        "f1-score": 0.9226525313717006,
        "precision": 0.9208594256100194,
        "recall": 0.9244526338608281,
        "support": 9226.0
      },
      "eval_accuracy": 0.9435171439950758,
      "eval_loss": 0.16574698686599731,
      "eval_macro avg": {
        "f1-score": 0.9166685494928136,
        "precision": 0.9202739901315756,
        "recall": 0.9131805391227594,
        "support": 27619.0
      },
      "eval_runtime": 4.6238,
      "eval_samples_per_second": 17.302,
      "eval_steps_per_second": 2.163,
      "eval_weighted avg": {
        "f1-score": 0.9434932036816766,
        "precision": 0.9434846863370583,
        "recall": 0.9435171439950758,
        "support": 27619.0
      },
      "step": 162
    }
  ],
  "logging_steps": 500,
  "max_steps": 4050,
  "num_input_tokens_seen": 0,
  "num_train_epochs": 50,
  "save_steps": 500,
  "total_flos": 287573305471200.0,
  "train_batch_size": 4,
  "trial_name": null,
  "trial_params": null
}