File size: 2,717 Bytes
fed6441
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
{
  "best_metric": null,
  "best_model_checkpoint": null,
  "epoch": 2.0,
  "eval_steps": 500,
  "global_step": 162,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 1.0,
      "eval_B": {
        "f1-score": 0.8087666523420713,
        "precision": 0.8189730200174065,
        "recall": 0.7988115449915111,
        "support": 1178.0
      },
      "eval_I": {
        "f1-score": 0.9374597034171502,
        "precision": 0.9521418826739427,
        "recall": 0.9232234509762421,
        "support": 18899.0
      },
      "eval_O": {
        "f1-score": 0.8881362400419788,
        "precision": 0.863303347862376,
        "recall": 0.9144400785854617,
        "support": 10180.0
      },
      "eval_accuracy": 0.9154245298608586,
      "eval_loss": 0.2228638380765915,
      "eval_macro avg": {
        "f1-score": 0.8781208652670669,
        "precision": 0.8781394168512416,
        "recall": 0.8788250248510717,
        "support": 30257.0
      },
      "eval_runtime": 4.7167,
      "eval_samples_per_second": 17.173,
      "eval_steps_per_second": 2.332,
      "eval_weighted avg": {
        "f1-score": 0.9158543469268937,
        "precision": 0.9170673807540184,
        "recall": 0.9154245298608586,
        "support": 30257.0
      },
      "step": 81
    },
    {
      "epoch": 2.0,
      "eval_B": {
        "f1-score": 0.8401515151515152,
        "precision": 0.7585499316005472,
        "recall": 0.9414261460101867,
        "support": 1178.0
      },
      "eval_I": {
        "f1-score": 0.9568235603470944,
        "precision": 0.9510219016256338,
        "recall": 0.9626964389650247,
        "support": 18899.0
      },
      "eval_O": {
        "f1-score": 0.9185648054827655,
        "precision": 0.9430877483443708,
        "recall": 0.8952848722986247,
        "support": 10180.0
      },
      "eval_accuracy": 0.9391876260038999,
      "eval_loss": 0.16692574322223663,
      "eval_macro avg": {
        "f1-score": 0.905179960327125,
        "precision": 0.8842198605235172,
        "recall": 0.9331358190912787,
        "support": 30257.0
      },
      "eval_runtime": 4.7116,
      "eval_samples_per_second": 17.192,
      "eval_steps_per_second": 2.335,
      "eval_weighted avg": {
        "f1-score": 0.9394089523635119,
        "precision": 0.9408589092241132,
        "recall": 0.9391876260038999,
        "support": 30257.0
      },
      "step": 162
    }
  ],
  "logging_steps": 500,
  "max_steps": 4050,
  "num_input_tokens_seen": 0,
  "num_train_epochs": 50,
  "save_steps": 500,
  "total_flos": 286680220671600.0,
  "train_batch_size": 4,
  "trial_name": null,
  "trial_params": null
}