Rodrigo1771 commited on
Commit
2ad910b
β€’
1 Parent(s): 3ad9b1a

Training in progress, epoch 0

Browse files
config.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "michiyasunaga/BioLinkBERT-base",
3
+ "architectures": [
4
+ "BertForTokenClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
+ "finetuning_task": "ner",
9
+ "gradient_checkpointing": false,
10
+ "hidden_act": "gelu",
11
+ "hidden_dropout_prob": 0.1,
12
+ "hidden_size": 768,
13
+ "id2label": {
14
+ "0": "O",
15
+ "1": "B-FARMACO",
16
+ "2": "I-FARMACO"
17
+ },
18
+ "initializer_range": 0.02,
19
+ "intermediate_size": 3072,
20
+ "label2id": {
21
+ "B-FARMACO": 1,
22
+ "I-FARMACO": 2,
23
+ "O": 0
24
+ },
25
+ "layer_norm_eps": 1e-12,
26
+ "max_position_embeddings": 512,
27
+ "model_type": "bert",
28
+ "num_attention_heads": 12,
29
+ "num_hidden_layers": 12,
30
+ "pad_token_id": 0,
31
+ "position_embedding_type": "absolute",
32
+ "torch_dtype": "float32",
33
+ "transformers_version": "4.44.2",
34
+ "type_vocab_size": 2,
35
+ "use_cache": true,
36
+ "vocab_size": 28895
37
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f57f8cb32ba197018ff5f8c352f86bd900630969a6d2cf89b36c87aa65389a35
3
+ size 430601004
special_tokens_map.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": {
3
+ "content": "[CLS]",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "mask_token": {
10
+ "content": "[MASK]",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "[PAD]",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "sep_token": {
24
+ "content": "[SEP]",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "unk_token": {
31
+ "content": "[UNK]",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ }
37
+ }
tb/events.out.tfevents.1725907965.3d77e24b7860.2139.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b09dccec4feec9f85899797939be45f6c969cc7741b0a6a1e7a8430350527727
3
+ size 5593
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "1": {
12
+ "content": "[UNK]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "2": {
20
+ "content": "[CLS]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "3": {
28
+ "content": "[SEP]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "4": {
36
+ "content": "[MASK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "clean_up_tokenization_spaces": true,
45
+ "cls_token": "[CLS]",
46
+ "do_basic_tokenize": true,
47
+ "do_lower_case": true,
48
+ "mask_token": "[MASK]",
49
+ "model_max_length": 1000000000000000019884624838656,
50
+ "never_split": null,
51
+ "pad_token": "[PAD]",
52
+ "sep_token": "[SEP]",
53
+ "strip_accents": null,
54
+ "tokenize_chinese_chars": true,
55
+ "tokenizer_class": "BertTokenizer",
56
+ "unk_token": "[UNK]"
57
+ }
train.log ADDED
@@ -0,0 +1,329 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
0
  0%| | 0/4350 [00:00<?, ?it/s]
1
  0%| | 1/4350 [00:01<2:12:56, 1.83s/it]
2
  0%| | 2/4350 [00:02<1:07:15, 1.08it/s]
3
  0%| | 3/4350 [00:02<45:13, 1.60it/s]
4
  0%| | 4/4350 [00:02<39:57, 1.81it/s]
5
  0%| | 5/4350 [00:03<35:34, 2.04it/s]
6
  0%| | 6/4350 [00:03<33:09, 2.18it/s]
7
  0%| | 7/4350 [00:03<28:41, 2.52it/s]
8
  0%| | 8/4350 [00:04<30:05, 2.40it/s]
9
  0%| | 9/4350 [00:04<29:31, 2.45it/s]
10
  0%| | 10/4350 [00:05<28:23, 2.55it/s]
11
  0%| | 11/4350 [00:05<30:05, 2.40it/s]
12
  0%| | 12/4350 [00:05<29:20, 2.46it/s]
13
  0%| | 13/4350 [00:06<27:44, 2.61it/s]
14
  0%| | 14/4350 [00:06<24:59, 2.89it/s]
15
  0%| | 15/4350 [00:06<24:46, 2.92it/s]
16
  0%| | 16/4350 [00:07<26:04, 2.77it/s]
17
  0%| | 17/4350 [00:07<24:24, 2.96it/s]
18
  0%| | 18/4350 [00:08<27:09, 2.66it/s]
19
  0%| | 19/4350 [00:08<24:24, 2.96it/s]
20
  0%| | 20/4350 [00:08<24:05, 3.00it/s]
21
  0%| | 21/4350 [00:09<30:36, 2.36it/s]
22
  1%| | 22/4350 [00:09<28:18, 2.55it/s]
23
  1%| | 23/4350 [00:09<27:57, 2.58it/s]
24
  1%| | 24/4350 [00:10<26:27, 2.72it/s]
25
  1%| | 25/4350 [00:10<26:40, 2.70it/s]
26
  1%| | 26/4350 [00:10<26:40, 2.70it/s]
27
  1%| | 27/4350 [00:11<24:01, 3.00it/s]
28
  1%| | 28/4350 [00:11<24:02, 3.00it/s]
29
  1%| | 29/4350 [00:11<24:01, 3.00it/s]
30
  1%| | 30/4350 [00:12<23:34, 3.05it/s]
31
  1%| | 31/4350 [00:12<24:18, 2.96it/s]
32
  1%| | 32/4350 [00:12<23:32, 3.06it/s]
33
  1%| | 33/4350 [00:13<24:37, 2.92it/s]
34
  1%| | 34/4350 [00:13<23:50, 3.02it/s]
35
  1%| | 35/4350 [00:13<23:51, 3.01it/s]
36
  1%| | 36/4350 [00:14<24:55, 2.88it/s]
37
  1%| | 37/4350 [00:14<24:01, 2.99it/s]
38
  1%| | 38/4350 [00:14<22:33, 3.19it/s]
39
  1%| | 39/4350 [00:15<25:07, 2.86it/s]
40
  1%| | 40/4350 [00:15<29:00, 2.48it/s]
41
  1%| | 41/4350 [00:16<28:27, 2.52it/s]
42
  1%| | 42/4350 [00:16<28:13, 2.54it/s]
43
  1%| | 43/4350 [00:17<29:44, 2.41it/s]
44
  1%| | 44/4350 [00:17<27:34, 2.60it/s]
45
  1%| | 45/4350 [00:17<28:06, 2.55it/s]
46
  1%| | 46/4350 [00:18<27:16, 2.63it/s]
47
  1%| | 47/4350 [00:18<27:55, 2.57it/s]
48
  1%| | 48/4350 [00:18<26:50, 2.67it/s]
49
  1%| | 49/4350 [00:19<25:00, 2.87it/s]
50
  1%| | 50/4350 [00:19<24:40, 2.90it/s]
51
  1%| | 51/4350 [00:19<25:36, 2.80it/s]
52
  1%| | 52/4350 [00:20<24:53, 2.88it/s]
53
  1%| | 53/4350 [00:20<24:14, 2.95it/s]
54
  1%| | 54/4350 [00:21<28:01, 2.55it/s]
55
  1%|▏ | 55/4350 [00:21<25:47, 2.77it/s]
56
  1%|▏ | 56/4350 [00:21<23:08, 3.09it/s]
57
  1%|▏ | 57/4350 [00:22<26:16, 2.72it/s]
58
  1%|▏ | 58/4350 [00:22<27:50, 2.57it/s]
59
  1%|▏ | 59/4350 [00:22<29:53, 2.39it/s]
60
  1%|▏ | 60/4350 [00:23<28:31, 2.51it/s]
61
  1%|▏ | 61/4350 [00:23<27:04, 2.64it/s]
62
  1%|▏ | 62/4350 [00:23<25:53, 2.76it/s]
63
  1%|▏ | 63/4350 [00:24<26:30, 2.70it/s]
64
  1%|▏ | 64/4350 [00:24<28:35, 2.50it/s]
65
  1%|▏ | 65/4350 [00:25<25:48, 2.77it/s]
66
  2%|▏ | 66/4350 [00:25<25:04, 2.85it/s]
67
  2%|▏ | 67/4350 [00:25<24:52, 2.87it/s]
68
  2%|▏ | 68/4350 [00:26<27:19, 2.61it/s]
69
  2%|▏ | 69/4350 [00:26<25:42, 2.78it/s]
70
  2%|▏ | 70/4350 [00:26<25:14, 2.83it/s]
71
  2%|▏ | 71/4350 [00:27<25:14, 2.82it/s]
72
  2%|▏ | 72/4350 [00:27<23:56, 2.98it/s]
73
  2%|▏ | 73/4350 [00:27<22:54, 3.11it/s]
74
  2%|▏ | 74/4350 [00:28<28:00, 2.55it/s]
75
  2%|▏ | 75/4350 [00:28<26:37, 2.68it/s]
76
  2%|▏ | 76/4350 [00:29<25:57, 2.74it/s]
77
  2%|▏ | 77/4350 [00:29<24:17, 2.93it/s]
78
  2%|▏ | 78/4350 [00:29<24:17, 2.93it/s]
79
  2%|▏ | 79/4350 [00:29<23:24, 3.04it/s]
80
  2%|▏ | 80/4350 [00:30<27:57, 2.55it/s]
81
  2%|▏ | 81/4350 [00:30<27:40, 2.57it/s]
82
  2%|▏ | 82/4350 [00:31<25:47, 2.76it/s]
83
  2%|▏ | 83/4350 [00:31<25:12, 2.82it/s]
84
  2%|▏ | 84/4350 [00:32<28:43, 2.48it/s]
85
  2%|▏ | 85/4350 [00:32<27:43, 2.56it/s]
86
  2%|▏ | 86/4350 [00:32<26:44, 2.66it/s]
87
  2%|▏ | 87/4350 [00:32<23:57, 2.97it/s]
88
  2%|▏ | 88/4350 [00:33<22:46, 3.12it/s]
89
  2%|▏ | 89/4350 [00:33<22:05, 3.22it/s]
90
  2%|▏ | 90/4350 [00:33<23:12, 3.06it/s]
91
  2%|▏ | 91/4350 [00:34<23:42, 2.99it/s]
92
  2%|▏ | 92/4350 [00:34<24:55, 2.85it/s]
93
  2%|▏ | 93/4350 [00:35<25:03, 2.83it/s]
94
  2%|▏ | 94/4350 [00:35<24:31, 2.89it/s]
95
  2%|▏ | 95/4350 [00:35<24:28, 2.90it/s]
96
  2%|▏ | 96/4350 [00:36<25:09, 2.82it/s]
97
  2%|▏ | 97/4350 [00:36<25:18, 2.80it/s]
98
  2%|▏ | 98/4350 [00:36<24:34, 2.88it/s]
99
  2%|▏ | 99/4350 [00:37<23:06, 3.07it/s]
100
  2%|▏ | 100/4350 [00:37<25:02, 2.83it/s]
101
  2%|▏ | 101/4350 [00:37<24:55, 2.84it/s]
102
  2%|▏ | 102/4350 [00:38<26:01, 2.72it/s]
103
  2%|▏ | 103/4350 [00:38<24:38, 2.87it/s]
104
  2%|▏ | 104/4350 [00:38<24:56, 2.84it/s]
105
  2%|▏ | 105/4350 [00:39<24:00, 2.95it/s]
106
  2%|▏ | 106/4350 [00:39<22:39, 3.12it/s]
107
  2%|▏ | 107/4350 [00:39<21:17, 3.32it/s]
108
  2%|▏ | 108/4350 [00:40<21:47, 3.24it/s]
109
  3%|β–Ž | 109/4350 [00:40<21:16, 3.32it/s]
110
  3%|β–Ž | 110/4350 [00:40<22:04, 3.20it/s]
111
  3%|β–Ž | 111/4350 [00:41<22:32, 3.13it/s]
112
  3%|β–Ž | 112/4350 [00:41<21:56, 3.22it/s]
113
  3%|β–Ž | 113/4350 [00:41<23:45, 2.97it/s]
114
  3%|β–Ž | 114/4350 [00:42<26:21, 2.68it/s]
115
  3%|β–Ž | 115/4350 [00:42<24:32, 2.88it/s]
116
  3%|β–Ž | 116/4350 [00:42<23:14, 3.04it/s]
117
  3%|β–Ž | 117/4350 [00:43<23:19, 3.03it/s]
118
  3%|β–Ž | 118/4350 [00:43<22:47, 3.10it/s]
119
  3%|β–Ž | 119/4350 [00:43<23:32, 2.99it/s]
120
  3%|β–Ž | 120/4350 [00:43<21:34, 3.27it/s]
121
  3%|β–Ž | 121/4350 [00:44<22:33, 3.12it/s]
122
  3%|β–Ž | 122/4350 [00:44<24:02, 2.93it/s]
123
  3%|β–Ž | 123/4350 [00:44<22:52, 3.08it/s]
124
  3%|β–Ž | 124/4350 [00:45<23:48, 2.96it/s]
125
  3%|β–Ž | 125/4350 [00:45<23:16, 3.03it/s]
126
  3%|β–Ž | 126/4350 [00:45<22:53, 3.08it/s]
127
  3%|β–Ž | 127/4350 [00:46<24:18, 2.89it/s]
128
  3%|β–Ž | 128/4350 [00:46<27:49, 2.53it/s]
129
  3%|β–Ž | 129/4350 [00:47<26:33, 2.65it/s]
130
  3%|β–Ž | 130/4350 [00:47<27:10, 2.59it/s]
131
  3%|β–Ž | 131/4350 [00:47<25:19, 2.78it/s]
132
  3%|β–Ž | 132/4350 [00:48<25:45, 2.73it/s]
133
  3%|β–Ž | 133/4350 [00:48<29:04, 2.42it/s]
134
  3%|β–Ž | 134/4350 [00:49<29:58, 2.34it/s]
135
  3%|β–Ž | 135/4350 [00:49<31:40, 2.22it/s]
136
  3%|β–Ž | 136/4350 [00:50<30:30, 2.30it/s]
137
  3%|β–Ž | 137/4350 [00:50<27:22, 2.56it/s]
138
  3%|β–Ž | 138/4350 [00:50<25:51, 2.71it/s]
139
  3%|β–Ž | 139/4350 [00:51<26:03, 2.69it/s]
140
  3%|β–Ž | 140/4350 [00:51<24:06, 2.91it/s]
141
  3%|β–Ž | 141/4350 [00:51<23:46, 2.95it/s]
142
  3%|β–Ž | 142/4350 [00:52<22:27, 3.12it/s]
143
  3%|β–Ž | 143/4350 [00:52<22:25, 3.13it/s]
144
  3%|β–Ž | 144/4350 [00:52<21:37, 3.24it/s]
145
  3%|β–Ž | 145/4350 [00:53<24:18, 2.88it/s]
146
  3%|β–Ž | 146/4350 [00:53<22:25, 3.12it/s]
147
  3%|β–Ž | 147/4350 [00:53<21:27, 3.26it/s]
148
  3%|β–Ž | 148/4350 [00:53<21:06, 3.32it/s]
149
  3%|β–Ž | 149/4350 [00:54<23:46, 2.95it/s]
150
  3%|β–Ž | 150/4350 [00:54<24:06, 2.90it/s]
151
  3%|β–Ž | 151/4350 [00:55<24:54, 2.81it/s]
152
  3%|β–Ž | 152/4350 [00:55<23:49, 2.94it/s]
153
  4%|β–Ž | 153/4350 [00:55<25:34, 2.74it/s]
154
  4%|β–Ž | 154/4350 [00:56<24:10, 2.89it/s]
155
  4%|β–Ž | 155/4350 [00:56<24:19, 2.88it/s]
156
  4%|β–Ž | 156/4350 [00:56<23:13, 3.01it/s]
157
  4%|β–Ž | 157/4350 [00:57<25:11, 2.77it/s]
158
  4%|β–Ž | 158/4350 [00:57<24:25, 2.86it/s]
159
  4%|β–Ž | 159/4350 [00:57<23:44, 2.94it/s]
160
  4%|β–Ž | 160/4350 [00:58<22:35, 3.09it/s]
161
  4%|β–Ž | 161/4350 [00:58<22:00, 3.17it/s]
162
  4%|β–Ž | 162/4350 [00:58<22:49, 3.06it/s]
163
  4%|β–Ž | 163/4350 [00:59<26:36, 2.62it/s]
164
  4%|▍ | 164/4350 [00:59<25:37, 2.72it/s]
165
  4%|▍ | 165/4350 [00:59<25:31, 2.73it/s]
166
  4%|▍ | 166/4350 [01:00<26:19, 2.65it/s]
167
  4%|▍ | 167/4350 [01:00<24:27, 2.85it/s]
168
  4%|▍ | 168/4350 [01:00<23:39, 2.95it/s]
169
  4%|▍ | 169/4350 [01:01<22:04, 3.16it/s]
170
  4%|▍ | 170/4350 [01:01<23:16, 2.99it/s]
171
  4%|▍ | 171/4350 [01:02<25:14, 2.76it/s]
172
  4%|▍ | 172/4350 [01:02<25:29, 2.73it/s]
173
  4%|▍ | 173/4350 [01:02<24:27, 2.85it/s]
174
  4%|▍ | 174/4350 [01:03<23:42, 2.93it/s]
175
  4%|▍ | 175/4350 [01:03<25:38, 2.71it/s]
176
  4%|▍ | 176/4350 [01:04<29:19, 2.37it/s]
177
  4%|▍ | 177/4350 [01:04<26:11, 2.66it/s]
178
  4%|▍ | 178/4350 [01:04<25:03, 2.77it/s]
179
  4%|▍ | 179/4350 [01:05<27:02, 2.57it/s]
180
  4%|▍ | 180/4350 [01:05<25:35, 2.72it/s]
181
  4%|▍ | 181/4350 [01:06<30:51, 2.25it/s]
182
  4%|▍ | 182/4350 [01:06<27:49, 2.50it/s]
183
  4%|▍ | 183/4350 [01:06<24:28, 2.84it/s]
184
  4%|▍ | 184/4350 [01:06<23:31, 2.95it/s]
185
  4%|▍ | 185/4350 [01:07<22:51, 3.04it/s]
186
  4%|▍ | 186/4350 [01:07<23:20, 2.97it/s]
187
  4%|▍ | 187/4350 [01:07<23:48, 2.92it/s]
188
  4%|▍ | 188/4350 [01:08<22:44, 3.05it/s]
189
  4%|▍ | 189/4350 [01:08<22:45, 3.05it/s]
190
  4%|▍ | 190/4350 [01:08<23:19, 2.97it/s]
191
  4%|▍ | 191/4350 [01:09<23:47, 2.91it/s]
192
  4%|▍ | 192/4350 [01:09<25:42, 2.70it/s]
193
  4%|▍ | 193/4350 [01:09<24:41, 2.81it/s]
194
  4%|▍ | 194/4350 [01:10<22:46, 3.04it/s]
195
  4%|▍ | 195/4350 [01:10<26:31, 2.61it/s]
196
  5%|▍ | 196/4350 [01:11<26:26, 2.62it/s]
197
  5%|▍ | 197/4350 [01:11<25:04, 2.76it/s]
198
  5%|▍ | 198/4350 [01:11<23:15, 2.98it/s]
199
  5%|▍ | 199/4350 [01:12<23:17, 2.97it/s]
200
  5%|▍ | 200/4350 [01:12<25:40, 2.69it/s]
201
  5%|▍ | 201/4350 [01:12<24:17, 2.85it/s]
202
  5%|▍ | 202/4350 [01:13<23:54, 2.89it/s]
203
  5%|▍ | 203/4350 [01:13<23:43, 2.91it/s]
204
  5%|▍ | 204/4350 [01:13<24:44, 2.79it/s]
205
  5%|▍ | 205/4350 [01:14<24:15, 2.85it/s]
206
  5%|▍ | 206/4350 [01:14<23:12, 2.98it/s]
207
  5%|▍ | 207/4350 [01:14<23:25, 2.95it/s]
208
  5%|▍ | 208/4350 [01:15<26:19, 2.62it/s]
209
  5%|▍ | 209/4350 [01:15<24:53, 2.77it/s]
210
  5%|▍ | 210/4350 [01:15<22:57, 3.01it/s]
211
  5%|▍ | 211/4350 [01:16<24:11, 2.85it/s]
212
  5%|▍ | 212/4350 [01:16<22:46, 3.03it/s]
213
  5%|▍ | 213/4350 [01:16<23:04, 2.99it/s]
214
  5%|▍ | 214/4350 [01:17<29:05, 2.37it/s]
215
  5%|▍ | 215/4350 [01:17<27:47, 2.48it/s]
216
  5%|▍ | 216/4350 [01:18<27:23, 2.52it/s]
217
  5%|▍ | 217/4350 [01:18<25:58, 2.65it/s]
218
  5%|β–Œ | 218/4350 [01:18<24:47, 2.78it/s]
219
  5%|β–Œ | 219/4350 [01:19<27:15, 2.53it/s]
220
  5%|β–Œ | 220/4350 [01:19<27:40, 2.49it/s]
221
  5%|β–Œ | 221/4350 [01:20<28:06, 2.45it/s]
222
  5%|β–Œ | 222/4350 [01:20<26:57, 2.55it/s]
223
  5%|β–Œ | 223/4350 [01:21<28:14, 2.44it/s]
224
  5%|β–Œ | 224/4350 [01:21<28:53, 2.38it/s]
225
  5%|β–Œ | 225/4350 [01:21<29:20, 2.34it/s]
226
  5%|β–Œ | 226/4350 [01:22<27:47, 2.47it/s]
227
  5%|β–Œ | 227/4350 [01:22<26:55, 2.55it/s]
228
  5%|β–Œ | 228/4350 [01:23<25:30, 2.69it/s]
229
  5%|β–Œ | 229/4350 [01:23<23:06, 2.97it/s]
230
  5%|β–Œ | 230/4350 [01:23<22:14, 3.09it/s]
231
  5%|β–Œ | 231/4350 [01:23<23:09, 2.97it/s]
232
  5%|β–Œ | 232/4350 [01:24<23:03, 2.98it/s]
233
  5%|β–Œ | 233/4350 [01:24<22:17, 3.08it/s]
234
  5%|β–Œ | 234/4350 [01:24<23:21, 2.94it/s]
235
  5%|β–Œ | 235/4350 [01:25<23:27, 2.92it/s]
236
  5%|β–Œ | 236/4350 [01:25<23:20, 2.94it/s]
237
  5%|β–Œ | 237/4350 [01:25<22:38, 3.03it/s]
238
  5%|β–Œ | 238/4350 [01:26<21:16, 3.22it/s]
239
  5%|β–Œ | 239/4350 [01:26<27:58, 2.45it/s]
240
  6%|β–Œ | 240/4350 [01:27<26:00, 2.63it/s]
241
  6%|β–Œ | 241/4350 [01:27<23:48, 2.88it/s]
242
  6%|β–Œ | 242/4350 [01:27<26:38, 2.57it/s]
243
  6%|β–Œ | 243/4350 [01:28<25:21, 2.70it/s]
244
  6%|β–Œ | 244/4350 [01:28<29:04, 2.35it/s]
245
  6%|β–Œ | 245/4350 [01:29<28:52, 2.37it/s]
246
  6%|β–Œ | 246/4350 [01:29<29:27, 2.32it/s]
247
  6%|β–Œ | 247/4350 [01:30<28:08, 2.43it/s]
248
  6%|β–Œ | 248/4350 [01:30<27:08, 2.52it/s]
249
  6%|β–Œ | 249/4350 [01:30<27:43, 2.46it/s]
250
  6%|β–Œ | 250/4350 [01:31<26:32, 2.57it/s]
251
  6%|β–Œ | 251/4350 [01:31<26:18, 2.60it/s]
252
  6%|β–Œ | 252/4350 [01:31<26:35, 2.57it/s]
253
  6%|β–Œ | 253/4350 [01:32<24:08, 2.83it/s]
254
  6%|β–Œ | 254/4350 [01:32<22:32, 3.03it/s]
255
  6%|β–Œ | 255/4350 [01:32<22:46, 3.00it/s]
256
  6%|β–Œ | 256/4350 [01:33<22:59, 2.97it/s]
257
  6%|β–Œ | 257/4350 [01:33<25:40, 2.66it/s]
258
  6%|β–Œ | 258/4350 [01:34<29:38, 2.30it/s]
259
  6%|β–Œ | 259/4350 [01:34<27:20, 2.49it/s]
260
  6%|β–Œ | 260/4350 [01:34<28:15, 2.41it/s]
261
  6%|β–Œ | 261/4350 [01:35<27:24, 2.49it/s]
262
  6%|β–Œ | 262/4350 [01:35<26:03, 2.61it/s]
263
  6%|β–Œ | 263/4350 [01:36<26:28, 2.57it/s]
264
  6%|β–Œ | 264/4350 [01:36<23:58, 2.84it/s]
265
  6%|β–Œ | 265/4350 [01:36<23:33, 2.89it/s]
266
  6%|β–Œ | 266/4350 [01:37<23:12, 2.93it/s]
267
  6%|β–Œ | 267/4350 [01:37<23:00, 2.96it/s]
268
  6%|β–Œ | 268/4350 [01:37<23:03, 2.95it/s]
269
  6%|β–Œ | 269/4350 [01:37<20:59, 3.24it/s]
270
  6%|β–Œ | 270/4350 [01:38<22:08, 3.07it/s]
271
  6%|β–Œ | 271/4350 [01:38<23:17, 2.92it/s]
272
  6%|β–‹ | 272/4350 [01:38<22:17, 3.05it/s]
273
  6%|β–‹ | 273/4350 [01:39<22:14, 3.06it/s]
274
  6%|β–‹ | 274/4350 [01:39<22:00, 3.09it/s]
275
  6%|β–‹ | 275/4350 [01:39<23:06, 2.94it/s]
276
  6%|β–‹ | 276/4350 [01:40<22:26, 3.02it/s]
277
  6%|β–‹ | 277/4350 [01:40<21:32, 3.15it/s]
278
  6%|β–‹ | 278/4350 [01:41<24:22, 2.78it/s]
279
  6%|β–‹ | 279/4350 [01:41<23:27, 2.89it/s]
280
  6%|β–‹ | 280/4350 [01:41<22:21, 3.03it/s]
281
  6%|β–‹ | 281/4350 [01:41<22:36, 3.00it/s]
282
  6%|β–‹ | 282/4350 [01:42<21:42, 3.12it/s]
283
  7%|β–‹ | 283/4350 [01:42<21:10, 3.20it/s]
284
  7%|β–‹ | 284/4350 [01:42<21:09, 3.20it/s]
285
  7%|β–‹ | 285/4350 [01:43<21:50, 3.10it/s]
286
  7%|β–‹ | 286/4350 [01:43<25:09, 2.69it/s]
287
  7%|β–‹ | 287/4350 [01:44<25:34, 2.65it/s]
288
  7%|β–‹ | 288/4350 [01:44<25:56, 2.61it/s]
289
  7%|β–‹ | 289/4350 [01:44<24:41, 2.74it/s]
290
  7%|β–‹ | 290/4350 [01:45<26:16, 2.58it/s]
291
  7%|β–‹ | 291/4350 [01:45<27:35, 2.45it/s]
292
  7%|β–‹ | 292/4350 [01:46<25:57, 2.60it/s]
293
  7%|β–‹ | 293/4350 [01:46<28:13, 2.40it/s]
294
  7%|β–‹ | 294/4350 [01:46<25:55, 2.61it/s]
295
  7%|β–‹ | 295/4350 [01:47<25:00, 2.70it/s]
296
  7%|β–‹ | 296/4350 [01:47<24:25, 2.77it/s]
297
  7%|β–‹ | 297/4350 [01:47<25:04, 2.69it/s]
298
  7%|β–‹ | 298/4350 [01:48<23:36, 2.86it/s]
299
  7%|β–‹ | 299/4350 [01:48<25:33, 2.64it/s]
300
  7%|β–‹ | 300/4350 [01:49<27:17, 2.47it/s]
301
  7%|β–‹ | 301/4350 [01:49<27:11, 2.48it/s]
302
  7%|β–‹ | 302/4350 [01:49<27:24, 2.46it/s]
303
  7%|β–‹ | 303/4350 [01:50<25:35, 2.64it/s]
304
  7%|β–‹ | 304/4350 [01:50<24:47, 2.72it/s]
305
  7%|β–‹ | 305/4350 [01:50<25:02, 2.69it/s]
306
  7%|β–‹ | 306/4350 [01:51<24:32, 2.75it/s]
307
  7%|β–‹ | 307/4350 [01:51<27:04, 2.49it/s]
308
  7%|β–‹ | 308/4350 [01:52<25:18, 2.66it/s]
309
  7%|β–‹ | 309/4350 [01:52<25:37, 2.63it/s]
310
  7%|β–‹ | 310/4350 [01:52<25:13, 2.67it/s]
311
  7%|β–‹ | 311/4350 [01:53<23:19, 2.89it/s]
312
  7%|β–‹ | 312/4350 [01:53<23:13, 2.90it/s]
313
  7%|β–‹ | 313/4350 [01:53<24:41, 2.73it/s]
314
  7%|β–‹ | 314/4350 [01:54<22:47, 2.95it/s]
315
  7%|β–‹ | 315/4350 [01:54<22:39, 2.97it/s]
316
  7%|β–‹ | 316/4350 [01:54<22:45, 2.95it/s]
317
  7%|β–‹ | 317/4350 [01:55<21:31, 3.12it/s]
318
  7%|β–‹ | 318/4350 [01:55<22:18, 3.01it/s]
319
  7%|β–‹ | 319/4350 [01:55<21:27, 3.13it/s]
320
  7%|β–‹ | 320/4350 [01:56<21:30, 3.12it/s]
321
  7%|β–‹ | 321/4350 [01:56<23:32, 2.85it/s]
322
  7%|β–‹ | 322/4350 [01:56<21:24, 3.14it/s]
323
  7%|β–‹ | 323/4350 [01:57<23:29, 2.86it/s]
324
  7%|β–‹ | 324/4350 [01:57<23:12, 2.89it/s]
325
  7%|β–‹ | 325/4350 [01:57<22:36, 2.97it/s]
326
  7%|β–‹ | 326/4350 [01:58<23:16, 2.88it/s]
327
  8%|β–Š | 327/4350 [01:58<22:11, 3.02it/s]
328
  8%|β–Š | 328/4350 [01:58<21:27, 3.12it/s]
329
  8%|β–Š | 329/4350 [01:59<23:33, 2.84it/s]
330
  8%|β–Š | 330/4350 [01:59<23:29, 2.85it/s]
331
  8%|β–Š | 331/4350 [02:00<26:59, 2.48it/s]
332
  8%|β–Š | 332/4350 [02:00<27:55, 2.40it/s]
333
  8%|β–Š | 333/4350 [02:00<27:01, 2.48it/s]
334
  8%|β–Š | 334/4350 [02:01<30:38, 2.18it/s]
335
  8%|οΏ½οΏ½ | 335/4350 [02:01<29:04, 2.30it/s]
336
  8%|β–Š | 336/4350 [02:02<27:30, 2.43it/s]
337
  8%|β–Š | 337/4350 [02:02<25:57, 2.58it/s]
338
  8%|β–Š | 338/4350 [02:02<24:12, 2.76it/s]
339
  8%|β–Š | 339/4350 [02:03<23:21, 2.86it/s]
340
  8%|β–Š | 340/4350 [02:03<22:35, 2.96it/s]
341
  8%|β–Š | 341/4350 [02:03<21:15, 3.14it/s]
342
  8%|β–Š | 342/4350 [02:04<20:49, 3.21it/s]
343
  8%|β–Š | 343/4350 [02:04<21:41, 3.08it/s]
344
  8%|β–Š | 344/4350 [02:04<23:57, 2.79it/s]
345
  8%|β–Š | 345/4350 [02:05<28:34, 2.34it/s]
346
  8%|β–Š | 346/4350 [02:05<25:49, 2.58it/s]
347
  8%|β–Š | 347/4350 [02:06<27:21, 2.44it/s]
348
  8%|β–Š | 348/4350 [02:06<25:58, 2.57it/s]
349
  8%|β–Š | 349/4350 [02:06<24:03, 2.77it/s]
350
  8%|β–Š | 350/4350 [02:07<23:20, 2.86it/s]
351
  8%|β–Š | 351/4350 [02:07<23:17, 2.86it/s]
352
  8%|β–Š | 352/4350 [02:07<22:07, 3.01it/s]
353
  8%|β–Š | 353/4350 [02:08<22:21, 2.98it/s]
354
  8%|β–Š | 354/4350 [02:09<35:49, 1.86it/s]
355
  8%|β–Š | 355/4350 [02:09<30:43, 2.17it/s]
356
  8%|β–Š | 356/4350 [02:09<30:27, 2.19it/s]
357
  8%|β–Š | 357/4350 [02:10<28:53, 2.30it/s]
358
  8%|β–Š | 358/4350 [02:10<25:42, 2.59it/s]
359
  8%|β–Š | 359/4350 [02:10<24:35, 2.70it/s]
360
  8%|β–Š | 360/4350 [02:11<25:09, 2.64it/s]
361
  8%|β–Š | 361/4350 [02:11<24:13, 2.74it/s]
362
  8%|β–Š | 362/4350 [02:11<21:52, 3.04it/s]
363
  8%|β–Š | 363/4350 [02:12<20:15, 3.28it/s]
364
  8%|β–Š | 364/4350 [02:12<20:00, 3.32it/s]
365
  8%|β–Š | 365/4350 [02:12<21:02, 3.16it/s]
366
  8%|β–Š | 366/4350 [02:13<23:22, 2.84it/s]
367
  8%|β–Š | 367/4350 [02:13<22:17, 2.98it/s]
368
  8%|β–Š | 368/4350 [02:13<23:41, 2.80it/s]
369
  8%|β–Š | 369/4350 [02:14<23:06, 2.87it/s]
370
  9%|β–Š | 370/4350 [02:14<22:09, 2.99it/s]
371
  9%|β–Š | 371/4350 [02:14<22:07, 3.00it/s]
372
  9%|β–Š | 372/4350 [02:15<22:35, 2.93it/s]
373
  9%|β–Š | 373/4350 [02:15<21:52, 3.03it/s]
374
  9%|β–Š | 374/4350 [02:15<21:59, 3.01it/s]
375
  9%|β–Š | 375/4350 [02:16<25:02, 2.65it/s]
376
  9%|β–Š | 376/4350 [02:16<24:11, 2.74it/s]
377
  9%|β–Š | 377/4350 [02:17<23:32, 2.81it/s]
378
  9%|β–Š | 378/4350 [02:17<25:04, 2.64it/s]
379
  9%|β–Š | 379/4350 [02:17<24:13, 2.73it/s]
380
  9%|β–Š | 380/4350 [02:18<23:19, 2.84it/s]
381
  9%|β–‰ | 381/4350 [02:18<23:19, 2.84it/s]
382
  9%|β–‰ | 382/4350 [02:19<29:36, 2.23it/s]
383
  9%|β–‰ | 383/4350 [02:19<26:13, 2.52it/s]
384
  9%|β–‰ | 384/4350 [02:19<24:14, 2.73it/s]
385
  9%|β–‰ | 385/4350 [02:20<23:46, 2.78it/s]
386
  9%|β–‰ | 386/4350 [02:20<23:44, 2.78it/s]
387
  9%|β–‰ | 387/4350 [02:20<22:23, 2.95it/s]
388
  9%|β–‰ | 388/4350 [02:21<24:09, 2.73it/s]
389
  9%|β–‰ | 389/4350 [02:21<23:41, 2.79it/s]
390
  9%|β–‰ | 390/4350 [02:21<23:05, 2.86it/s]
391
  9%|β–‰ | 391/4350 [02:22<22:52, 2.88it/s]
392
  9%|β–‰ | 392/4350 [02:22<25:23, 2.60it/s]
393
  9%|β–‰ | 393/4350 [02:22<25:05, 2.63it/s]
394
  9%|β–‰ | 394/4350 [02:23<28:17, 2.33it/s]
395
  9%|β–‰ | 395/4350 [02:23<25:13, 2.61it/s]
396
  9%|β–‰ | 396/4350 [02:24<24:46, 2.66it/s]
397
  9%|β–‰ | 397/4350 [02:24<22:36, 2.91it/s]
398
  9%|β–‰ | 398/4350 [02:24<22:50, 2.88it/s]
399
  9%|β–‰ | 399/4350 [02:25<21:20, 3.08it/s]
400
  9%|β–‰ | 400/4350 [02:25<23:47, 2.77it/s]
401
  9%|β–‰ | 401/4350 [02:25<24:01, 2.74it/s]
402
  9%|β–‰ | 402/4350 [02:26<25:20, 2.60it/s]
403
  9%|β–‰ | 403/4350 [02:26<24:42, 2.66it/s]
404
  9%|β–‰ | 404/4350 [02:27<25:01, 2.63it/s]
405
  9%|β–‰ | 405/4350 [02:27<24:06, 2.73it/s]
406
  9%|β–‰ | 406/4350 [02:27<27:45, 2.37it/s]
407
  9%|β–‰ | 407/4350 [02:28<28:05, 2.34it/s]
408
  9%|β–‰ | 408/4350 [02:28<26:08, 2.51it/s]
409
  9%|β–‰ | 409/4350 [02:29<24:42, 2.66it/s]
410
  9%|β–‰ | 410/4350 [02:29<22:44, 2.89it/s]
411
  9%|β–‰ | 411/4350 [02:29<23:51, 2.75it/s]
412
  9%|β–‰ | 412/4350 [02:30<25:09, 2.61it/s]
413
  9%|β–‰ | 413/4350 [02:30<24:44, 2.65it/s]
414
  10%|β–‰ | 414/4350 [02:30<26:31, 2.47it/s]
415
  10%|β–‰ | 415/4350 [02:31<25:38, 2.56it/s]
416
  10%|β–‰ | 416/4350 [02:31<24:27, 2.68it/s]
417
  10%|β–‰ | 417/4350 [02:32<23:39, 2.77it/s]
418
  10%|β–‰ | 418/4350 [02:32<22:29, 2.91it/s]
419
  10%|β–‰ | 419/4350 [02:32<21:39, 3.02it/s]
420
  10%|β–‰ | 420/4350 [02:32<20:19, 3.22it/s]
421
  10%|β–‰ | 421/4350 [02:33<22:56, 2.85it/s]
422
  10%|β–‰ | 422/4350 [02:33<22:42, 2.88it/s]
423
  10%|β–‰ | 423/4350 [02:33<21:38, 3.03it/s]
424
  10%|β–‰ | 424/4350 [02:34<21:37, 3.03it/s]
425
  10%|β–‰ | 425/4350 [02:34<22:14, 2.94it/s]
426
  10%|β–‰ | 426/4350 [02:35<23:22, 2.80it/s]
427
  10%|β–‰ | 427/4350 [02:35<22:52, 2.86it/s]
428
  10%|β–‰ | 428/4350 [02:35<22:34, 2.89it/s]
429
  10%|β–‰ | 429/4350 [02:36<22:35, 2.89it/s]
430
  10%|β–‰ | 430/4350 [02:36<21:47, 3.00it/s]
431
  10%|β–‰ | 431/4350 [02:36<21:10, 3.09it/s]
432
  10%|β–‰ | 432/4350 [02:37<21:57, 2.97it/s]
433
  10%|β–‰ | 433/4350 [02:37<21:35, 3.02it/s]
434
  10%|β–‰ | 434/4350 [02:37<20:41, 3.15it/s]
435
  10%|β–ˆ | 435/4350 [02:38<23:47, 2.74it/s][INFO|trainer.py:811] 2024-09-09 18:55:23,830 >> The following columns in the evaluation set don't have a corresponding argument in `BertForTokenClassification.forward` and have been ignored: tokens, ner_tags, id. If tokens, ner_tags, id are not expected by `BertForTokenClassification.forward`, you can safely ignore this message.
 
 
 
 
 
 
436
  0%| | 0/869 [00:00<?, ?it/s]
 
437
  1%| | 10/869 [00:00<00:09, 93.25it/s]
 
438
  2%|▏ | 20/869 [00:00<00:10, 81.05it/s]
 
439
  3%|β–Ž | 29/869 [00:00<00:10, 78.93it/s]
 
440
  4%|▍ | 37/869 [00:00<00:10, 76.51it/s]
 
441
  5%|β–Œ | 46/869 [00:00<00:10, 80.40it/s]
 
442
  6%|β–‹ | 55/869 [00:00<00:09, 82.80it/s]
 
443
  7%|β–‹ | 64/869 [00:00<00:10, 77.85it/s]
 
444
  8%|β–Š | 72/869 [00:00<00:10, 76.99it/s]
 
445
  9%|β–‰ | 82/869 [00:01<00:09, 81.30it/s]
 
446
  11%|β–ˆ | 92/869 [00:01<00:09, 84.77it/s]
 
447
  12%|β–ˆβ– | 102/869 [00:01<00:08, 86.85it/s]
 
448
  13%|β–ˆβ–Ž | 111/869 [00:01<00:08, 84.28it/s]
 
449
  14%|β–ˆβ– | 120/869 [00:01<00:09, 82.94it/s]
 
450
  15%|β–ˆβ– | 129/869 [00:01<00:09, 80.32it/s]
 
451
  16%|β–ˆβ–Œ | 139/869 [00:01<00:08, 83.08it/s]
 
452
  17%|β–ˆβ–‹ | 148/869 [00:01<00:09, 78.75it/s]
 
453
  18%|β–ˆβ–Š | 157/869 [00:01<00:09, 78.73it/s]
 
454
  19%|β–ˆβ–‰ | 166/869 [00:02<00:08, 78.19it/s]
 
455
  20%|β–ˆβ–ˆ | 175/869 [00:02<00:08, 79.26it/s]
 
456
  21%|β–ˆβ–ˆ | 183/869 [00:02<00:08, 78.09it/s]
 
457
  22%|β–ˆβ–ˆβ– | 191/869 [00:02<00:08, 76.37it/s]
 
458
  23%|β–ˆβ–ˆβ–Ž | 199/869 [00:02<00:08, 76.97it/s]
 
459
  24%|β–ˆβ–ˆβ– | 208/869 [00:02<00:08, 78.45it/s]
 
460
  25%|β–ˆβ–ˆβ–Œ | 218/869 [00:02<00:07, 82.86it/s]
 
461
  26%|β–ˆβ–ˆβ–Œ | 227/869 [00:02<00:07, 83.20it/s]
 
462
  27%|β–ˆβ–ˆβ–‹ | 236/869 [00:02<00:08, 76.92it/s]
 
463
  28%|β–ˆβ–ˆβ–Š | 244/869 [00:03<00:08, 71.08it/s]
 
464
  29%|β–ˆβ–ˆβ–‰ | 253/869 [00:03<00:08, 75.15it/s]
 
465
  30%|β–ˆβ–ˆβ–ˆ | 262/869 [00:03<00:07, 76.76it/s]
 
466
  31%|β–ˆβ–ˆβ–ˆ | 270/869 [00:03<00:07, 74.97it/s]
 
467
  32%|β–ˆβ–ˆβ–ˆβ– | 278/869 [00:03<00:07, 74.44it/s]
 
468
  33%|β–ˆβ–ˆβ–ˆβ–Ž | 286/869 [00:03<00:07, 74.34it/s]
 
469
  34%|β–ˆβ–ˆβ–ˆβ– | 294/869 [00:03<00:07, 75.42it/s]
 
470
  35%|β–ˆβ–ˆβ–ˆβ– | 302/869 [00:03<00:07, 72.74it/s]
 
471
  36%|β–ˆβ–ˆβ–ˆβ–Œ | 310/869 [00:03<00:07, 74.05it/s]
 
472
  37%|β–ˆβ–ˆβ–ˆβ–‹ | 318/869 [00:04<00:07, 73.18it/s]
 
473
  38%|β–ˆβ–ˆβ–ˆβ–Š | 326/869 [00:04<00:07, 74.32it/s]
 
474
  39%|β–ˆβ–ˆβ–ˆβ–Š | 335/869 [00:04<00:06, 78.23it/s]
 
475
  39%|β–ˆβ–ˆβ–ˆβ–‰ | 343/869 [00:04<00:06, 75.35it/s]
 
476
  40%|β–ˆβ–ˆβ–ˆβ–ˆ | 351/869 [00:04<00:06, 74.42it/s]
 
477
  41%|β–ˆβ–ˆβ–ˆβ–ˆβ– | 360/869 [00:04<00:06, 77.90it/s]
 
478
  42%|β–ˆβ–ˆβ–ˆβ–ˆβ– | 369/869 [00:04<00:06, 79.65it/s]
 
479
  43%|β–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 377/869 [00:04<00:06, 76.71it/s]
 
480
  44%|β–ˆβ–ˆβ–ˆβ–ˆβ– | 385/869 [00:04<00:06, 75.81it/s]
 
481
  45%|β–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 393/869 [00:05<00:06, 72.15it/s]
 
482
  46%|β–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 402/869 [00:05<00:06, 74.91it/s]
 
483
  47%|β–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 411/869 [00:05<00:05, 78.06it/s]
 
484
  48%|β–ˆβ–ˆβ–ˆβ–ˆβ–Š | 420/869 [00:05<00:05, 79.58it/s]
 
485
  49%|β–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 429/869 [00:05<00:05, 82.14it/s]
 
486
  50%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 438/869 [00:05<00:05, 78.97it/s]
 
487
  51%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 446/869 [00:05<00:05, 76.84it/s]
 
488
  52%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 455/869 [00:05<00:05, 78.31it/s]
 
489
  53%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 463/869 [00:05<00:05, 76.71it/s]
 
490
  54%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 472/869 [00:06<00:04, 80.16it/s]
 
491
  55%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 481/869 [00:06<00:04, 82.89it/s]
 
492
  56%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 490/869 [00:06<00:04, 79.00it/s]
 
493
  57%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 498/869 [00:06<00:04, 78.03it/s]
 
494
  58%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 506/869 [00:06<00:04, 76.31it/s]
 
495
  59%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 514/869 [00:06<00:04, 77.22it/s]
 
496
  60%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 522/869 [00:06<00:04, 72.94it/s]
 
497
  61%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 531/869 [00:06<00:04, 75.43it/s]
 
498
  62%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 539/869 [00:06<00:04, 74.36it/s]
 
499
  63%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 547/869 [00:07<00:04, 73.96it/s]
 
500
  64%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 556/869 [00:07<00:04, 76.54it/s]
 
501
  65%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 564/869 [00:07<00:03, 77.26it/s]
 
502
  66%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 572/869 [00:07<00:03, 75.95it/s]
 
503
  67%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 580/869 [00:07<00:03, 76.49it/s]
 
504
  68%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 588/869 [00:07<00:03, 75.47it/s]
 
505
  69%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 596/869 [00:07<00:03, 75.44it/s]
 
506
  70%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 605/869 [00:07<00:03, 77.26it/s]
 
507
  71%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 613/869 [00:07<00:03, 77.48it/s]
 
508
  71%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 621/869 [00:07<00:03, 77.76it/s]
 
509
  72%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 629/869 [00:08<00:03, 76.20it/s]
 
510
  73%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 637/869 [00:08<00:03, 75.43it/s]
 
511
  74%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 646/869 [00:08<00:02, 79.27it/s]
 
512
  75%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 655/869 [00:08<00:02, 81.10it/s]
 
513
  76%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 664/869 [00:08<00:02, 79.18it/s]
 
514
  77%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 673/869 [00:08<00:02, 81.81it/s]
 
515
  78%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 682/869 [00:08<00:02, 71.77it/s]
 
516
  80%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 691/869 [00:08<00:02, 75.44it/s]
 
517
  80%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 699/869 [00:09<00:02, 76.23it/s]
 
518
  81%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 707/869 [00:09<00:02, 75.84it/s]
 
519
  82%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 716/869 [00:09<00:01, 77.83it/s]
 
520
  83%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 725/869 [00:09<00:01, 79.49it/s]
 
521
  84%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 734/869 [00:09<00:01, 78.92it/s]
 
522
  86%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 743/869 [00:09<00:01, 79.35it/s]
 
523
  86%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 751/869 [00:09<00:01, 77.02it/s]
 
524
  87%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 759/869 [00:09<00:01, 76.52it/s]
 
525
  88%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 767/869 [00:09<00:01, 73.86it/s]
 
526
  89%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 776/869 [00:10<00:01, 70.42it/s]
 
527
  90%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 784/869 [00:10<00:01, 67.63it/s]
 
528
  91%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–| 793/869 [00:10<00:01, 71.94it/s]
 
529
  92%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–| 802/869 [00:10<00:00, 74.63it/s]
 
530
  93%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž| 811/869 [00:10<00:00, 75.43it/s]
 
531
  94%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–| 820/869 [00:10<00:00, 76.33it/s]
 
532
  95%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ| 829/869 [00:10<00:00, 78.65it/s]
 
533
  96%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹| 837/869 [00:10<00:00, 78.27it/s]
 
534
  97%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹| 846/869 [00:10<00:00, 81.27it/s]
 
535
  98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 855/869 [00:11<00:00, 80.86it/s]
 
536
  99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 864/869 [00:11<00:00, 75.54it/s]
537
 
 
538
 
539
  10%|β–ˆ | 435/4350 [02:53<23:47, 2.74it/s]
 
 
540
  [INFO|trainer.py:3503] 2024-09-09 18:55:38,835 >> Saving model checkpoint to /content/dissertation/scripts/ner/output/checkpoint-435
 
 
 
 
 
 
 
541
  10%|β–ˆ | 436/4350 [03:01<7:50:34, 7.21s/it]
542
  10%|β–ˆ | 437/4350 [03:01<5:35:45, 5.15s/it]
543
  10%|β–ˆ | 438/4350 [03:01<4:02:01, 3.71s/it]
544
  10%|β–ˆ | 439/4350 [03:02<2:57:17, 2.72s/it]
545
  10%|β–ˆ | 440/4350 [03:02<2:09:48, 1.99s/it]
546
  10%|β–ˆ | 441/4350 [03:03<1:38:29, 1.51s/it]
547
  10%|β–ˆ | 442/4350 [03:03<1:18:31, 1.21s/it]
548
  10%|β–ˆ | 443/4350 [03:03<1:01:09, 1.06it/s]
549
  10%|β–ˆ | 444/4350 [03:04<49:59, 1.30it/s]
550
  10%|β–ˆ | 445/4350 [03:04<40:43, 1.60it/s]
551
  10%|β–ˆ | 446/4350 [03:04<35:23, 1.84it/s]
552
  10%|β–ˆ | 447/4350 [03:05<33:28, 1.94it/s]
553
  10%|β–ˆ | 448/4350 [03:05<29:08, 2.23it/s]
554
  10%|β–ˆ | 449/4350 [03:06<27:52, 2.33it/s]
555
  10%|β–ˆ | 450/4350 [03:06<27:18, 2.38it/s]
556
  10%|β–ˆ | 451/4350 [03:06<24:21, 2.67it/s]
557
  10%|β–ˆ | 452/4350 [03:07<25:23, 2.56it/s]
558
  10%|β–ˆ | 453/4350 [03:07<24:12, 2.68it/s]
559
  10%|β–ˆ | 454/4350 [03:07<23:27, 2.77it/s]
560
  10%|β–ˆ | 455/4350 [03:08<22:49, 2.84it/s]
561
  10%|β–ˆ | 456/4350 [03:08<22:03, 2.94it/s]
562
  11%|β–ˆ | 457/4350 [03:08<21:56, 2.96it/s]
563
  11%|β–ˆ | 458/4350 [03:09<24:30, 2.65it/s]
564
  11%|β–ˆ | 459/4350 [03:09<23:52, 2.72it/s]
565
  11%|β–ˆ | 460/4350 [03:09<21:48, 2.97it/s]
566
  11%|β–ˆ | 461/4350 [03:10<21:29, 3.02it/s]
567
  11%|β–ˆ | 462/4350 [03:10<19:35, 3.31it/s]
568
  11%|β–ˆ | 463/4350 [03:10<23:36, 2.74it/s]
569
  11%|β–ˆ | 464/4350 [03:11<23:42, 2.73it/s]
570
  11%|β–ˆ | 465/4350 [03:11<21:35, 3.00it/s]
571
  11%|β–ˆ | 466/4350 [03:12<24:19, 2.66it/s]
572
  11%|β–ˆ | 467/4350 [03:12<24:10, 2.68it/s]
573
  11%|β–ˆ | 468/4350 [03:13<31:53, 2.03it/s]
574
  11%|β–ˆ | 469/4350 [03:13<28:07, 2.30it/s]
575
  11%|β–ˆ | 470/4350 [03:13<27:34, 2.34it/s]
576
  11%|β–ˆ | 471/4350 [03:14<27:24, 2.36it/s]
577
  11%|β–ˆ | 472/4350 [03:14<25:31, 2.53it/s]
578
  11%|β–ˆ | 473/4350 [03:14<24:42, 2.61it/s]
579
  11%|β–ˆ | 474/4350 [03:15<24:15, 2.66it/s]
580
  11%|β–ˆ | 475/4350 [03:15<24:13, 2.67it/s]
581
  11%|β–ˆ | 476/4350 [03:16<23:17, 2.77it/s]
582
  11%|β–ˆ | 477/4350 [03:16<24:01, 2.69it/s]
583
  11%|β–ˆ | 478/4350 [03:16<23:05, 2.79it/s]
584
  11%|β–ˆ | 479/4350 [03:17<23:58, 2.69it/s]
585
  11%|β–ˆ | 480/4350 [03:17<24:26, 2.64it/s]
586
  11%|β–ˆ | 481/4350 [03:17<23:26, 2.75it/s]
587
  11%|β–ˆ | 482/4350 [03:18<23:50, 2.70it/s]
588
  11%|β–ˆ | 483/4350 [03:18<23:34, 2.73it/s]
589
  11%|β–ˆ | 484/4350 [03:18<21:50, 2.95it/s]
590
  11%|β–ˆ | 485/4350 [03:19<21:30, 3.00it/s]
591
  11%|β–ˆ | 486/4350 [03:19<24:22, 2.64it/s]
592
  11%|β–ˆ | 487/4350 [03:20<23:37, 2.73it/s]
593
  11%|β–ˆ | 488/4350 [03:20<24:31, 2.62it/s]
594
  11%|β–ˆ | 489/4350 [03:20<24:18, 2.65it/s]
595
  11%|β–ˆβ– | 490/4350 [03:21<24:39, 2.61it/s]
596
  11%|β–ˆβ– | 491/4350 [03:21<23:02, 2.79it/s]
597
  11%|β–ˆβ– | 492/4350 [03:21<22:33, 2.85it/s]
598
  11%|β–ˆβ– | 493/4350 [03:22<22:25, 2.87it/s]
599
  11%|β–ˆβ– | 494/4350 [03:22<22:53, 2.81it/s]
600
  11%|β–ˆβ– | 495/4350 [03:22<20:48, 3.09it/s]
601
  11%|β–ˆβ– | 496/4350 [03:23<22:32, 2.85it/s]
602
  11%|β–ˆβ– | 497/4350 [03:23<22:48, 2.82it/s]
603
  11%|β–ˆβ– | 498/4350 [03:23<22:42, 2.83it/s]
604
  11%|β–ˆβ– | 499/4350 [03:24<21:58, 2.92it/s]
605
  11%|β–ˆβ– | 500/4350 [03:24<22:30, 2.85it/s]
606
 
607
  11%|β–ˆβ– | 500/4350 [03:24<22:30, 2.85it/s]
608
  12%|β–ˆβ– | 501/4350 [03:25<23:41, 2.71it/s]
609
  12%|β–ˆβ– | 502/4350 [03:25<22:51, 2.81it/s]
610
  12%|β–ˆβ– | 503/4350 [03:25<23:39, 2.71it/s]
 
1
+ 2024-09-09 18:51:43.893004: I tensorflow/core/util/port.cc:153] oneDNN custom operations are on. You may see slightly different numerical results due to floating-point round-off errors from different computation orders. To turn them off, set the environment variable `TF_ENABLE_ONEDNN_OPTS=0`.
2
+ 2024-09-09 18:51:43.910950: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:485] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered
3
+ 2024-09-09 18:51:43.932149: E external/local_xla/xla/stream_executor/cuda/cuda_dnn.cc:8454] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered
4
+ 2024-09-09 18:51:43.938564: E external/local_xla/xla/stream_executor/cuda/cuda_blas.cc:1452] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered
5
+ 2024-09-09 18:51:43.953786: I tensorflow/core/platform/cpu_feature_guard.cc:210] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.
6
+ To enable the following instructions: AVX2 AVX512F AVX512_VNNI FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.
7
+ 2024-09-09 18:51:45.193822: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT
8
+ /usr/local/lib/python3.10/dist-packages/transformers/training_args.py:1525: FutureWarning: `evaluation_strategy` is deprecated and will be removed in version 4.46 of πŸ€— Transformers. Use `eval_strategy` instead
9
+ warnings.warn(
10
+ 09/09/2024 18:51:47 - WARNING - __main__ - Process rank: 0, device: cuda:0, n_gpu: 1distributed training: True, 16-bits training: False
11
+ 09/09/2024 18:51:47 - INFO - __main__ - Training/evaluation parameters TrainingArguments(
12
+ _n_gpu=1,
13
+ accelerator_config={'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None, 'use_configured_state': False},
14
+ adafactor=False,
15
+ adam_beta1=0.9,
16
+ adam_beta2=0.999,
17
+ adam_epsilon=1e-08,
18
+ auto_find_batch_size=False,
19
+ batch_eval_metrics=False,
20
+ bf16=False,
21
+ bf16_full_eval=False,
22
+ data_seed=None,
23
+ dataloader_drop_last=False,
24
+ dataloader_num_workers=0,
25
+ dataloader_persistent_workers=False,
26
+ dataloader_pin_memory=True,
27
+ dataloader_prefetch_factor=None,
28
+ ddp_backend=None,
29
+ ddp_broadcast_buffers=None,
30
+ ddp_bucket_cap_mb=None,
31
+ ddp_find_unused_parameters=None,
32
+ ddp_timeout=1800,
33
+ debug=[],
34
+ deepspeed=None,
35
+ disable_tqdm=False,
36
+ dispatch_batches=None,
37
+ do_eval=True,
38
+ do_predict=True,
39
+ do_train=True,
40
+ eval_accumulation_steps=None,
41
+ eval_delay=0,
42
+ eval_do_concat_batches=True,
43
+ eval_on_start=False,
44
+ eval_steps=None,
45
+ eval_strategy=epoch,
46
+ eval_use_gather_object=False,
47
+ evaluation_strategy=epoch,
48
+ fp16=False,
49
+ fp16_backend=auto,
50
+ fp16_full_eval=False,
51
+ fp16_opt_level=O1,
52
+ fsdp=[],
53
+ fsdp_config={'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False},
54
+ fsdp_min_num_params=0,
55
+ fsdp_transformer_layer_cls_to_wrap=None,
56
+ full_determinism=False,
57
+ gradient_accumulation_steps=2,
58
+ gradient_checkpointing=False,
59
+ gradient_checkpointing_kwargs=None,
60
+ greater_is_better=True,
61
+ group_by_length=False,
62
+ half_precision_backend=auto,
63
+ hub_always_push=False,
64
+ hub_model_id=None,
65
+ hub_private_repo=False,
66
+ hub_strategy=every_save,
67
+ hub_token=<HUB_TOKEN>,
68
+ ignore_data_skip=False,
69
+ include_inputs_for_metrics=False,
70
+ include_num_input_tokens_seen=False,
71
+ include_tokens_per_second=False,
72
+ jit_mode_eval=False,
73
+ label_names=None,
74
+ label_smoothing_factor=0.0,
75
+ learning_rate=5e-05,
76
+ length_column_name=length,
77
+ load_best_model_at_end=True,
78
+ local_rank=0,
79
+ log_level=passive,
80
+ log_level_replica=warning,
81
+ log_on_each_node=True,
82
+ logging_dir=/content/dissertation/scripts/ner/output/tb,
83
+ logging_first_step=False,
84
+ logging_nan_inf_filter=True,
85
+ logging_steps=500,
86
+ logging_strategy=steps,
87
+ lr_scheduler_kwargs={},
88
+ lr_scheduler_type=linear,
89
+ max_grad_norm=1.0,
90
+ max_steps=-1,
91
+ metric_for_best_model=f1,
92
+ mp_parameters=,
93
+ neftune_noise_alpha=None,
94
+ no_cuda=False,
95
+ num_train_epochs=10.0,
96
+ optim=adamw_torch,
97
+ optim_args=None,
98
+ optim_target_modules=None,
99
+ output_dir=/content/dissertation/scripts/ner/output,
100
+ overwrite_output_dir=True,
101
+ past_index=-1,
102
+ per_device_eval_batch_size=8,
103
+ per_device_train_batch_size=32,
104
+ prediction_loss_only=False,
105
+ push_to_hub=True,
106
+ push_to_hub_model_id=None,
107
+ push_to_hub_organization=None,
108
+ push_to_hub_token=<PUSH_TO_HUB_TOKEN>,
109
+ ray_scope=last,
110
+ remove_unused_columns=True,
111
+ report_to=['tensorboard'],
112
+ restore_callback_states_from_checkpoint=False,
113
+ resume_from_checkpoint=None,
114
+ run_name=/content/dissertation/scripts/ner/output,
115
+ save_on_each_node=False,
116
+ save_only_model=False,
117
+ save_safetensors=True,
118
+ save_steps=500,
119
+ save_strategy=epoch,
120
+ save_total_limit=None,
121
+ seed=42,
122
+ skip_memory_metrics=True,
123
+ split_batches=None,
124
+ tf32=None,
125
+ torch_compile=False,
126
+ torch_compile_backend=None,
127
+ torch_compile_mode=None,
128
+ torch_empty_cache_steps=None,
129
+ torchdynamo=None,
130
+ tpu_metrics_debug=False,
131
+ tpu_num_cores=None,
132
+ use_cpu=False,
133
+ use_ipex=False,
134
+ use_legacy_prediction_loop=False,
135
+ use_mps_device=False,
136
+ warmup_ratio=0.0,
137
+ warmup_steps=0,
138
+ weight_decay=0.0,
139
+ )
140
+
141
+
142
+
143
+
144
+
145
+
146
+
147
+ [INFO|configuration_utils.py:733] 2024-09-09 18:52:04,045 >> loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--michiyasunaga--BioLinkBERT-base/snapshots/b71f5d70f063d1c8f1124070ce86f1ee463ca1fe/config.json
148
+ [INFO|configuration_utils.py:800] 2024-09-09 18:52:04,054 >> Model config BertConfig {
149
+ "_name_or_path": "michiyasunaga/BioLinkBERT-base",
150
+ "architectures": [
151
+ "BertModel"
152
+ ],
153
+ "attention_probs_dropout_prob": 0.1,
154
+ "classifier_dropout": null,
155
+ "finetuning_task": "ner",
156
+ "gradient_checkpointing": false,
157
+ "hidden_act": "gelu",
158
+ "hidden_dropout_prob": 0.1,
159
+ "hidden_size": 768,
160
+ "id2label": {
161
+ "0": "O",
162
+ "1": "B-FARMACO",
163
+ "2": "I-FARMACO"
164
+ },
165
+ "initializer_range": 0.02,
166
+ "intermediate_size": 3072,
167
+ "label2id": {
168
+ "B-FARMACO": 1,
169
+ "I-FARMACO": 2,
170
+ "O": 0
171
+ },
172
+ "layer_norm_eps": 1e-12,
173
+ "max_position_embeddings": 512,
174
+ "model_type": "bert",
175
+ "num_attention_heads": 12,
176
+ "num_hidden_layers": 12,
177
+ "pad_token_id": 0,
178
+ "position_embedding_type": "absolute",
179
+ "transformers_version": "4.44.2",
180
+ "type_vocab_size": 2,
181
+ "use_cache": true,
182
+ "vocab_size": 28895
183
+ }
184
+
185
+ [INFO|tokenization_utils_base.py:2269] 2024-09-09 18:52:06,645 >> loading file vocab.txt from cache at /root/.cache/huggingface/hub/models--michiyasunaga--BioLinkBERT-base/snapshots/b71f5d70f063d1c8f1124070ce86f1ee463ca1fe/vocab.txt
186
+ [INFO|tokenization_utils_base.py:2269] 2024-09-09 18:52:06,645 >> loading file tokenizer.json from cache at /root/.cache/huggingface/hub/models--michiyasunaga--BioLinkBERT-base/snapshots/b71f5d70f063d1c8f1124070ce86f1ee463ca1fe/tokenizer.json
187
+ [INFO|tokenization_utils_base.py:2269] 2024-09-09 18:52:06,645 >> loading file added_tokens.json from cache at None
188
+ [INFO|tokenization_utils_base.py:2269] 2024-09-09 18:52:06,645 >> loading file special_tokens_map.json from cache at /root/.cache/huggingface/hub/models--michiyasunaga--BioLinkBERT-base/snapshots/b71f5d70f063d1c8f1124070ce86f1ee463ca1fe/special_tokens_map.json
189
+ [INFO|tokenization_utils_base.py:2269] 2024-09-09 18:52:06,645 >> loading file tokenizer_config.json from cache at /root/.cache/huggingface/hub/models--michiyasunaga--BioLinkBERT-base/snapshots/b71f5d70f063d1c8f1124070ce86f1ee463ca1fe/tokenizer_config.json
190
+ /usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884
191
+ warnings.warn(
192
+ [INFO|modeling_utils.py:3678] 2024-09-09 18:52:37,998 >> loading weights file pytorch_model.bin from cache at /root/.cache/huggingface/hub/models--michiyasunaga--BioLinkBERT-base/snapshots/b71f5d70f063d1c8f1124070ce86f1ee463ca1fe/pytorch_model.bin
193
+ [INFO|modeling_utils.py:4497] 2024-09-09 18:52:38,132 >> Some weights of the model checkpoint at michiyasunaga/BioLinkBERT-base were not used when initializing BertForTokenClassification: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight']
194
+ - This IS expected if you are initializing BertForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
195
+ - This IS NOT expected if you are initializing BertForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
196
+ [WARNING|modeling_utils.py:4509] 2024-09-09 18:52:38,132 >> Some weights of BertForTokenClassification were not initialized from the model checkpoint at michiyasunaga/BioLinkBERT-base and are newly initialized: ['classifier.bias', 'classifier.weight']
197
+ You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.
198
+
199
+
200
+
201
+ /content/dissertation/scripts/ner/run_ner_train.py:397: FutureWarning: load_metric is deprecated and will be removed in the next major version of datasets. Use 'evaluate.load' instead, from the new library πŸ€— Evaluate: https://huggingface.co/docs/evaluate
202
+ metric = load_metric("seqeval", trust_remote_code=True)
203
+
204
+ [INFO|trainer.py:811] 2024-09-09 18:52:45,006 >> The following columns in the training set don't have a corresponding argument in `BertForTokenClassification.forward` and have been ignored: tokens, ner_tags, id. If tokens, ner_tags, id are not expected by `BertForTokenClassification.forward`, you can safely ignore this message.
205
+ [INFO|trainer.py:2134] 2024-09-09 18:52:45,659 >> ***** Running training *****
206
+ [INFO|trainer.py:2135] 2024-09-09 18:52:45,659 >> Num examples = 27,841
207
+ [INFO|trainer.py:2136] 2024-09-09 18:52:45,659 >> Num Epochs = 10
208
+ [INFO|trainer.py:2137] 2024-09-09 18:52:45,659 >> Instantaneous batch size per device = 32
209
+ [INFO|trainer.py:2140] 2024-09-09 18:52:45,659 >> Total train batch size (w. parallel, distributed & accumulation) = 64
210
+ [INFO|trainer.py:2141] 2024-09-09 18:52:45,659 >> Gradient Accumulation steps = 2
211
+ [INFO|trainer.py:2142] 2024-09-09 18:52:45,659 >> Total optimization steps = 4,350
212
+ [INFO|trainer.py:2143] 2024-09-09 18:52:45,660 >> Number of trainable parameters = 107,644,419
213
+
214
  0%| | 0/4350 [00:00<?, ?it/s]
215
  0%| | 1/4350 [00:01<2:12:56, 1.83s/it]
216
  0%| | 2/4350 [00:02<1:07:15, 1.08it/s]
217
  0%| | 3/4350 [00:02<45:13, 1.60it/s]
218
  0%| | 4/4350 [00:02<39:57, 1.81it/s]
219
  0%| | 5/4350 [00:03<35:34, 2.04it/s]
220
  0%| | 6/4350 [00:03<33:09, 2.18it/s]
221
  0%| | 7/4350 [00:03<28:41, 2.52it/s]
222
  0%| | 8/4350 [00:04<30:05, 2.40it/s]
223
  0%| | 9/4350 [00:04<29:31, 2.45it/s]
224
  0%| | 10/4350 [00:05<28:23, 2.55it/s]
225
  0%| | 11/4350 [00:05<30:05, 2.40it/s]
226
  0%| | 12/4350 [00:05<29:20, 2.46it/s]
227
  0%| | 13/4350 [00:06<27:44, 2.61it/s]
228
  0%| | 14/4350 [00:06<24:59, 2.89it/s]
229
  0%| | 15/4350 [00:06<24:46, 2.92it/s]
230
  0%| | 16/4350 [00:07<26:04, 2.77it/s]
231
  0%| | 17/4350 [00:07<24:24, 2.96it/s]
232
  0%| | 18/4350 [00:08<27:09, 2.66it/s]
233
  0%| | 19/4350 [00:08<24:24, 2.96it/s]
234
  0%| | 20/4350 [00:08<24:05, 3.00it/s]
235
  0%| | 21/4350 [00:09<30:36, 2.36it/s]
236
  1%| | 22/4350 [00:09<28:18, 2.55it/s]
237
  1%| | 23/4350 [00:09<27:57, 2.58it/s]
238
  1%| | 24/4350 [00:10<26:27, 2.72it/s]
239
  1%| | 25/4350 [00:10<26:40, 2.70it/s]
240
  1%| | 26/4350 [00:10<26:40, 2.70it/s]
241
  1%| | 27/4350 [00:11<24:01, 3.00it/s]
242
  1%| | 28/4350 [00:11<24:02, 3.00it/s]
243
  1%| | 29/4350 [00:11<24:01, 3.00it/s]
244
  1%| | 30/4350 [00:12<23:34, 3.05it/s]
245
  1%| | 31/4350 [00:12<24:18, 2.96it/s]
246
  1%| | 32/4350 [00:12<23:32, 3.06it/s]
247
  1%| | 33/4350 [00:13<24:37, 2.92it/s]
248
  1%| | 34/4350 [00:13<23:50, 3.02it/s]
249
  1%| | 35/4350 [00:13<23:51, 3.01it/s]
250
  1%| | 36/4350 [00:14<24:55, 2.88it/s]
251
  1%| | 37/4350 [00:14<24:01, 2.99it/s]
252
  1%| | 38/4350 [00:14<22:33, 3.19it/s]
253
  1%| | 39/4350 [00:15<25:07, 2.86it/s]
254
  1%| | 40/4350 [00:15<29:00, 2.48it/s]
255
  1%| | 41/4350 [00:16<28:27, 2.52it/s]
256
  1%| | 42/4350 [00:16<28:13, 2.54it/s]
257
  1%| | 43/4350 [00:17<29:44, 2.41it/s]
258
  1%| | 44/4350 [00:17<27:34, 2.60it/s]
259
  1%| | 45/4350 [00:17<28:06, 2.55it/s]
260
  1%| | 46/4350 [00:18<27:16, 2.63it/s]
261
  1%| | 47/4350 [00:18<27:55, 2.57it/s]
262
  1%| | 48/4350 [00:18<26:50, 2.67it/s]
263
  1%| | 49/4350 [00:19<25:00, 2.87it/s]
264
  1%| | 50/4350 [00:19<24:40, 2.90it/s]
265
  1%| | 51/4350 [00:19<25:36, 2.80it/s]
266
  1%| | 52/4350 [00:20<24:53, 2.88it/s]
267
  1%| | 53/4350 [00:20<24:14, 2.95it/s]
268
  1%| | 54/4350 [00:21<28:01, 2.55it/s]
269
  1%|▏ | 55/4350 [00:21<25:47, 2.77it/s]
270
  1%|▏ | 56/4350 [00:21<23:08, 3.09it/s]
271
  1%|▏ | 57/4350 [00:22<26:16, 2.72it/s]
272
  1%|▏ | 58/4350 [00:22<27:50, 2.57it/s]
273
  1%|▏ | 59/4350 [00:22<29:53, 2.39it/s]
274
  1%|▏ | 60/4350 [00:23<28:31, 2.51it/s]
275
  1%|▏ | 61/4350 [00:23<27:04, 2.64it/s]
276
  1%|▏ | 62/4350 [00:23<25:53, 2.76it/s]
277
  1%|▏ | 63/4350 [00:24<26:30, 2.70it/s]
278
  1%|▏ | 64/4350 [00:24<28:35, 2.50it/s]
279
  1%|▏ | 65/4350 [00:25<25:48, 2.77it/s]
280
  2%|▏ | 66/4350 [00:25<25:04, 2.85it/s]
281
  2%|▏ | 67/4350 [00:25<24:52, 2.87it/s]
282
  2%|▏ | 68/4350 [00:26<27:19, 2.61it/s]
283
  2%|▏ | 69/4350 [00:26<25:42, 2.78it/s]
284
  2%|▏ | 70/4350 [00:26<25:14, 2.83it/s]
285
  2%|▏ | 71/4350 [00:27<25:14, 2.82it/s]
286
  2%|▏ | 72/4350 [00:27<23:56, 2.98it/s]
287
  2%|▏ | 73/4350 [00:27<22:54, 3.11it/s]
288
  2%|▏ | 74/4350 [00:28<28:00, 2.55it/s]
289
  2%|▏ | 75/4350 [00:28<26:37, 2.68it/s]
290
  2%|▏ | 76/4350 [00:29<25:57, 2.74it/s]
291
  2%|▏ | 77/4350 [00:29<24:17, 2.93it/s]
292
  2%|▏ | 78/4350 [00:29<24:17, 2.93it/s]
293
  2%|▏ | 79/4350 [00:29<23:24, 3.04it/s]
294
  2%|▏ | 80/4350 [00:30<27:57, 2.55it/s]
295
  2%|▏ | 81/4350 [00:30<27:40, 2.57it/s]
296
  2%|▏ | 82/4350 [00:31<25:47, 2.76it/s]
297
  2%|▏ | 83/4350 [00:31<25:12, 2.82it/s]
298
  2%|▏ | 84/4350 [00:32<28:43, 2.48it/s]
299
  2%|▏ | 85/4350 [00:32<27:43, 2.56it/s]
300
  2%|▏ | 86/4350 [00:32<26:44, 2.66it/s]
301
  2%|▏ | 87/4350 [00:32<23:57, 2.97it/s]
302
  2%|▏ | 88/4350 [00:33<22:46, 3.12it/s]
303
  2%|▏ | 89/4350 [00:33<22:05, 3.22it/s]
304
  2%|▏ | 90/4350 [00:33<23:12, 3.06it/s]
305
  2%|▏ | 91/4350 [00:34<23:42, 2.99it/s]
306
  2%|▏ | 92/4350 [00:34<24:55, 2.85it/s]
307
  2%|▏ | 93/4350 [00:35<25:03, 2.83it/s]
308
  2%|▏ | 94/4350 [00:35<24:31, 2.89it/s]
309
  2%|▏ | 95/4350 [00:35<24:28, 2.90it/s]
310
  2%|▏ | 96/4350 [00:36<25:09, 2.82it/s]
311
  2%|▏ | 97/4350 [00:36<25:18, 2.80it/s]
312
  2%|▏ | 98/4350 [00:36<24:34, 2.88it/s]
313
  2%|▏ | 99/4350 [00:37<23:06, 3.07it/s]
314
  2%|▏ | 100/4350 [00:37<25:02, 2.83it/s]
315
  2%|▏ | 101/4350 [00:37<24:55, 2.84it/s]
316
  2%|▏ | 102/4350 [00:38<26:01, 2.72it/s]
317
  2%|▏ | 103/4350 [00:38<24:38, 2.87it/s]
318
  2%|▏ | 104/4350 [00:38<24:56, 2.84it/s]
319
  2%|▏ | 105/4350 [00:39<24:00, 2.95it/s]
320
  2%|▏ | 106/4350 [00:39<22:39, 3.12it/s]
321
  2%|▏ | 107/4350 [00:39<21:17, 3.32it/s]
322
  2%|▏ | 108/4350 [00:40<21:47, 3.24it/s]
323
  3%|β–Ž | 109/4350 [00:40<21:16, 3.32it/s]
324
  3%|β–Ž | 110/4350 [00:40<22:04, 3.20it/s]
325
  3%|β–Ž | 111/4350 [00:41<22:32, 3.13it/s]
326
  3%|β–Ž | 112/4350 [00:41<21:56, 3.22it/s]
327
  3%|β–Ž | 113/4350 [00:41<23:45, 2.97it/s]
328
  3%|β–Ž | 114/4350 [00:42<26:21, 2.68it/s]
329
  3%|β–Ž | 115/4350 [00:42<24:32, 2.88it/s]
330
  3%|β–Ž | 116/4350 [00:42<23:14, 3.04it/s]
331
  3%|β–Ž | 117/4350 [00:43<23:19, 3.03it/s]
332
  3%|β–Ž | 118/4350 [00:43<22:47, 3.10it/s]
333
  3%|β–Ž | 119/4350 [00:43<23:32, 2.99it/s]
334
  3%|β–Ž | 120/4350 [00:43<21:34, 3.27it/s]
335
  3%|β–Ž | 121/4350 [00:44<22:33, 3.12it/s]
336
  3%|β–Ž | 122/4350 [00:44<24:02, 2.93it/s]
337
  3%|β–Ž | 123/4350 [00:44<22:52, 3.08it/s]
338
  3%|β–Ž | 124/4350 [00:45<23:48, 2.96it/s]
339
  3%|β–Ž | 125/4350 [00:45<23:16, 3.03it/s]
340
  3%|β–Ž | 126/4350 [00:45<22:53, 3.08it/s]
341
  3%|β–Ž | 127/4350 [00:46<24:18, 2.89it/s]
342
  3%|β–Ž | 128/4350 [00:46<27:49, 2.53it/s]
343
  3%|β–Ž | 129/4350 [00:47<26:33, 2.65it/s]
344
  3%|β–Ž | 130/4350 [00:47<27:10, 2.59it/s]
345
  3%|β–Ž | 131/4350 [00:47<25:19, 2.78it/s]
346
  3%|β–Ž | 132/4350 [00:48<25:45, 2.73it/s]
347
  3%|β–Ž | 133/4350 [00:48<29:04, 2.42it/s]
348
  3%|β–Ž | 134/4350 [00:49<29:58, 2.34it/s]
349
  3%|β–Ž | 135/4350 [00:49<31:40, 2.22it/s]
350
  3%|β–Ž | 136/4350 [00:50<30:30, 2.30it/s]
351
  3%|β–Ž | 137/4350 [00:50<27:22, 2.56it/s]
352
  3%|β–Ž | 138/4350 [00:50<25:51, 2.71it/s]
353
  3%|β–Ž | 139/4350 [00:51<26:03, 2.69it/s]
354
  3%|β–Ž | 140/4350 [00:51<24:06, 2.91it/s]
355
  3%|β–Ž | 141/4350 [00:51<23:46, 2.95it/s]
356
  3%|β–Ž | 142/4350 [00:52<22:27, 3.12it/s]
357
  3%|β–Ž | 143/4350 [00:52<22:25, 3.13it/s]
358
  3%|β–Ž | 144/4350 [00:52<21:37, 3.24it/s]
359
  3%|β–Ž | 145/4350 [00:53<24:18, 2.88it/s]
360
  3%|β–Ž | 146/4350 [00:53<22:25, 3.12it/s]
361
  3%|β–Ž | 147/4350 [00:53<21:27, 3.26it/s]
362
  3%|β–Ž | 148/4350 [00:53<21:06, 3.32it/s]
363
  3%|β–Ž | 149/4350 [00:54<23:46, 2.95it/s]
364
  3%|β–Ž | 150/4350 [00:54<24:06, 2.90it/s]
365
  3%|β–Ž | 151/4350 [00:55<24:54, 2.81it/s]
366
  3%|β–Ž | 152/4350 [00:55<23:49, 2.94it/s]
367
  4%|β–Ž | 153/4350 [00:55<25:34, 2.74it/s]
368
  4%|β–Ž | 154/4350 [00:56<24:10, 2.89it/s]
369
  4%|β–Ž | 155/4350 [00:56<24:19, 2.88it/s]
370
  4%|β–Ž | 156/4350 [00:56<23:13, 3.01it/s]
371
  4%|β–Ž | 157/4350 [00:57<25:11, 2.77it/s]
372
  4%|β–Ž | 158/4350 [00:57<24:25, 2.86it/s]
373
  4%|β–Ž | 159/4350 [00:57<23:44, 2.94it/s]
374
  4%|β–Ž | 160/4350 [00:58<22:35, 3.09it/s]
375
  4%|β–Ž | 161/4350 [00:58<22:00, 3.17it/s]
376
  4%|β–Ž | 162/4350 [00:58<22:49, 3.06it/s]
377
  4%|β–Ž | 163/4350 [00:59<26:36, 2.62it/s]
378
  4%|▍ | 164/4350 [00:59<25:37, 2.72it/s]
379
  4%|▍ | 165/4350 [00:59<25:31, 2.73it/s]
380
  4%|▍ | 166/4350 [01:00<26:19, 2.65it/s]
381
  4%|▍ | 167/4350 [01:00<24:27, 2.85it/s]
382
  4%|▍ | 168/4350 [01:00<23:39, 2.95it/s]
383
  4%|▍ | 169/4350 [01:01<22:04, 3.16it/s]
384
  4%|▍ | 170/4350 [01:01<23:16, 2.99it/s]
385
  4%|▍ | 171/4350 [01:02<25:14, 2.76it/s]
386
  4%|▍ | 172/4350 [01:02<25:29, 2.73it/s]
387
  4%|▍ | 173/4350 [01:02<24:27, 2.85it/s]
388
  4%|▍ | 174/4350 [01:03<23:42, 2.93it/s]
389
  4%|▍ | 175/4350 [01:03<25:38, 2.71it/s]
390
  4%|▍ | 176/4350 [01:04<29:19, 2.37it/s]
391
  4%|▍ | 177/4350 [01:04<26:11, 2.66it/s]
392
  4%|▍ | 178/4350 [01:04<25:03, 2.77it/s]
393
  4%|▍ | 179/4350 [01:05<27:02, 2.57it/s]
394
  4%|▍ | 180/4350 [01:05<25:35, 2.72it/s]
395
  4%|▍ | 181/4350 [01:06<30:51, 2.25it/s]
396
  4%|▍ | 182/4350 [01:06<27:49, 2.50it/s]
397
  4%|▍ | 183/4350 [01:06<24:28, 2.84it/s]
398
  4%|▍ | 184/4350 [01:06<23:31, 2.95it/s]
399
  4%|▍ | 185/4350 [01:07<22:51, 3.04it/s]
400
  4%|▍ | 186/4350 [01:07<23:20, 2.97it/s]
401
  4%|▍ | 187/4350 [01:07<23:48, 2.92it/s]
402
  4%|▍ | 188/4350 [01:08<22:44, 3.05it/s]
403
  4%|▍ | 189/4350 [01:08<22:45, 3.05it/s]
404
  4%|▍ | 190/4350 [01:08<23:19, 2.97it/s]
405
  4%|▍ | 191/4350 [01:09<23:47, 2.91it/s]
406
  4%|▍ | 192/4350 [01:09<25:42, 2.70it/s]
407
  4%|▍ | 193/4350 [01:09<24:41, 2.81it/s]
408
  4%|▍ | 194/4350 [01:10<22:46, 3.04it/s]
409
  4%|▍ | 195/4350 [01:10<26:31, 2.61it/s]
410
  5%|▍ | 196/4350 [01:11<26:26, 2.62it/s]
411
  5%|▍ | 197/4350 [01:11<25:04, 2.76it/s]
412
  5%|▍ | 198/4350 [01:11<23:15, 2.98it/s]
413
  5%|▍ | 199/4350 [01:12<23:17, 2.97it/s]
414
  5%|▍ | 200/4350 [01:12<25:40, 2.69it/s]
415
  5%|▍ | 201/4350 [01:12<24:17, 2.85it/s]
416
  5%|▍ | 202/4350 [01:13<23:54, 2.89it/s]
417
  5%|▍ | 203/4350 [01:13<23:43, 2.91it/s]
418
  5%|▍ | 204/4350 [01:13<24:44, 2.79it/s]
419
  5%|▍ | 205/4350 [01:14<24:15, 2.85it/s]
420
  5%|▍ | 206/4350 [01:14<23:12, 2.98it/s]
421
  5%|▍ | 207/4350 [01:14<23:25, 2.95it/s]
422
  5%|▍ | 208/4350 [01:15<26:19, 2.62it/s]
423
  5%|▍ | 209/4350 [01:15<24:53, 2.77it/s]
424
  5%|▍ | 210/4350 [01:15<22:57, 3.01it/s]
425
  5%|▍ | 211/4350 [01:16<24:11, 2.85it/s]
426
  5%|▍ | 212/4350 [01:16<22:46, 3.03it/s]
427
  5%|▍ | 213/4350 [01:16<23:04, 2.99it/s]
428
  5%|▍ | 214/4350 [01:17<29:05, 2.37it/s]
429
  5%|▍ | 215/4350 [01:17<27:47, 2.48it/s]
430
  5%|▍ | 216/4350 [01:18<27:23, 2.52it/s]
431
  5%|▍ | 217/4350 [01:18<25:58, 2.65it/s]
432
  5%|β–Œ | 218/4350 [01:18<24:47, 2.78it/s]
433
  5%|β–Œ | 219/4350 [01:19<27:15, 2.53it/s]
434
  5%|β–Œ | 220/4350 [01:19<27:40, 2.49it/s]
435
  5%|β–Œ | 221/4350 [01:20<28:06, 2.45it/s]
436
  5%|β–Œ | 222/4350 [01:20<26:57, 2.55it/s]
437
  5%|β–Œ | 223/4350 [01:21<28:14, 2.44it/s]
438
  5%|β–Œ | 224/4350 [01:21<28:53, 2.38it/s]
439
  5%|β–Œ | 225/4350 [01:21<29:20, 2.34it/s]
440
  5%|β–Œ | 226/4350 [01:22<27:47, 2.47it/s]
441
  5%|β–Œ | 227/4350 [01:22<26:55, 2.55it/s]
442
  5%|β–Œ | 228/4350 [01:23<25:30, 2.69it/s]
443
  5%|β–Œ | 229/4350 [01:23<23:06, 2.97it/s]
444
  5%|β–Œ | 230/4350 [01:23<22:14, 3.09it/s]
445
  5%|β–Œ | 231/4350 [01:23<23:09, 2.97it/s]
446
  5%|β–Œ | 232/4350 [01:24<23:03, 2.98it/s]
447
  5%|β–Œ | 233/4350 [01:24<22:17, 3.08it/s]
448
  5%|β–Œ | 234/4350 [01:24<23:21, 2.94it/s]
449
  5%|β–Œ | 235/4350 [01:25<23:27, 2.92it/s]
450
  5%|β–Œ | 236/4350 [01:25<23:20, 2.94it/s]
451
  5%|β–Œ | 237/4350 [01:25<22:38, 3.03it/s]
452
  5%|β–Œ | 238/4350 [01:26<21:16, 3.22it/s]
453
  5%|β–Œ | 239/4350 [01:26<27:58, 2.45it/s]
454
  6%|β–Œ | 240/4350 [01:27<26:00, 2.63it/s]
455
  6%|β–Œ | 241/4350 [01:27<23:48, 2.88it/s]
456
  6%|β–Œ | 242/4350 [01:27<26:38, 2.57it/s]
457
  6%|β–Œ | 243/4350 [01:28<25:21, 2.70it/s]
458
  6%|β–Œ | 244/4350 [01:28<29:04, 2.35it/s]
459
  6%|β–Œ | 245/4350 [01:29<28:52, 2.37it/s]
460
  6%|β–Œ | 246/4350 [01:29<29:27, 2.32it/s]
461
  6%|β–Œ | 247/4350 [01:30<28:08, 2.43it/s]
462
  6%|β–Œ | 248/4350 [01:30<27:08, 2.52it/s]
463
  6%|β–Œ | 249/4350 [01:30<27:43, 2.46it/s]
464
  6%|β–Œ | 250/4350 [01:31<26:32, 2.57it/s]
465
  6%|β–Œ | 251/4350 [01:31<26:18, 2.60it/s]
466
  6%|β–Œ | 252/4350 [01:31<26:35, 2.57it/s]
467
  6%|β–Œ | 253/4350 [01:32<24:08, 2.83it/s]
468
  6%|β–Œ | 254/4350 [01:32<22:32, 3.03it/s]
469
  6%|β–Œ | 255/4350 [01:32<22:46, 3.00it/s]
470
  6%|β–Œ | 256/4350 [01:33<22:59, 2.97it/s]
471
  6%|β–Œ | 257/4350 [01:33<25:40, 2.66it/s]
472
  6%|β–Œ | 258/4350 [01:34<29:38, 2.30it/s]
473
  6%|β–Œ | 259/4350 [01:34<27:20, 2.49it/s]
474
  6%|β–Œ | 260/4350 [01:34<28:15, 2.41it/s]
475
  6%|β–Œ | 261/4350 [01:35<27:24, 2.49it/s]
476
  6%|β–Œ | 262/4350 [01:35<26:03, 2.61it/s]
477
  6%|β–Œ | 263/4350 [01:36<26:28, 2.57it/s]
478
  6%|β–Œ | 264/4350 [01:36<23:58, 2.84it/s]
479
  6%|β–Œ | 265/4350 [01:36<23:33, 2.89it/s]
480
  6%|β–Œ | 266/4350 [01:37<23:12, 2.93it/s]
481
  6%|β–Œ | 267/4350 [01:37<23:00, 2.96it/s]
482
  6%|β–Œ | 268/4350 [01:37<23:03, 2.95it/s]
483
  6%|β–Œ | 269/4350 [01:37<20:59, 3.24it/s]
484
  6%|β–Œ | 270/4350 [01:38<22:08, 3.07it/s]
485
  6%|β–Œ | 271/4350 [01:38<23:17, 2.92it/s]
486
  6%|β–‹ | 272/4350 [01:38<22:17, 3.05it/s]
487
  6%|β–‹ | 273/4350 [01:39<22:14, 3.06it/s]
488
  6%|β–‹ | 274/4350 [01:39<22:00, 3.09it/s]
489
  6%|β–‹ | 275/4350 [01:39<23:06, 2.94it/s]
490
  6%|β–‹ | 276/4350 [01:40<22:26, 3.02it/s]
491
  6%|β–‹ | 277/4350 [01:40<21:32, 3.15it/s]
492
  6%|β–‹ | 278/4350 [01:41<24:22, 2.78it/s]
493
  6%|β–‹ | 279/4350 [01:41<23:27, 2.89it/s]
494
  6%|β–‹ | 280/4350 [01:41<22:21, 3.03it/s]
495
  6%|β–‹ | 281/4350 [01:41<22:36, 3.00it/s]
496
  6%|β–‹ | 282/4350 [01:42<21:42, 3.12it/s]
497
  7%|β–‹ | 283/4350 [01:42<21:10, 3.20it/s]
498
  7%|β–‹ | 284/4350 [01:42<21:09, 3.20it/s]
499
  7%|β–‹ | 285/4350 [01:43<21:50, 3.10it/s]
500
  7%|β–‹ | 286/4350 [01:43<25:09, 2.69it/s]
501
  7%|β–‹ | 287/4350 [01:44<25:34, 2.65it/s]
502
  7%|β–‹ | 288/4350 [01:44<25:56, 2.61it/s]
503
  7%|β–‹ | 289/4350 [01:44<24:41, 2.74it/s]
504
  7%|β–‹ | 290/4350 [01:45<26:16, 2.58it/s]
505
  7%|β–‹ | 291/4350 [01:45<27:35, 2.45it/s]
506
  7%|β–‹ | 292/4350 [01:46<25:57, 2.60it/s]
507
  7%|β–‹ | 293/4350 [01:46<28:13, 2.40it/s]
508
  7%|β–‹ | 294/4350 [01:46<25:55, 2.61it/s]
509
  7%|β–‹ | 295/4350 [01:47<25:00, 2.70it/s]
510
  7%|β–‹ | 296/4350 [01:47<24:25, 2.77it/s]
511
  7%|β–‹ | 297/4350 [01:47<25:04, 2.69it/s]
512
  7%|β–‹ | 298/4350 [01:48<23:36, 2.86it/s]
513
  7%|β–‹ | 299/4350 [01:48<25:33, 2.64it/s]
514
  7%|β–‹ | 300/4350 [01:49<27:17, 2.47it/s]
515
  7%|β–‹ | 301/4350 [01:49<27:11, 2.48it/s]
516
  7%|β–‹ | 302/4350 [01:49<27:24, 2.46it/s]
517
  7%|β–‹ | 303/4350 [01:50<25:35, 2.64it/s]
518
  7%|β–‹ | 304/4350 [01:50<24:47, 2.72it/s]
519
  7%|β–‹ | 305/4350 [01:50<25:02, 2.69it/s]
520
  7%|β–‹ | 306/4350 [01:51<24:32, 2.75it/s]
521
  7%|β–‹ | 307/4350 [01:51<27:04, 2.49it/s]
522
  7%|β–‹ | 308/4350 [01:52<25:18, 2.66it/s]
523
  7%|β–‹ | 309/4350 [01:52<25:37, 2.63it/s]
524
  7%|β–‹ | 310/4350 [01:52<25:13, 2.67it/s]
525
  7%|β–‹ | 311/4350 [01:53<23:19, 2.89it/s]
526
  7%|β–‹ | 312/4350 [01:53<23:13, 2.90it/s]
527
  7%|β–‹ | 313/4350 [01:53<24:41, 2.73it/s]
528
  7%|β–‹ | 314/4350 [01:54<22:47, 2.95it/s]
529
  7%|β–‹ | 315/4350 [01:54<22:39, 2.97it/s]
530
  7%|β–‹ | 316/4350 [01:54<22:45, 2.95it/s]
531
  7%|β–‹ | 317/4350 [01:55<21:31, 3.12it/s]
532
  7%|β–‹ | 318/4350 [01:55<22:18, 3.01it/s]
533
  7%|β–‹ | 319/4350 [01:55<21:27, 3.13it/s]
534
  7%|β–‹ | 320/4350 [01:56<21:30, 3.12it/s]
535
  7%|β–‹ | 321/4350 [01:56<23:32, 2.85it/s]
536
  7%|β–‹ | 322/4350 [01:56<21:24, 3.14it/s]
537
  7%|β–‹ | 323/4350 [01:57<23:29, 2.86it/s]
538
  7%|β–‹ | 324/4350 [01:57<23:12, 2.89it/s]
539
  7%|β–‹ | 325/4350 [01:57<22:36, 2.97it/s]
540
  7%|β–‹ | 326/4350 [01:58<23:16, 2.88it/s]
541
  8%|β–Š | 327/4350 [01:58<22:11, 3.02it/s]
542
  8%|β–Š | 328/4350 [01:58<21:27, 3.12it/s]
543
  8%|β–Š | 329/4350 [01:59<23:33, 2.84it/s]
544
  8%|β–Š | 330/4350 [01:59<23:29, 2.85it/s]
545
  8%|β–Š | 331/4350 [02:00<26:59, 2.48it/s]
546
  8%|β–Š | 332/4350 [02:00<27:55, 2.40it/s]
547
  8%|β–Š | 333/4350 [02:00<27:01, 2.48it/s]
548
  8%|β–Š | 334/4350 [02:01<30:38, 2.18it/s]
549
  8%|οΏ½οΏ½ | 335/4350 [02:01<29:04, 2.30it/s]
550
  8%|β–Š | 336/4350 [02:02<27:30, 2.43it/s]
551
  8%|β–Š | 337/4350 [02:02<25:57, 2.58it/s]
552
  8%|β–Š | 338/4350 [02:02<24:12, 2.76it/s]
553
  8%|β–Š | 339/4350 [02:03<23:21, 2.86it/s]
554
  8%|β–Š | 340/4350 [02:03<22:35, 2.96it/s]
555
  8%|β–Š | 341/4350 [02:03<21:15, 3.14it/s]
556
  8%|β–Š | 342/4350 [02:04<20:49, 3.21it/s]
557
  8%|β–Š | 343/4350 [02:04<21:41, 3.08it/s]
558
  8%|β–Š | 344/4350 [02:04<23:57, 2.79it/s]
559
  8%|β–Š | 345/4350 [02:05<28:34, 2.34it/s]
560
  8%|β–Š | 346/4350 [02:05<25:49, 2.58it/s]
561
  8%|β–Š | 347/4350 [02:06<27:21, 2.44it/s]
562
  8%|β–Š | 348/4350 [02:06<25:58, 2.57it/s]
563
  8%|β–Š | 349/4350 [02:06<24:03, 2.77it/s]
564
  8%|β–Š | 350/4350 [02:07<23:20, 2.86it/s]
565
  8%|β–Š | 351/4350 [02:07<23:17, 2.86it/s]
566
  8%|β–Š | 352/4350 [02:07<22:07, 3.01it/s]
567
  8%|β–Š | 353/4350 [02:08<22:21, 2.98it/s]
568
  8%|β–Š | 354/4350 [02:09<35:49, 1.86it/s]
569
  8%|β–Š | 355/4350 [02:09<30:43, 2.17it/s]
570
  8%|β–Š | 356/4350 [02:09<30:27, 2.19it/s]
571
  8%|β–Š | 357/4350 [02:10<28:53, 2.30it/s]
572
  8%|β–Š | 358/4350 [02:10<25:42, 2.59it/s]
573
  8%|β–Š | 359/4350 [02:10<24:35, 2.70it/s]
574
  8%|β–Š | 360/4350 [02:11<25:09, 2.64it/s]
575
  8%|β–Š | 361/4350 [02:11<24:13, 2.74it/s]
576
  8%|β–Š | 362/4350 [02:11<21:52, 3.04it/s]
577
  8%|β–Š | 363/4350 [02:12<20:15, 3.28it/s]
578
  8%|β–Š | 364/4350 [02:12<20:00, 3.32it/s]
579
  8%|β–Š | 365/4350 [02:12<21:02, 3.16it/s]
580
  8%|β–Š | 366/4350 [02:13<23:22, 2.84it/s]
581
  8%|β–Š | 367/4350 [02:13<22:17, 2.98it/s]
582
  8%|β–Š | 368/4350 [02:13<23:41, 2.80it/s]
583
  8%|β–Š | 369/4350 [02:14<23:06, 2.87it/s]
584
  9%|β–Š | 370/4350 [02:14<22:09, 2.99it/s]
585
  9%|β–Š | 371/4350 [02:14<22:07, 3.00it/s]
586
  9%|β–Š | 372/4350 [02:15<22:35, 2.93it/s]
587
  9%|β–Š | 373/4350 [02:15<21:52, 3.03it/s]
588
  9%|β–Š | 374/4350 [02:15<21:59, 3.01it/s]
589
  9%|β–Š | 375/4350 [02:16<25:02, 2.65it/s]
590
  9%|β–Š | 376/4350 [02:16<24:11, 2.74it/s]
591
  9%|β–Š | 377/4350 [02:17<23:32, 2.81it/s]
592
  9%|β–Š | 378/4350 [02:17<25:04, 2.64it/s]
593
  9%|β–Š | 379/4350 [02:17<24:13, 2.73it/s]
594
  9%|β–Š | 380/4350 [02:18<23:19, 2.84it/s]
595
  9%|β–‰ | 381/4350 [02:18<23:19, 2.84it/s]
596
  9%|β–‰ | 382/4350 [02:19<29:36, 2.23it/s]
597
  9%|β–‰ | 383/4350 [02:19<26:13, 2.52it/s]
598
  9%|β–‰ | 384/4350 [02:19<24:14, 2.73it/s]
599
  9%|β–‰ | 385/4350 [02:20<23:46, 2.78it/s]
600
  9%|β–‰ | 386/4350 [02:20<23:44, 2.78it/s]
601
  9%|β–‰ | 387/4350 [02:20<22:23, 2.95it/s]
602
  9%|β–‰ | 388/4350 [02:21<24:09, 2.73it/s]
603
  9%|β–‰ | 389/4350 [02:21<23:41, 2.79it/s]
604
  9%|β–‰ | 390/4350 [02:21<23:05, 2.86it/s]
605
  9%|β–‰ | 391/4350 [02:22<22:52, 2.88it/s]
606
  9%|β–‰ | 392/4350 [02:22<25:23, 2.60it/s]
607
  9%|β–‰ | 393/4350 [02:22<25:05, 2.63it/s]
608
  9%|β–‰ | 394/4350 [02:23<28:17, 2.33it/s]
609
  9%|β–‰ | 395/4350 [02:23<25:13, 2.61it/s]
610
  9%|β–‰ | 396/4350 [02:24<24:46, 2.66it/s]
611
  9%|β–‰ | 397/4350 [02:24<22:36, 2.91it/s]
612
  9%|β–‰ | 398/4350 [02:24<22:50, 2.88it/s]
613
  9%|β–‰ | 399/4350 [02:25<21:20, 3.08it/s]
614
  9%|β–‰ | 400/4350 [02:25<23:47, 2.77it/s]
615
  9%|β–‰ | 401/4350 [02:25<24:01, 2.74it/s]
616
  9%|β–‰ | 402/4350 [02:26<25:20, 2.60it/s]
617
  9%|β–‰ | 403/4350 [02:26<24:42, 2.66it/s]
618
  9%|β–‰ | 404/4350 [02:27<25:01, 2.63it/s]
619
  9%|β–‰ | 405/4350 [02:27<24:06, 2.73it/s]
620
  9%|β–‰ | 406/4350 [02:27<27:45, 2.37it/s]
621
  9%|β–‰ | 407/4350 [02:28<28:05, 2.34it/s]
622
  9%|β–‰ | 408/4350 [02:28<26:08, 2.51it/s]
623
  9%|β–‰ | 409/4350 [02:29<24:42, 2.66it/s]
624
  9%|β–‰ | 410/4350 [02:29<22:44, 2.89it/s]
625
  9%|β–‰ | 411/4350 [02:29<23:51, 2.75it/s]
626
  9%|β–‰ | 412/4350 [02:30<25:09, 2.61it/s]
627
  9%|β–‰ | 413/4350 [02:30<24:44, 2.65it/s]
628
  10%|β–‰ | 414/4350 [02:30<26:31, 2.47it/s]
629
  10%|β–‰ | 415/4350 [02:31<25:38, 2.56it/s]
630
  10%|β–‰ | 416/4350 [02:31<24:27, 2.68it/s]
631
  10%|β–‰ | 417/4350 [02:32<23:39, 2.77it/s]
632
  10%|β–‰ | 418/4350 [02:32<22:29, 2.91it/s]
633
  10%|β–‰ | 419/4350 [02:32<21:39, 3.02it/s]
634
  10%|β–‰ | 420/4350 [02:32<20:19, 3.22it/s]
635
  10%|β–‰ | 421/4350 [02:33<22:56, 2.85it/s]
636
  10%|β–‰ | 422/4350 [02:33<22:42, 2.88it/s]
637
  10%|β–‰ | 423/4350 [02:33<21:38, 3.03it/s]
638
  10%|β–‰ | 424/4350 [02:34<21:37, 3.03it/s]
639
  10%|β–‰ | 425/4350 [02:34<22:14, 2.94it/s]
640
  10%|β–‰ | 426/4350 [02:35<23:22, 2.80it/s]
641
  10%|β–‰ | 427/4350 [02:35<22:52, 2.86it/s]
642
  10%|β–‰ | 428/4350 [02:35<22:34, 2.89it/s]
643
  10%|β–‰ | 429/4350 [02:36<22:35, 2.89it/s]
644
  10%|β–‰ | 430/4350 [02:36<21:47, 3.00it/s]
645
  10%|β–‰ | 431/4350 [02:36<21:10, 3.09it/s]
646
  10%|β–‰ | 432/4350 [02:37<21:57, 2.97it/s]
647
  10%|β–‰ | 433/4350 [02:37<21:35, 3.02it/s]
648
  10%|β–‰ | 434/4350 [02:37<20:41, 3.15it/s]
649
  10%|β–ˆ | 435/4350 [02:38<23:47, 2.74it/s][INFO|trainer.py:811] 2024-09-09 18:55:23,830 >> The following columns in the evaluation set don't have a corresponding argument in `BertForTokenClassification.forward` and have been ignored: tokens, ner_tags, id. If tokens, ner_tags, id are not expected by `BertForTokenClassification.forward`, you can safely ignore this message.
650
+ [INFO|trainer.py:3819] 2024-09-09 18:55:23,833 >>
651
+ ***** Running Evaluation *****
652
+ [INFO|trainer.py:3821] 2024-09-09 18:55:23,833 >> Num examples = 6946
653
+ [INFO|trainer.py:3824] 2024-09-09 18:55:23,833 >> Batch size = 8
654
+
655
+
656
  0%| | 0/869 [00:00<?, ?it/s]
657
+
658
  1%| | 10/869 [00:00<00:09, 93.25it/s]
659
+
660
  2%|▏ | 20/869 [00:00<00:10, 81.05it/s]
661
+
662
  3%|β–Ž | 29/869 [00:00<00:10, 78.93it/s]
663
+
664
  4%|▍ | 37/869 [00:00<00:10, 76.51it/s]
665
+
666
  5%|β–Œ | 46/869 [00:00<00:10, 80.40it/s]
667
+
668
  6%|β–‹ | 55/869 [00:00<00:09, 82.80it/s]
669
+
670
  7%|β–‹ | 64/869 [00:00<00:10, 77.85it/s]
671
+
672
  8%|β–Š | 72/869 [00:00<00:10, 76.99it/s]
673
+
674
  9%|β–‰ | 82/869 [00:01<00:09, 81.30it/s]
675
+
676
  11%|β–ˆ | 92/869 [00:01<00:09, 84.77it/s]
677
+
678
  12%|β–ˆβ– | 102/869 [00:01<00:08, 86.85it/s]
679
+
680
  13%|β–ˆβ–Ž | 111/869 [00:01<00:08, 84.28it/s]
681
+
682
  14%|β–ˆβ– | 120/869 [00:01<00:09, 82.94it/s]
683
+
684
  15%|β–ˆβ– | 129/869 [00:01<00:09, 80.32it/s]
685
+
686
  16%|β–ˆβ–Œ | 139/869 [00:01<00:08, 83.08it/s]
687
+
688
  17%|β–ˆβ–‹ | 148/869 [00:01<00:09, 78.75it/s]
689
+
690
  18%|β–ˆβ–Š | 157/869 [00:01<00:09, 78.73it/s]
691
+
692
  19%|β–ˆβ–‰ | 166/869 [00:02<00:08, 78.19it/s]
693
+
694
  20%|β–ˆβ–ˆ | 175/869 [00:02<00:08, 79.26it/s]
695
+
696
  21%|β–ˆβ–ˆ | 183/869 [00:02<00:08, 78.09it/s]
697
+
698
  22%|β–ˆβ–ˆβ– | 191/869 [00:02<00:08, 76.37it/s]
699
+
700
  23%|β–ˆβ–ˆβ–Ž | 199/869 [00:02<00:08, 76.97it/s]
701
+
702
  24%|β–ˆβ–ˆβ– | 208/869 [00:02<00:08, 78.45it/s]
703
+
704
  25%|β–ˆβ–ˆβ–Œ | 218/869 [00:02<00:07, 82.86it/s]
705
+
706
  26%|β–ˆβ–ˆβ–Œ | 227/869 [00:02<00:07, 83.20it/s]
707
+
708
  27%|β–ˆβ–ˆβ–‹ | 236/869 [00:02<00:08, 76.92it/s]
709
+
710
  28%|β–ˆβ–ˆβ–Š | 244/869 [00:03<00:08, 71.08it/s]
711
+
712
  29%|β–ˆβ–ˆβ–‰ | 253/869 [00:03<00:08, 75.15it/s]
713
+
714
  30%|β–ˆβ–ˆβ–ˆ | 262/869 [00:03<00:07, 76.76it/s]
715
+
716
  31%|β–ˆβ–ˆβ–ˆ | 270/869 [00:03<00:07, 74.97it/s]
717
+
718
  32%|β–ˆβ–ˆβ–ˆβ– | 278/869 [00:03<00:07, 74.44it/s]
719
+
720
  33%|β–ˆβ–ˆβ–ˆβ–Ž | 286/869 [00:03<00:07, 74.34it/s]
721
+
722
  34%|β–ˆβ–ˆβ–ˆβ– | 294/869 [00:03<00:07, 75.42it/s]
723
+
724
  35%|β–ˆβ–ˆβ–ˆβ– | 302/869 [00:03<00:07, 72.74it/s]
725
+
726
  36%|β–ˆβ–ˆβ–ˆβ–Œ | 310/869 [00:03<00:07, 74.05it/s]
727
+
728
  37%|β–ˆβ–ˆβ–ˆβ–‹ | 318/869 [00:04<00:07, 73.18it/s]
729
+
730
  38%|β–ˆβ–ˆβ–ˆβ–Š | 326/869 [00:04<00:07, 74.32it/s]
731
+
732
  39%|β–ˆβ–ˆβ–ˆβ–Š | 335/869 [00:04<00:06, 78.23it/s]
733
+
734
  39%|β–ˆβ–ˆβ–ˆβ–‰ | 343/869 [00:04<00:06, 75.35it/s]
735
+
736
  40%|β–ˆβ–ˆβ–ˆβ–ˆ | 351/869 [00:04<00:06, 74.42it/s]
737
+
738
  41%|β–ˆβ–ˆβ–ˆβ–ˆβ– | 360/869 [00:04<00:06, 77.90it/s]
739
+
740
  42%|β–ˆβ–ˆβ–ˆβ–ˆβ– | 369/869 [00:04<00:06, 79.65it/s]
741
+
742
  43%|β–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 377/869 [00:04<00:06, 76.71it/s]
743
+
744
  44%|β–ˆβ–ˆβ–ˆβ–ˆβ– | 385/869 [00:04<00:06, 75.81it/s]
745
+
746
  45%|β–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 393/869 [00:05<00:06, 72.15it/s]
747
+
748
  46%|β–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 402/869 [00:05<00:06, 74.91it/s]
749
+
750
  47%|β–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 411/869 [00:05<00:05, 78.06it/s]
751
+
752
  48%|β–ˆβ–ˆβ–ˆβ–ˆβ–Š | 420/869 [00:05<00:05, 79.58it/s]
753
+
754
  49%|β–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 429/869 [00:05<00:05, 82.14it/s]
755
+
756
  50%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 438/869 [00:05<00:05, 78.97it/s]
757
+
758
  51%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 446/869 [00:05<00:05, 76.84it/s]
759
+
760
  52%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 455/869 [00:05<00:05, 78.31it/s]
761
+
762
  53%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 463/869 [00:05<00:05, 76.71it/s]
763
+
764
  54%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 472/869 [00:06<00:04, 80.16it/s]
765
+
766
  55%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 481/869 [00:06<00:04, 82.89it/s]
767
+
768
  56%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 490/869 [00:06<00:04, 79.00it/s]
769
+
770
  57%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 498/869 [00:06<00:04, 78.03it/s]
771
+
772
  58%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 506/869 [00:06<00:04, 76.31it/s]
773
+
774
  59%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 514/869 [00:06<00:04, 77.22it/s]
775
+
776
  60%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 522/869 [00:06<00:04, 72.94it/s]
777
+
778
  61%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 531/869 [00:06<00:04, 75.43it/s]
779
+
780
  62%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 539/869 [00:06<00:04, 74.36it/s]
781
+
782
  63%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 547/869 [00:07<00:04, 73.96it/s]
783
+
784
  64%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 556/869 [00:07<00:04, 76.54it/s]
785
+
786
  65%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 564/869 [00:07<00:03, 77.26it/s]
787
+
788
  66%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 572/869 [00:07<00:03, 75.95it/s]
789
+
790
  67%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 580/869 [00:07<00:03, 76.49it/s]
791
+
792
  68%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 588/869 [00:07<00:03, 75.47it/s]
793
+
794
  69%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 596/869 [00:07<00:03, 75.44it/s]
795
+
796
  70%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 605/869 [00:07<00:03, 77.26it/s]
797
+
798
  71%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 613/869 [00:07<00:03, 77.48it/s]
799
+
800
  71%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 621/869 [00:07<00:03, 77.76it/s]
801
+
802
  72%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 629/869 [00:08<00:03, 76.20it/s]
803
+
804
  73%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 637/869 [00:08<00:03, 75.43it/s]
805
+
806
  74%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 646/869 [00:08<00:02, 79.27it/s]
807
+
808
  75%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 655/869 [00:08<00:02, 81.10it/s]
809
+
810
  76%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 664/869 [00:08<00:02, 79.18it/s]
811
+
812
  77%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 673/869 [00:08<00:02, 81.81it/s]
813
+
814
  78%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 682/869 [00:08<00:02, 71.77it/s]
815
+
816
  80%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 691/869 [00:08<00:02, 75.44it/s]
817
+
818
  80%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 699/869 [00:09<00:02, 76.23it/s]
819
+
820
  81%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 707/869 [00:09<00:02, 75.84it/s]
821
+
822
  82%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 716/869 [00:09<00:01, 77.83it/s]
823
+
824
  83%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 725/869 [00:09<00:01, 79.49it/s]
825
+
826
  84%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 734/869 [00:09<00:01, 78.92it/s]
827
+
828
  86%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 743/869 [00:09<00:01, 79.35it/s]
829
+
830
  86%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 751/869 [00:09<00:01, 77.02it/s]
831
+
832
  87%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 759/869 [00:09<00:01, 76.52it/s]
833
+
834
  88%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 767/869 [00:09<00:01, 73.86it/s]
835
+
836
  89%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 776/869 [00:10<00:01, 70.42it/s]
837
+
838
  90%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 784/869 [00:10<00:01, 67.63it/s]
839
+
840
  91%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–| 793/869 [00:10<00:01, 71.94it/s]
841
+
842
  92%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–| 802/869 [00:10<00:00, 74.63it/s]
843
+
844
  93%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž| 811/869 [00:10<00:00, 75.43it/s]
845
+
846
  94%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–| 820/869 [00:10<00:00, 76.33it/s]
847
+
848
  95%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ| 829/869 [00:10<00:00, 78.65it/s]
849
+
850
  96%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹| 837/869 [00:10<00:00, 78.27it/s]
851
+
852
  97%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹| 846/869 [00:10<00:00, 81.27it/s]
853
+
854
  98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 855/869 [00:11<00:00, 80.86it/s]
855
+
856
  99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 864/869 [00:11<00:00, 75.54it/s]
857
 
858
+
859
 
860
  10%|β–ˆ | 435/4350 [02:53<23:47, 2.74it/s]
861
+
862
+
863
  [INFO|trainer.py:3503] 2024-09-09 18:55:38,835 >> Saving model checkpoint to /content/dissertation/scripts/ner/output/checkpoint-435
864
+ [INFO|configuration_utils.py:472] 2024-09-09 18:55:38,837 >> Configuration saved in /content/dissertation/scripts/ner/output/checkpoint-435/config.json
865
+ [INFO|modeling_utils.py:2799] 2024-09-09 18:55:39,714 >> Model weights saved in /content/dissertation/scripts/ner/output/checkpoint-435/model.safetensors
866
+ [INFO|tokenization_utils_base.py:2684] 2024-09-09 18:55:39,715 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/checkpoint-435/tokenizer_config.json
867
+ [INFO|tokenization_utils_base.py:2693] 2024-09-09 18:55:39,716 >> Special tokens file saved in /content/dissertation/scripts/ner/output/checkpoint-435/special_tokens_map.json
868
+ [INFO|tokenization_utils_base.py:2684] 2024-09-09 18:55:46,753 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/tokenizer_config.json
869
+ [INFO|tokenization_utils_base.py:2693] 2024-09-09 18:55:46,753 >> Special tokens file saved in /content/dissertation/scripts/ner/output/special_tokens_map.json
870
+
871
  10%|β–ˆ | 436/4350 [03:01<7:50:34, 7.21s/it]
872
  10%|β–ˆ | 437/4350 [03:01<5:35:45, 5.15s/it]
873
  10%|β–ˆ | 438/4350 [03:01<4:02:01, 3.71s/it]
874
  10%|β–ˆ | 439/4350 [03:02<2:57:17, 2.72s/it]
875
  10%|β–ˆ | 440/4350 [03:02<2:09:48, 1.99s/it]
876
  10%|β–ˆ | 441/4350 [03:03<1:38:29, 1.51s/it]
877
  10%|β–ˆ | 442/4350 [03:03<1:18:31, 1.21s/it]
878
  10%|β–ˆ | 443/4350 [03:03<1:01:09, 1.06it/s]
879
  10%|β–ˆ | 444/4350 [03:04<49:59, 1.30it/s]
880
  10%|β–ˆ | 445/4350 [03:04<40:43, 1.60it/s]
881
  10%|β–ˆ | 446/4350 [03:04<35:23, 1.84it/s]
882
  10%|β–ˆ | 447/4350 [03:05<33:28, 1.94it/s]
883
  10%|β–ˆ | 448/4350 [03:05<29:08, 2.23it/s]
884
  10%|β–ˆ | 449/4350 [03:06<27:52, 2.33it/s]
885
  10%|β–ˆ | 450/4350 [03:06<27:18, 2.38it/s]
886
  10%|β–ˆ | 451/4350 [03:06<24:21, 2.67it/s]
887
  10%|β–ˆ | 452/4350 [03:07<25:23, 2.56it/s]
888
  10%|β–ˆ | 453/4350 [03:07<24:12, 2.68it/s]
889
  10%|β–ˆ | 454/4350 [03:07<23:27, 2.77it/s]
890
  10%|β–ˆ | 455/4350 [03:08<22:49, 2.84it/s]
891
  10%|β–ˆ | 456/4350 [03:08<22:03, 2.94it/s]
892
  11%|β–ˆ | 457/4350 [03:08<21:56, 2.96it/s]
893
  11%|β–ˆ | 458/4350 [03:09<24:30, 2.65it/s]
894
  11%|β–ˆ | 459/4350 [03:09<23:52, 2.72it/s]
895
  11%|β–ˆ | 460/4350 [03:09<21:48, 2.97it/s]
896
  11%|β–ˆ | 461/4350 [03:10<21:29, 3.02it/s]
897
  11%|β–ˆ | 462/4350 [03:10<19:35, 3.31it/s]
898
  11%|β–ˆ | 463/4350 [03:10<23:36, 2.74it/s]
899
  11%|β–ˆ | 464/4350 [03:11<23:42, 2.73it/s]
900
  11%|β–ˆ | 465/4350 [03:11<21:35, 3.00it/s]
901
  11%|β–ˆ | 466/4350 [03:12<24:19, 2.66it/s]
902
  11%|β–ˆ | 467/4350 [03:12<24:10, 2.68it/s]
903
  11%|β–ˆ | 468/4350 [03:13<31:53, 2.03it/s]
904
  11%|β–ˆ | 469/4350 [03:13<28:07, 2.30it/s]
905
  11%|β–ˆ | 470/4350 [03:13<27:34, 2.34it/s]
906
  11%|β–ˆ | 471/4350 [03:14<27:24, 2.36it/s]
907
  11%|β–ˆ | 472/4350 [03:14<25:31, 2.53it/s]
908
  11%|β–ˆ | 473/4350 [03:14<24:42, 2.61it/s]
909
  11%|β–ˆ | 474/4350 [03:15<24:15, 2.66it/s]
910
  11%|β–ˆ | 475/4350 [03:15<24:13, 2.67it/s]
911
  11%|β–ˆ | 476/4350 [03:16<23:17, 2.77it/s]
912
  11%|β–ˆ | 477/4350 [03:16<24:01, 2.69it/s]
913
  11%|β–ˆ | 478/4350 [03:16<23:05, 2.79it/s]
914
  11%|β–ˆ | 479/4350 [03:17<23:58, 2.69it/s]
915
  11%|β–ˆ | 480/4350 [03:17<24:26, 2.64it/s]
916
  11%|β–ˆ | 481/4350 [03:17<23:26, 2.75it/s]
917
  11%|β–ˆ | 482/4350 [03:18<23:50, 2.70it/s]
918
  11%|β–ˆ | 483/4350 [03:18<23:34, 2.73it/s]
919
  11%|β–ˆ | 484/4350 [03:18<21:50, 2.95it/s]
920
  11%|β–ˆ | 485/4350 [03:19<21:30, 3.00it/s]
921
  11%|β–ˆ | 486/4350 [03:19<24:22, 2.64it/s]
922
  11%|β–ˆ | 487/4350 [03:20<23:37, 2.73it/s]
923
  11%|β–ˆ | 488/4350 [03:20<24:31, 2.62it/s]
924
  11%|β–ˆ | 489/4350 [03:20<24:18, 2.65it/s]
925
  11%|β–ˆβ– | 490/4350 [03:21<24:39, 2.61it/s]
926
  11%|β–ˆβ– | 491/4350 [03:21<23:02, 2.79it/s]
927
  11%|β–ˆβ– | 492/4350 [03:21<22:33, 2.85it/s]
928
  11%|β–ˆβ– | 493/4350 [03:22<22:25, 2.87it/s]
929
  11%|β–ˆβ– | 494/4350 [03:22<22:53, 2.81it/s]
930
  11%|β–ˆβ– | 495/4350 [03:22<20:48, 3.09it/s]
931
  11%|β–ˆβ– | 496/4350 [03:23<22:32, 2.85it/s]
932
  11%|β–ˆβ– | 497/4350 [03:23<22:48, 2.82it/s]
933
  11%|β–ˆβ– | 498/4350 [03:23<22:42, 2.83it/s]
934
  11%|β–ˆβ– | 499/4350 [03:24<21:58, 2.92it/s]
935
  11%|β–ˆβ– | 500/4350 [03:24<22:30, 2.85it/s]
936
 
937
  11%|β–ˆβ– | 500/4350 [03:24<22:30, 2.85it/s]
938
  12%|β–ˆβ– | 501/4350 [03:25<23:41, 2.71it/s]
939
  12%|β–ˆβ– | 502/4350 [03:25<22:51, 2.81it/s]
940
  12%|β–ˆβ– | 503/4350 [03:25<23:39, 2.71it/s]
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13556e6c97b2f39e25d5830ab0bc61ce81f807bcf643d150d23dd97c2f606c57
3
+ size 5240
vocab.txt ADDED
The diff for this file is too large to render. See raw diff