Metal079 committed on
Commit
05a806e
·
1 Parent(s): e2ff778

Upload 4 files

Browse files
Files changed (3) hide show
  1. sonic/config.json +44 -10
  2. sonic/pytorch_model.bin +2 -2
  3. sonic/trainer_state.json +133 -124
sonic/config.json CHANGED
@@ -19,14 +19,31 @@
19
  ],
20
  "id2label": {
21
  "0": "Tails the fox",
22
- "1": "Amy rose",
23
  "10": "Shadow the hedgehog",
24
  "11": "Sally Acorn",
25
- "12": "mobian",
26
- "13": "Tangle the lemur",
27
- "14": "Big the cat",
28
- "2": "Rouge the bat",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
29
  "3": "Whisper the wolf",
 
 
30
  "4": "Knuckles the echidna",
31
  "5": "Blaze the cat",
32
  "6": "Silver the hedgehog",
@@ -37,21 +54,38 @@
37
  "image_size": 384,
38
  "initializer_range": 0.02,
39
  "label2id": {
40
- "Amy rose": "1",
41
- "Big the cat": "14",
42
  "Blaze the cat": "5",
 
 
 
43
  "Cream the rabbit": "7",
 
 
 
44
  "Knuckles the echidna": "4",
45
- "Rouge the bat": "2",
 
 
 
46
  "Sally Acorn": "11",
47
  "Shadow the hedgehog": "10",
48
  "Silver the hedgehog": "6",
49
  "Sonic the hedgehog": "9",
 
 
 
 
50
  "Tails the fox": "0",
51
- "Tangle the lemur": "13",
 
52
  "Vanilla the rabbit": "8",
 
 
53
  "Whisper the wolf": "3",
54
- "mobian": "12"
 
55
  },
56
  "layer_norm_eps": 1e-12,
57
  "layer_scale_init_value": 1e-06,
 
19
  ],
20
  "id2label": {
21
  "0": "Tails the fox",
22
+ "1": "Amy Rose",
23
  "10": "Shadow the hedgehog",
24
  "11": "Sally Acorn",
25
+ "12": "Tangle the lemur",
26
+ "13": "mobian",
27
+ "14": "Cosmo the seedrian",
28
+ "15": "Big the cat",
29
+ "16": "Sticks the badger",
30
+ "17": "Tikal the echidna",
31
+ "18": "Wave the swallow",
32
+ "19": "Jet the hawk",
33
+ "2": "Rogue the bat",
34
+ "20": "Honey the cat",
35
+ "21": "Surge the tenrec",
36
+ "22": "Starline the platypus",
37
+ "23": "Mighty the armadillo",
38
+ "24": "Vector the crocodile",
39
+ "25": "Charmy the bee",
40
+ "26": "Espio the chameleon",
41
+ "27": "eggman",
42
+ "28": "Bunnie Rabbot",
43
+ "29": "Marine the Raccoon",
44
  "3": "Whisper the wolf",
45
+ "30": "Storm the albatross",
46
+ "31": "Maria Robotnik",
47
  "4": "Knuckles the echidna",
48
  "5": "Blaze the cat",
49
  "6": "Silver the hedgehog",
 
54
  "image_size": 384,
55
  "initializer_range": 0.02,
56
  "label2id": {
57
+ "Amy Rose": "1",
58
+ "Big the cat": "15",
59
  "Blaze the cat": "5",
60
+ "Bunnie Rabbot": "28",
61
+ "Charmy the bee": "25",
62
+ "Cosmo the seedrian": "14",
63
  "Cream the rabbit": "7",
64
+ "Espio the chameleon": "26",
65
+ "Honey the cat": "20",
66
+ "Jet the hawk": "19",
67
  "Knuckles the echidna": "4",
68
+ "Maria Robotnik": "31",
69
+ "Marine the Raccoon": "29",
70
+ "Mighty the armadillo": "23",
71
+ "Rogue the bat": "2",
72
  "Sally Acorn": "11",
73
  "Shadow the hedgehog": "10",
74
  "Silver the hedgehog": "6",
75
  "Sonic the hedgehog": "9",
76
+ "Starline the platypus": "22",
77
+ "Sticks the badger": "16",
78
+ "Storm the albatross": "30",
79
+ "Surge the tenrec": "21",
80
  "Tails the fox": "0",
81
+ "Tangle the lemur": "12",
82
+ "Tikal the echidna": "17",
83
  "Vanilla the rabbit": "8",
84
+ "Vector the crocodile": "24",
85
+ "Wave the swallow": "18",
86
  "Whisper the wolf": "3",
87
+ "eggman": "27",
88
+ "mobian": "13"
89
  },
90
  "layer_norm_eps": 1e-12,
91
  "layer_scale_init_value": 1e-06,
sonic/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bd4d6897c65fc76cc210003c9552b14442dd4d5786bab4e5b323c52bafa2e877
3
- size 350446061
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec5e3d6a60bdf3f519adb879379016d6bd97bb046a8f5a18afaac0cbae52c570
3
+ size 350515757
sonic/trainer_state.json CHANGED
@@ -1,177 +1,186 @@
1
  {
2
- "best_metric": 0.09438519924879074,
3
- "best_model_checkpoint": "./SonicCharacterClassifier\\checkpoint-1400",
4
- "epoch": 4.093567251461988,
5
- "global_step": 1400,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 0.29,
12
- "learning_rate": 4.853801169590643e-05,
13
- "loss": 0.3188,
14
- "step": 100
15
- },
16
- {
17
- "epoch": 0.58,
18
- "learning_rate": 4.707602339181287e-05,
19
- "loss": 0.2087,
20
  "step": 200
21
  },
22
  {
23
- "epoch": 0.58,
24
- "eval_accuracy": 0.9407407407407361,
25
- "eval_loss": 0.16877754032611847,
26
- "eval_precision": 0.6539702845075653,
27
- "eval_recall": 0.5742313120602596,
28
- "eval_runtime": 161.9664,
29
- "eval_samples_per_second": 8.446,
30
- "eval_steps_per_second": 1.056,
31
  "step": 200
32
  },
33
  {
34
- "epoch": 0.88,
35
- "learning_rate": 4.56140350877193e-05,
36
- "loss": 0.1663,
37
- "step": 300
38
- },
39
- {
40
- "epoch": 1.17,
41
- "learning_rate": 4.4152046783625734e-05,
42
- "loss": 0.1155,
43
  "step": 400
44
  },
45
  {
46
- "epoch": 1.17,
47
- "eval_accuracy": 0.9615009746588669,
48
- "eval_loss": 0.12015020102262497,
49
- "eval_precision": 0.8305708768976313,
50
- "eval_recall": 0.7801112001221648,
51
- "eval_runtime": 161.8616,
52
- "eval_samples_per_second": 8.452,
53
- "eval_steps_per_second": 1.056,
54
  "step": 400
55
  },
56
  {
57
- "epoch": 1.46,
58
- "learning_rate": 4.269005847953216e-05,
59
- "loss": 0.095,
60
- "step": 500
61
- },
62
- {
63
- "epoch": 1.75,
64
- "learning_rate": 4.12280701754386e-05,
65
- "loss": 0.0932,
66
  "step": 600
67
  },
68
  {
69
- "epoch": 1.75,
70
- "eval_accuracy": 0.964278752436644,
71
- "eval_loss": 0.1112869530916214,
72
- "eval_precision": 0.8358102748453625,
73
- "eval_recall": 0.7573138768314205,
74
- "eval_runtime": 160.6953,
75
- "eval_samples_per_second": 8.513,
76
- "eval_steps_per_second": 1.064,
77
  "step": 600
78
  },
79
  {
80
- "epoch": 2.05,
81
- "learning_rate": 3.976608187134503e-05,
82
- "loss": 0.087,
83
- "step": 700
84
- },
85
- {
86
- "epoch": 2.34,
87
- "learning_rate": 3.8304093567251465e-05,
88
- "loss": 0.0489,
89
  "step": 800
90
  },
91
  {
92
- "epoch": 2.34,
93
- "eval_accuracy": 0.9684697855750467,
94
- "eval_loss": 0.09839322417974472,
95
- "eval_precision": 0.877861029889539,
96
- "eval_recall": 0.8274951210258222,
97
- "eval_runtime": 160.5107,
98
- "eval_samples_per_second": 8.523,
99
- "eval_steps_per_second": 1.065,
100
  "step": 800
101
  },
102
  {
103
- "epoch": 2.63,
104
- "learning_rate": 3.6842105263157895e-05,
105
- "loss": 0.0506,
106
- "step": 900
107
- },
108
- {
109
- "epoch": 2.92,
110
- "learning_rate": 3.538011695906433e-05,
111
- "loss": 0.0503,
112
  "step": 1000
113
  },
114
  {
115
- "epoch": 2.92,
116
- "eval_accuracy": 0.9692495126705621,
117
- "eval_loss": 0.09646110981702805,
118
- "eval_precision": 0.8755529497305813,
119
- "eval_recall": 0.8374415545468176,
120
- "eval_runtime": 161.798,
121
- "eval_samples_per_second": 8.455,
122
- "eval_steps_per_second": 1.057,
123
  "step": 1000
124
  },
125
  {
126
- "epoch": 3.22,
127
- "learning_rate": 3.391812865497076e-05,
128
- "loss": 0.0297,
129
- "step": 1100
130
- },
131
- {
132
- "epoch": 3.51,
133
- "learning_rate": 3.24561403508772e-05,
134
- "loss": 0.0245,
135
  "step": 1200
136
  },
137
  {
138
- "epoch": 3.51,
139
- "eval_accuracy": 0.9697855750487306,
140
- "eval_loss": 0.09691683202981949,
141
- "eval_precision": 0.8796307635671673,
142
- "eval_recall": 0.8392919296428067,
143
- "eval_runtime": 163.6772,
144
- "eval_samples_per_second": 8.358,
145
- "eval_steps_per_second": 1.045,
146
  "step": 1200
147
  },
148
  {
149
- "epoch": 3.8,
150
- "learning_rate": 3.0994152046783626e-05,
151
- "loss": 0.026,
152
- "step": 1300
153
  },
154
  {
155
- "epoch": 4.09,
156
- "learning_rate": 2.9532163742690062e-05,
157
- "loss": 0.0231,
 
 
 
 
 
158
  "step": 1400
159
  },
160
  {
161
- "epoch": 4.09,
162
- "eval_accuracy": 0.9713937621832336,
163
- "eval_loss": 0.09438519924879074,
164
- "eval_precision": 0.8850769600769599,
165
- "eval_recall": 0.8511938435184049,
166
- "eval_runtime": 161.9688,
167
- "eval_samples_per_second": 8.446,
168
- "eval_steps_per_second": 1.056,
169
- "step": 1400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
170
  }
171
  ],
172
- "max_steps": 3420,
173
  "num_train_epochs": 10,
174
- "total_flos": 5.207113357118669e+18,
175
  "trial_name": null,
176
  "trial_params": null
177
  }
 
1
  {
2
+ "best_metric": 0.08468733727931976,
3
+ "best_model_checkpoint": "./SonicCharacterClassifier\\checkpoint-1600",
4
+ "epoch": 6.042296072507553,
5
+ "global_step": 2000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 0.6,
12
+ "learning_rate": 4.6978851963746225e-05,
13
+ "loss": 0.2038,
 
 
 
 
 
 
14
  "step": 200
15
  },
16
  {
17
+ "epoch": 0.6,
18
+ "eval_accuracy": 0.9509220795568983,
19
+ "eval_loss": 0.1493668258190155,
20
+ "eval_precision": 0.4276334957981484,
21
+ "eval_recall": 0.34057603409646653,
22
+ "eval_runtime": 245.2223,
23
+ "eval_samples_per_second": 8.099,
24
+ "eval_steps_per_second": 1.015,
25
  "step": 200
26
  },
27
  {
28
+ "epoch": 1.21,
29
+ "learning_rate": 4.395770392749245e-05,
30
+ "loss": 0.1299,
 
 
 
 
 
 
31
  "step": 400
32
  },
33
  {
34
+ "epoch": 1.21,
35
+ "eval_accuracy": 0.9626132930513596,
36
+ "eval_loss": 0.11390183866024017,
37
+ "eval_precision": 0.6821628829936983,
38
+ "eval_recall": 0.6035811496119172,
39
+ "eval_runtime": 245.5675,
40
+ "eval_samples_per_second": 8.087,
41
+ "eval_steps_per_second": 1.014,
42
  "step": 400
43
  },
44
  {
45
+ "epoch": 1.81,
46
+ "learning_rate": 4.093655589123867e-05,
47
+ "loss": 0.0952,
 
 
 
 
 
 
48
  "step": 600
49
  },
50
  {
51
+ "epoch": 1.81,
52
+ "eval_accuracy": 0.9677901560926485,
53
+ "eval_loss": 0.10017536580562592,
54
+ "eval_precision": 0.7746363586620384,
55
+ "eval_recall": 0.71393109788423,
56
+ "eval_runtime": 246.2016,
57
+ "eval_samples_per_second": 8.067,
58
+ "eval_steps_per_second": 1.011,
59
  "step": 600
60
  },
61
  {
62
+ "epoch": 2.42,
63
+ "learning_rate": 3.79154078549849e-05,
64
+ "loss": 0.0681,
 
 
 
 
 
 
65
  "step": 800
66
  },
67
  {
68
+ "epoch": 2.42,
69
+ "eval_accuracy": 0.9708113041289023,
70
+ "eval_loss": 0.09041494876146317,
71
+ "eval_precision": 0.8065139068160218,
72
+ "eval_recall": 0.7231326368063123,
73
+ "eval_runtime": 245.4942,
74
+ "eval_samples_per_second": 8.09,
75
+ "eval_steps_per_second": 1.014,
76
  "step": 800
77
  },
78
  {
79
+ "epoch": 3.02,
80
+ "learning_rate": 3.489425981873112e-05,
81
+ "loss": 0.0608,
 
 
 
 
 
 
82
  "step": 1000
83
  },
84
  {
85
+ "epoch": 3.02,
86
+ "eval_accuracy": 0.972904078549849,
87
+ "eval_loss": 0.08679082244634628,
88
+ "eval_precision": 0.8209949551458537,
89
+ "eval_recall": 0.7289373926706963,
90
+ "eval_runtime": 244.3239,
91
+ "eval_samples_per_second": 8.129,
92
+ "eval_steps_per_second": 1.019,
93
  "step": 1000
94
  },
95
  {
96
+ "epoch": 3.63,
97
+ "learning_rate": 3.187311178247734e-05,
98
+ "loss": 0.0393,
 
 
 
 
 
 
99
  "step": 1200
100
  },
101
  {
102
+ "epoch": 3.63,
103
+ "eval_accuracy": 0.9730771651560927,
104
+ "eval_loss": 0.08753738552331924,
105
+ "eval_precision": 0.8360383490292852,
106
+ "eval_recall": 0.7486598211097333,
107
+ "eval_runtime": 248.2529,
108
+ "eval_samples_per_second": 8.0,
109
+ "eval_steps_per_second": 1.003,
110
  "step": 1200
111
  },
112
  {
113
+ "epoch": 4.23,
114
+ "learning_rate": 2.8851963746223565e-05,
115
+ "loss": 0.0347,
116
+ "step": 1400
117
  },
118
  {
119
+ "epoch": 4.23,
120
+ "eval_accuracy": 0.9733761329305136,
121
+ "eval_loss": 0.08492986112833023,
122
+ "eval_precision": 0.8388275873170129,
123
+ "eval_recall": 0.7801557843198007,
124
+ "eval_runtime": 248.4693,
125
+ "eval_samples_per_second": 7.993,
126
+ "eval_steps_per_second": 1.002,
127
  "step": 1400
128
  },
129
  {
130
+ "epoch": 4.83,
131
+ "learning_rate": 2.583081570996979e-05,
132
+ "loss": 0.0256,
133
+ "step": 1600
134
+ },
135
+ {
136
+ "epoch": 4.83,
137
+ "eval_accuracy": 0.9739583333333334,
138
+ "eval_loss": 0.08468733727931976,
139
+ "eval_precision": 0.8475558611132625,
140
+ "eval_recall": 0.788949676665331,
141
+ "eval_runtime": 248.7261,
142
+ "eval_samples_per_second": 7.985,
143
+ "eval_steps_per_second": 1.001,
144
+ "step": 1600
145
+ },
146
+ {
147
+ "epoch": 5.44,
148
+ "learning_rate": 2.2809667673716012e-05,
149
+ "loss": 0.0191,
150
+ "step": 1800
151
+ },
152
+ {
153
+ "epoch": 5.44,
154
+ "eval_accuracy": 0.9742573011077543,
155
+ "eval_loss": 0.0882001668214798,
156
+ "eval_precision": 0.845859505500522,
157
+ "eval_recall": 0.7649921950675245,
158
+ "eval_runtime": 251.833,
159
+ "eval_samples_per_second": 7.886,
160
+ "eval_steps_per_second": 0.989,
161
+ "step": 1800
162
+ },
163
+ {
164
+ "epoch": 6.04,
165
+ "learning_rate": 1.9788519637462235e-05,
166
+ "loss": 0.0154,
167
+ "step": 2000
168
+ },
169
+ {
170
+ "epoch": 6.04,
171
+ "eval_accuracy": 0.9743674471299094,
172
+ "eval_loss": 0.08864131569862366,
173
+ "eval_precision": 0.8535254440088273,
174
+ "eval_recall": 0.7735381205368478,
175
+ "eval_runtime": 245.1302,
176
+ "eval_samples_per_second": 8.102,
177
+ "eval_steps_per_second": 1.016,
178
+ "step": 2000
179
  }
180
  ],
181
+ "max_steps": 3310,
182
  "num_train_epochs": 10,
183
+ "total_flos": 1.1154739870524506e+19,
184
  "trial_name": null,
185
  "trial_params": null
186
  }