varcoder committed on
Commit
b58fe67
·
1 Parent(s): 4dc31d9

End of training

Browse files
Files changed (4) hide show
  1. all_results.json +10 -10
  2. eval_results.json +5 -5
  3. train_results.json +5 -5
  4. trainer_state.json +56 -64
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
  "epoch": 8.11,
3
- "eval_accuracy": 0.0,
4
- "eval_loss": NaN,
5
- "eval_runtime": 5.2931,
6
- "eval_samples_per_second": 55.733,
7
- "eval_steps_per_second": 1.889,
8
- "total_flos": 3.675135085585367e+17,
9
- "train_loss": 0.0,
10
- "train_runtime": 249.2359,
11
- "train_samples_per_second": 47.345,
12
- "train_steps_per_second": 0.12
13
  }
 
1
  {
2
  "epoch": 8.11,
3
+ "eval_accuracy": 0.8542372881355932,
4
+ "eval_loss": 0.5490496158599854,
5
+ "eval_runtime": 29.4646,
6
+ "eval_samples_per_second": 10.012,
7
+ "eval_steps_per_second": 0.339,
8
+ "total_flos": 3.673187375325512e+17,
9
+ "train_loss": 0.8043342590332031,
10
+ "train_runtime": 2700.5846,
11
+ "train_samples_per_second": 4.369,
12
+ "train_steps_per_second": 0.011
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 8.11,
3
- "eval_accuracy": 0.0,
4
- "eval_loss": NaN,
5
- "eval_runtime": 5.2931,
6
- "eval_samples_per_second": 55.733,
7
- "eval_steps_per_second": 1.889
8
  }
 
1
  {
2
  "epoch": 8.11,
3
+ "eval_accuracy": 0.8542372881355932,
4
+ "eval_loss": 0.5490496158599854,
5
+ "eval_runtime": 29.4646,
6
+ "eval_samples_per_second": 10.012,
7
+ "eval_steps_per_second": 0.339
8
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 8.11,
3
- "total_flos": 3.675135085585367e+17,
4
- "train_loss": 0.0,
5
- "train_runtime": 249.2359,
6
- "train_samples_per_second": 47.345,
7
- "train_steps_per_second": 0.12
8
  }
 
1
  {
2
  "epoch": 8.11,
3
+ "total_flos": 3.673187375325512e+17,
4
+ "train_loss": 0.8043342590332031,
5
+ "train_runtime": 2700.5846,
6
+ "train_samples_per_second": 4.369,
7
+ "train_steps_per_second": 0.011
8
  }
trainer_state.json CHANGED
@@ -1,8 +1,7 @@
1
  {
2
- "best_metric": 0.0,
3
- "best_model_checkpoint": "resnet-101-finetuned-CivilEng11k/checkpoint-3",
4
  "epoch": 8.108108108108109,
5
- "eval_steps": 500,
6
  "global_step": 30,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
@@ -10,123 +9,116 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.81,
13
- "eval_accuracy": 0.0,
14
- "eval_loss": NaN,
15
- "eval_runtime": 5.4471,
16
- "eval_samples_per_second": 54.157,
17
- "eval_steps_per_second": 1.836,
18
  "step": 3
19
  },
20
  {
21
  "epoch": 1.89,
22
- "eval_accuracy": 0.0,
23
- "eval_loss": NaN,
24
- "eval_runtime": 5.2566,
25
- "eval_samples_per_second": 56.12,
26
- "eval_steps_per_second": 1.902,
27
  "step": 7
28
  },
29
  {
30
  "epoch": 2.7,
31
- "grad_norm": NaN,
32
  "learning_rate": 0.00022222222222222218,
33
- "loss": 0.0,
34
  "step": 10
35
  },
36
  {
37
  "epoch": 2.97,
38
- "eval_accuracy": 0.0,
39
- "eval_loss": NaN,
40
- "eval_runtime": 5.2368,
41
- "eval_samples_per_second": 56.332,
42
- "eval_steps_per_second": 1.91,
43
  "step": 11
44
  },
45
  {
46
  "epoch": 3.78,
47
- "eval_accuracy": 0.0,
48
- "eval_loss": NaN,
49
- "eval_runtime": 5.1779,
50
- "eval_samples_per_second": 56.973,
51
- "eval_steps_per_second": 1.931,
52
  "step": 14
53
  },
54
  {
55
  "epoch": 4.86,
56
- "eval_accuracy": 0.0,
57
- "eval_loss": NaN,
58
- "eval_runtime": 5.1256,
59
- "eval_samples_per_second": 57.555,
60
- "eval_steps_per_second": 1.951,
61
  "step": 18
62
  },
63
  {
64
  "epoch": 5.41,
65
- "grad_norm": NaN,
66
  "learning_rate": 0.00011111111111111109,
67
- "loss": 0.0,
68
  "step": 20
69
  },
70
  {
71
  "epoch": 5.95,
72
- "eval_accuracy": 0.0,
73
- "eval_loss": NaN,
74
- "eval_runtime": 5.1976,
75
- "eval_samples_per_second": 56.757,
76
- "eval_steps_per_second": 1.924,
77
  "step": 22
78
  },
79
  {
80
  "epoch": 6.76,
81
- "eval_accuracy": 0.0,
82
- "eval_loss": NaN,
83
- "eval_runtime": 5.1726,
84
- "eval_samples_per_second": 57.032,
85
- "eval_steps_per_second": 1.933,
86
  "step": 25
87
  },
88
  {
89
  "epoch": 7.84,
90
- "eval_accuracy": 0.0,
91
- "eval_loss": NaN,
92
- "eval_runtime": 5.0794,
93
- "eval_samples_per_second": 58.078,
94
- "eval_steps_per_second": 1.969,
95
  "step": 29
96
  },
97
  {
98
  "epoch": 8.11,
99
- "grad_norm": NaN,
100
  "learning_rate": 0.0,
101
- "loss": 0.0,
102
  "step": 30
103
  },
104
  {
105
  "epoch": 8.11,
106
- "eval_accuracy": 0.0,
107
- "eval_loss": NaN,
108
- "eval_runtime": 5.2939,
109
- "eval_samples_per_second": 55.725,
110
- "eval_steps_per_second": 1.889,
111
  "step": 30
112
  },
113
  {
114
  "epoch": 8.11,
115
  "step": 30,
116
- "total_flos": 3.675135085585367e+17,
117
- "train_loss": 0.0,
118
- "train_runtime": 249.2359,
119
- "train_samples_per_second": 47.345,
120
- "train_steps_per_second": 0.12
121
  }
122
  ],
123
- "logging_steps": 10,
124
  "max_steps": 30,
125
- "num_input_tokens_seen": 0,
126
  "num_train_epochs": 10,
127
- "save_steps": 500,
128
- "total_flos": 3.675135085585367e+17,
129
- "train_batch_size": 32,
130
  "trial_name": null,
131
  "trial_params": null
132
  }
 
1
  {
2
+ "best_metric": 0.8542372881355932,
3
+ "best_model_checkpoint": "resnet-101-finetuned-CivilEng11k\\checkpoint-30",
4
  "epoch": 8.108108108108109,
 
5
  "global_step": 30,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
 
9
  "log_history": [
10
  {
11
  "epoch": 0.81,
12
+ "eval_accuracy": 0.5728813559322034,
13
+ "eval_loss": 1.072370171546936,
14
+ "eval_runtime": 31.0882,
15
+ "eval_samples_per_second": 9.489,
16
+ "eval_steps_per_second": 0.322,
17
  "step": 3
18
  },
19
  {
20
  "epoch": 1.89,
21
+ "eval_accuracy": 0.6542372881355932,
22
+ "eval_loss": 0.9717434048652649,
23
+ "eval_runtime": 28.8812,
24
+ "eval_samples_per_second": 10.214,
25
+ "eval_steps_per_second": 0.346,
26
  "step": 7
27
  },
28
  {
29
  "epoch": 2.7,
 
30
  "learning_rate": 0.00022222222222222218,
31
+ "loss": 1.0293,
32
  "step": 10
33
  },
34
  {
35
  "epoch": 2.97,
36
+ "eval_accuracy": 0.6677966101694915,
37
+ "eval_loss": 0.8594140410423279,
38
+ "eval_runtime": 29.6429,
39
+ "eval_samples_per_second": 9.952,
40
+ "eval_steps_per_second": 0.337,
41
  "step": 11
42
  },
43
  {
44
  "epoch": 3.78,
45
+ "eval_accuracy": 0.7016949152542373,
46
+ "eval_loss": 0.7830201983451843,
47
+ "eval_runtime": 27.8913,
48
+ "eval_samples_per_second": 10.577,
49
+ "eval_steps_per_second": 0.359,
50
  "step": 14
51
  },
52
  {
53
  "epoch": 4.86,
54
+ "eval_accuracy": 0.7593220338983051,
55
+ "eval_loss": 0.6764189600944519,
56
+ "eval_runtime": 28.0114,
57
+ "eval_samples_per_second": 10.531,
58
+ "eval_steps_per_second": 0.357,
59
  "step": 18
60
  },
61
  {
62
  "epoch": 5.41,
 
63
  "learning_rate": 0.00011111111111111109,
64
+ "loss": 0.78,
65
  "step": 20
66
  },
67
  {
68
  "epoch": 5.95,
69
+ "eval_accuracy": 0.7830508474576271,
70
+ "eval_loss": 0.6071953177452087,
71
+ "eval_runtime": 27.9144,
72
+ "eval_samples_per_second": 10.568,
73
+ "eval_steps_per_second": 0.358,
74
  "step": 22
75
  },
76
  {
77
  "epoch": 6.76,
78
+ "eval_accuracy": 0.8338983050847457,
79
+ "eval_loss": 0.5745152235031128,
80
+ "eval_runtime": 28.2316,
81
+ "eval_samples_per_second": 10.449,
82
+ "eval_steps_per_second": 0.354,
83
  "step": 25
84
  },
85
  {
86
  "epoch": 7.84,
87
+ "eval_accuracy": 0.8508474576271187,
88
+ "eval_loss": 0.5488777756690979,
89
+ "eval_runtime": 29.7841,
90
+ "eval_samples_per_second": 9.905,
91
+ "eval_steps_per_second": 0.336,
92
  "step": 29
93
  },
94
  {
95
  "epoch": 8.11,
 
96
  "learning_rate": 0.0,
97
+ "loss": 0.6037,
98
  "step": 30
99
  },
100
  {
101
  "epoch": 8.11,
102
+ "eval_accuracy": 0.8542372881355932,
103
+ "eval_loss": 0.5490496158599854,
104
+ "eval_runtime": 29.9582,
105
+ "eval_samples_per_second": 9.847,
106
+ "eval_steps_per_second": 0.334,
107
  "step": 30
108
  },
109
  {
110
  "epoch": 8.11,
111
  "step": 30,
112
+ "total_flos": 3.673187375325512e+17,
113
+ "train_loss": 0.8043342590332031,
114
+ "train_runtime": 2700.5846,
115
+ "train_samples_per_second": 4.369,
116
+ "train_steps_per_second": 0.011
117
  }
118
  ],
 
119
  "max_steps": 30,
 
120
  "num_train_epochs": 10,
121
+ "total_flos": 3.673187375325512e+17,
 
 
122
  "trial_name": null,
123
  "trial_params": null
124
  }