{"train_lr": 9.999999999999999e-05, "train_min_lr": 5.000000000000001e-06, "train_loss": 1.211935778995892, "train_loss_scale": 42903.44744744745, "train_weight_decay": 0.009999999999999919, "train_grad_norm": Infinity, "val_score": 61.19140589237213, "epoch": 0, "n_parameters": 676689114} {"train_lr": 0.0001996958096529171, "train_min_lr": 9.984790482645852e-06, "train_loss": 1.2121001839995742, "train_loss_scale": 20123.29129129129, "train_weight_decay": 0.009999999999999919, "train_grad_norm": NaN, "val_score": 60.15624952316284, "epoch": 1, "n_parameters": 676689114} {"train_lr": 0.0001978726125913927, "train_min_lr": 9.893630629569637e-06, "train_loss": 0.9858112536572121, "train_loss_scale": 16384.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 17.722414419099735, "val_score": 62.304686427116394, "epoch": 2, "n_parameters": 676689114} {"train_lr": 0.00019426058254119679, "train_min_lr": 9.713029127059847e-06, "train_loss": 0.8251964157676553, "train_loss_scale": 16384.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 17.40996901337449, "val_score": 61.62109398841858, "epoch": 3, "n_parameters": 676689114} {"train_lr": 0.00018893325001791706, "train_min_lr": 9.446662500895856e-06, "train_loss": 0.6833842111242426, "train_loss_scale": 16384.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 17.004900761910744, "val_score": 62.08984303474426, "epoch": 4, "n_parameters": 676689114} {"train_lr": 0.00018199906414896873, "train_min_lr": 9.09995320744844e-06, "train_loss": 0.6133985659023663, "train_loss_scale": 16384.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 17.63499834587624, "val_score": 61.17187428474426, "epoch": 5, "n_parameters": 676689114} {"train_lr": 0.00017359918496210293, "train_min_lr": 8.679959248105154e-06, "train_loss": 0.5402796789556294, "train_loss_scale": 14883.363363363364, "train_weight_decay": 0.009999999999999919, "train_grad_norm": NaN, "val_score": 63.339842796325684, "epoch": 6, "n_parameters": 676689114} {"train_lr": 0.00016390460977431316, "train_min_lr": 8.19523048871566e-06, "train_loss": 0.5181443974509969, "train_loss_scale": 8192.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 17.63569292435059, "val_score": 61.77734363079071, "epoch": 7, "n_parameters": 676689114} {"train_lr": 0.0001531126921795763, "train_min_lr": 7.65563460897881e-06, "train_loss": 0.45838243518774213, "train_loss_scale": 8192.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 17.09453874450546, "val_score": 63.808592677116394, "epoch": 8, "n_parameters": 676689114} {"train_lr": 0.00014144312449880072, "train_min_lr": 7.07215622494004e-06, "train_loss": 0.41373957823346685, "train_loss_scale": 8192.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 16.566668019996392, "val_score": 63.18359363079071, "epoch": 9, "n_parameters": 676689114} {"train_lr": 0.00012913346547771312, "train_min_lr": 6.456673273885655e-06, "train_loss": 0.3603322505615316, "train_loss_scale": 8192.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 15.078377696486923, "val_score": 62.26562464237213, "epoch": 10, "n_parameters": 676689114} {"train_lr": 0.00011643430427585721, "train_min_lr": 5.821715213792866e-06, "train_loss": 0.33128674582273393, "train_loss_scale": 8192.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 14.886102125451371, "val_score": 60.97656226158142, "epoch": 11, "n_parameters": 676689114} {"train_lr": 0.00010360415919394631, "train_min_lr": 5.180207959697313e-06, "train_loss": 0.2856660650836097, "train_loss_scale": 4096.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": NaN, "val_score": 62.14843726158142, "epoch": 12, "n_parameters": 676689114} {"train_lr": 9.09042149867648e-05, "train_min_lr": 4.545210749338237e-06, "train_loss": 0.2689260695543554, "train_loss_scale": 4096.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 12.872011095553905, "val_score": 63.046873569488525, "epoch": 13, "n_parameters": 676689114} {"train_lr": 7.859300589475608e-05, "train_min_lr": 3.929650294737803e-06, "train_loss": 0.25824537334611286, "train_loss_scale": 4096.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 12.271222051915464, "val_score": 62.87109386920929, "epoch": 14, "n_parameters": 676689114} {"train_lr": 6.692115263243832e-05, "train_min_lr": 3.346057631621917e-06, "train_loss": 0.23223496808505453, "train_loss_scale": 4096.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 11.5709586641094, "val_score": 61.87500011920929, "epoch": 15, "n_parameters": 676689114} {"train_lr": 5.612626047338678e-05, "train_min_lr": 2.806313023669339e-06, "train_loss": 0.2138716054705528, "train_loss_scale": 4096.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 10.646926737404442, "val_score": 63.04687511920929, "epoch": 16, "n_parameters": 676689114} {"train_lr": 4.642808229206154e-05, "train_min_lr": 2.3214041146030775e-06, "train_loss": 0.19576878029595804, "train_loss_scale": 4096.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 10.534730427258008, "val_score": 63.22265577316284, "epoch": 17, "n_parameters": 676689114} {"train_lr": 3.802404502899794e-05, "train_min_lr": 1.901202251449895e-06, "train_loss": 0.19238561037200708, "train_loss_scale": 8167.399399399399, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 9.451654581694273, "val_score": 61.83593797683716, "epoch": 18, "n_parameters": 676689114} {"train_lr": 3.1085230647629717e-05, "train_min_lr": 1.5542615323814836e-06, "train_loss": 0.1817448143497691, "train_loss_scale": 8192.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 9.433108793364632, "val_score": 61.56250047683716, "epoch": 19, "n_parameters": 676689114} {"train_lr": 2.5752893398873276e-05, "train_min_lr": 1.2876446699436636e-06, "train_loss": 0.17458355467621092, "train_loss_scale": 8192.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 9.079465755113253, "val_score": 62.69531238079071, "epoch": 20, "n_parameters": 676689114} {"train_lr": 2.2135584291922487e-05, "train_min_lr": 1.1067792145961235e-06, "train_loss": 0.16912682604760648, "train_loss_scale": 8192.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 8.673409387872026, "val_score": 63.86718690395355, "epoch": 21, "n_parameters": 676689114} {"train_lr": 2.0306941308736827e-05, "train_min_lr": 1.0153470654368414e-06, "train_loss": 0.16581662617869922, "train_loss_scale": 8192.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 8.712674590202424, "val_score": 62.18750035762787, "epoch": 22, "n_parameters": 676689114}