{"train_lr": 0.0001, "train_min_lr": 5e-06, "train_loss": 77.85034447181516, "train_loss_scale": 8991.219512195123, "train_weight_decay": 0.010000000000000005, "train_grad_norm": Infinity, "val_score": 4.31640625, "epoch": 0, "n_parameters": 223095770} {"train_lr": 0.00019983045158353352, "train_min_lr": 9.991522579176675e-06, "train_loss": 7.025817452407464, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 5.701524775202682, "val_score": 4.31640625, "epoch": 1, "n_parameters": 223095770} {"train_lr": 0.00019879013957041123, "train_min_lr": 9.939506978520558e-06, "train_loss": 5.642976144465004, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 2.488031654823117, "val_score": 4.19921875, "epoch": 2, "n_parameters": 223095770} {"train_lr": 0.00019670884435242454, "train_min_lr": 9.83544221762123e-06, "train_loss": 5.463096548871296, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 2.1924728591267657, "val_score": 4.7070313692092896, "epoch": 3, "n_parameters": 223095770} {"train_lr": 0.00019361096721305816, "train_min_lr": 9.680548360652908e-06, "train_loss": 5.386132426378204, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 2.1129612283008856, "val_score": 4.609375, "epoch": 4, "n_parameters": 223095770} {"train_lr": 0.00018953282792935505, "train_min_lr": 9.47664139646775e-06, "train_loss": 5.346672511682278, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 2.090851234226692, "val_score": 4.609375, "epoch": 5, "n_parameters": 223095770} {"train_lr": 0.00018452223895573826, "train_min_lr": 9.226111947786915e-06, "train_loss": 5.323095240244052, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 2.0887086304222664, "val_score": 4.609375, "epoch": 6, "n_parameters": 223095770} {"train_lr": 0.00017863794486669825, "train_min_lr": 8.931897243334915e-06, "train_loss": 5.30428313045967, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 2.097902989969021, "val_score": 4.609375, "epoch": 7, "n_parameters": 223095770} {"train_lr": 0.00017194893363036773, "train_min_lr": 8.597446681518385e-06, "train_loss": 5.275659572787401, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 2.14394467632945, "val_score": 5.87890625, "epoch": 8, "n_parameters": 223095770} {"train_lr": 0.00016453362778767129, "train_min_lr": 8.226681389383567e-06, "train_loss": 5.159589697675007, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 2.3277296961807625, "val_score": 6.30859375, "epoch": 9, "n_parameters": 223095770} {"train_lr": 0.00015647896501973577, "train_min_lr": 7.82394825098679e-06, "train_loss": 5.018248918579846, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 2.2596429673636833, "val_score": 6.40625, "epoch": 10, "n_parameters": 223095770} {"train_lr": 0.0001478793788830669, "train_min_lr": 7.39396894415334e-06, "train_loss": 4.9448066920768925, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 2.2446578682922738, "val_score": 6.8359373807907104, "epoch": 11, "n_parameters": 223095770} {"train_lr": 0.00013883569166244037, "train_min_lr": 6.941784583122018e-06, "train_loss": 4.890266302155285, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 2.2621670641550202, "val_score": 6.6210936307907104, "epoch": 12, "n_parameters": 223095770} {"train_lr": 0.00012945393232179604, "train_min_lr": 6.4726966160898044e-06, "train_loss": 4.80834550392337, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 2.395012840992067, "val_score": 8.63281238079071, "epoch": 13, "n_parameters": 223095770} {"train_lr": 0.00011984409341157866, "train_min_lr": 5.992204670578932e-06, "train_loss": 4.678725893904523, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 2.4546352479516007, "val_score": 9.062499761581421, "epoch": 14, "n_parameters": 223095770} {"train_lr": 0.00011011884150665089, "train_min_lr": 5.505942075332545e-06, "train_loss": 4.549415693050477, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 2.574625079224749, "val_score": 14.66796875, "epoch": 15, "n_parameters": 223095770} {"train_lr": 0.00010039219629371552, "train_min_lr": 5.019609814685776e-06, "train_loss": 4.42408505881705, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 2.648424317197102, "val_score": 17.324217796325684, "epoch": 16, "n_parameters": 223095770} {"train_lr": 9.077819379473764e-05, "train_min_lr": 4.538909689736882e-06, "train_loss": 4.28675083997773, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 2.838902002427636, "val_score": 23.339843273162842, "epoch": 17, "n_parameters": 223095770} {"train_lr": 8.138954939885138e-05, "train_min_lr": 4.069477469942571e-06, "train_loss": 4.113551750415709, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 3.0310123548275087, "val_score": 30.136717796325684, "epoch": 18, "n_parameters": 223095770} {"train_lr": 7.233633637747924e-05, "train_min_lr": 3.616816818873962e-06, "train_loss": 3.9277686781999543, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 3.188710282488567, "val_score": 32.32421875, "epoch": 19, "n_parameters": 223095770} {"train_lr": 6.372469537586505e-05, "train_min_lr": 3.186234768793252e-06, "train_loss": 3.7431207342845636, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 3.354506701957889, "val_score": 35.46875047683716, "epoch": 20, "n_parameters": 223095770} {"train_lr": 5.565559001105433e-05, "train_min_lr": 2.782779500552716e-06, "train_loss": 3.5962114683011683, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 3.5105015359273772, "val_score": 37.28515625, "epoch": 21, "n_parameters": 223095770} {"train_lr": 4.8223623165796115e-05, "train_min_lr": 2.4111811582898055e-06, "train_loss": 3.472690297336113, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 3.685645086009328, "val_score": 38.710936546325684, "epoch": 22, "n_parameters": 223095770} {"train_lr": 4.151592785623897e-05, "train_min_lr": 2.075796392811948e-06, "train_loss": 3.369144096607115, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 3.7349208622443966, "val_score": 38.671875, "epoch": 23, "n_parameters": 223095770} {"train_lr": 3.561114567698311e-05, "train_min_lr": 1.7805572838491561e-06, "train_loss": 3.28924276770615, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 3.8288840026390263, "val_score": 40.29296684265137, "epoch": 24, "n_parameters": 223095770} {"train_lr": 3.0578504800286517e-05, "train_min_lr": 1.5289252400143263e-06, "train_loss": 3.227319374317076, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 3.883898054681173, "val_score": 40.546875, "epoch": 25, "n_parameters": 223095770} {"train_lr": 2.647700833904102e-05, "train_min_lr": 1.3238504169520507e-06, "train_loss": 3.1698229661801967, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 3.947190912758432, "val_score": 41.386717796325684, "epoch": 26, "n_parameters": 223095770} {"train_lr": 2.3354742589220726e-05, "train_min_lr": 1.1677371294610364e-06, "train_loss": 3.1281202653559244, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 4.021333758423968, "val_score": 41.42578125, "epoch": 27, "n_parameters": 223095770} {"train_lr": 2.124831326202749e-05, "train_min_lr": 1.0624156631013745e-06, "train_loss": 3.089860200881958, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 4.192677852584095, "val_score": 41.93359375, "epoch": 28, "n_parameters": 223095770} {"train_lr": 2.0182416315395952e-05, "train_min_lr": 1.0091208157697977e-06, "train_loss": 3.0539176289628194, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000005, "train_grad_norm": 4.23136305809021, "val_score": 42.597655296325684, "epoch": 29, "n_parameters": 223095770}