{"train_lr": 9.999999999999996e-05, "train_min_lr": 5e-06, "train_loss": 41.42953062631998, "train_loss_scale": 8488.096385542169, "train_weight_decay": 0.010000000000000007, "train_grad_norm": Infinity, "val_score": 4.316406264901161, "epoch": 0, "n_parameters": 223387610} {"train_lr": 0.00019982565581158298, "train_min_lr": 9.99128279057915e-06, "train_loss": 5.435071330472647, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 4.401134400482637, "val_score": 6.62109375, "epoch": 1, "n_parameters": 223387610} {"train_lr": 0.00019877571034157302, "train_min_lr": 9.93878551707865e-06, "train_loss": 5.104092259004892, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 4.513412854757654, "val_score": 6.71875, "epoch": 2, "n_parameters": 223387610} {"train_lr": 0.00019668495083621437, "train_min_lr": 9.834247541810718e-06, "train_loss": 4.553876282220863, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 5.020111019352832, "val_score": 26.87500035762787, "epoch": 3, "n_parameters": 223387610} {"train_lr": 0.00019357788953910728, "train_min_lr": 9.678894476955367e-06, "train_loss": 3.537763997732875, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 6.444521786218666, "val_score": 38.26171863079071, "epoch": 4, "n_parameters": 223387610} {"train_lr": 0.00018949095390314753, "train_min_lr": 9.474547695157376e-06, "train_loss": 2.908365284103945, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 8.018994411790228, "val_score": 42.44140625, "epoch": 5, "n_parameters": 223387610} {"train_lr": 0.0001844720595119453, "train_min_lr": 9.223602975597268e-06, "train_loss": 2.5526550735335753, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 9.366189505680499, "val_score": 47.441407442092896, "epoch": 6, "n_parameters": 223387610} {"train_lr": 0.00017858004831341904, "train_min_lr": 8.929002415670954e-06, "train_loss": 2.236787036240819, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 10.639315096728772, "val_score": 53.14453101158142, "epoch": 7, "n_parameters": 223387610} {"train_lr": 0.0001718839987517542, "train_min_lr": 8.59419993758771e-06, "train_loss": 1.9938740241958435, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 11.461752503751272, "val_score": 55.42968797683716, "epoch": 8, "n_parameters": 223387610} {"train_lr": 0.00016446241588580443, "train_min_lr": 8.223120794290222e-06, "train_loss": 1.7935115177947354, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 12.54727828933532, "val_score": 55.52734375, "epoch": 9, "n_parameters": 223387610} {"train_lr": 0.00015640231098905548, "train_min_lr": 7.820115549452776e-06, "train_loss": 1.6551586016114936, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 13.545576968825007, "val_score": 58.339844703674316, "epoch": 10, "n_parameters": 223387610} {"train_lr": 0.00014779818142199747, "train_min_lr": 7.389909071099871e-06, "train_loss": 1.5137181957084012, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 14.02851342005902, "val_score": 57.5, "epoch": 11, "n_parameters": 223387610} {"train_lr": 0.0001387509027369731, "train_min_lr": 6.937545136848659e-06, "train_loss": 1.400743959538908, "train_loss_scale": 15791.807228915663, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 14.584117090845682, "val_score": 58.88671922683716, "epoch": 12, "n_parameters": 223387610} {"train_lr": 0.00012936654600455906, "train_min_lr": 6.468327300227951e-06, "train_loss": 1.3017923268209022, "train_loss_scale": 16384.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 14.933083114853824, "val_score": 59.64843821525574, "epoch": 13, "n_parameters": 223387610} {"train_lr": 0.0001197551342272433, "train_min_lr": 5.987756711362163e-06, "train_loss": 1.2224243645926556, "train_loss_scale": 16384.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 15.135863947581095, "val_score": 58.96484446525574, "epoch": 14, "n_parameters": 223387610} {"train_lr": 0.00011002935242031735, "train_min_lr": 5.50146762101587e-06, "train_loss": 1.151152405394129, "train_loss_scale": 16384.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 15.676761408886277, "val_score": 59.37499976158142, "epoch": 15, "n_parameters": 223387610} {"train_lr": 0.00010030322648310045, "train_min_lr": 5.015161324155024e-06, "train_loss": 1.0652403300067028, "train_loss_scale": 16384.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 15.666179151420133, "val_score": 60.44921898841858, "epoch": 16, "n_parameters": 223387610} {"train_lr": 9.069078634952463e-05, "train_min_lr": 4.534539317476229e-06, "train_loss": 1.0001962457794742, "train_loss_scale": 10314.024096385541, "train_weight_decay": 0.010000000000000007, "train_grad_norm": NaN, "val_score": 59.31640553474426, "epoch": 17, "n_parameters": 223387610} {"train_lr": 8.130472909141817e-05, "train_min_lr": 4.06523645457091e-06, "train_loss": 0.9675739770194134, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 16.340348496494524, "val_score": 59.570313453674316, "epoch": 18, "n_parameters": 223387610} {"train_lr": 7.225509764837844e-05, "train_min_lr": 3.6127548824189226e-06, "train_loss": 0.918909461742424, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 16.528942705637, "val_score": 59.511717557907104, "epoch": 19, "n_parameters": 223387610} {"train_lr": 6.36479906749182e-05, "train_min_lr": 3.1823995337459088e-06, "train_loss": 0.8700280647320919, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 16.649569586098913, "val_score": 60.546876192092896, "epoch": 20, "n_parameters": 223387610} {"train_lr": 5.5584318630748205e-05, "train_min_lr": 2.7792159315374105e-06, "train_loss": 0.8370450770998575, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 16.26901368060744, "val_score": 60.52734327316284, "epoch": 21, "n_parameters": 223387610} {"train_lr": 4.8158620697900774e-05, "train_min_lr": 2.40793103489504e-06, "train_loss": 0.8006192583994693, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 16.439209128000652, "val_score": 60.585936069488525, "epoch": 22, "n_parameters": 223387610} {"train_lr": 4.1457956395258196e-05, "train_min_lr": 2.07289781976291e-06, "train_loss": 0.768808602748147, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 16.57604116416839, "val_score": 60.41015601158142, "epoch": 23, "n_parameters": 223387610} {"train_lr": 3.556088488529306e-05, "train_min_lr": 1.7780442442646535e-06, "train_loss": 0.7472374739058046, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 16.658628952072327, "val_score": 60.5078125, "epoch": 24, "n_parameters": 223387610} {"train_lr": 3.0536543939715874e-05, "train_min_lr": 1.5268271969857936e-06, "train_loss": 0.7228963184787567, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 16.68775792294238, "val_score": 60.29296827316284, "epoch": 25, "n_parameters": 223387610} {"train_lr": 2.644383936231479e-05, "train_min_lr": 1.3221919681157395e-06, "train_loss": 0.7066218414938593, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 17.135527156921754, "val_score": 61.19140625, "epoch": 26, "n_parameters": 223387610} {"train_lr": 2.333075437226435e-05, "train_min_lr": 1.1665377186132175e-06, "train_loss": 0.7012411246457732, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 16.7521299224302, "val_score": 61.09375, "epoch": 27, "n_parameters": 223387610} {"train_lr": 2.1233787044752136e-05, "train_min_lr": 1.0616893522376066e-06, "train_loss": 0.6835373790867357, "train_loss_scale": 8192.0, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 16.50884308872453, "val_score": 59.37500071525574, "epoch": 28, "n_parameters": 223387610} {"train_lr": 2.0177522404417735e-05, "train_min_lr": 1.008876120220887e-06, "train_loss": 0.6717967215072678, "train_loss_scale": 13867.180722891566, "train_weight_decay": 0.010000000000000007, "train_grad_norm": 16.787567178887056, "val_score": 59.74609422683716, "epoch": 29, "n_parameters": 223387610}