{"train_lr": 9.999999999999999e-05, "train_min_lr": 5.000000000000001e-06, "train_loss": 26.182623874675762, "train_loss_scale": 4231.303303303303, "train_weight_decay": 0.009999999999999919, "train_grad_norm": Infinity, "val_score": 4.316406257450581, "epoch": 0, "n_parameters": 677020890} {"train_lr": 0.00019982486126720822, "train_min_lr": 9.991243063360407e-06, "train_loss": 4.968530958479231, "train_loss_scale": 4096.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 7.785102943042377, "val_score": 28.92578113079071, "epoch": 1, "n_parameters": 677020890} {"train_lr": 0.00019877333123240822, "train_min_lr": 9.938666561620405e-06, "train_loss": 3.0626874098906645, "train_loss_scale": 4096.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 10.118952039483789, "val_score": 43.749999940395355, "epoch": 2, "n_parameters": 677020890} {"train_lr": 0.00019668101505513922, "train_min_lr": 9.83405075275696e-06, "train_loss": 2.21171091913103, "train_loss_scale": 4096.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 12.776510444847313, "val_score": 53.16406178474426, "epoch": 3, "n_parameters": 677020890} {"train_lr": 0.0001935724432295562, "train_min_lr": 9.678622161477808e-06, "train_loss": 1.7926711445456152, "train_loss_scale": 4096.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 12.478762486317494, "val_score": 59.0429682135582, "epoch": 4, "n_parameters": 677020890} {"train_lr": 0.00018948406091812042, "train_min_lr": 9.474203045906028e-06, "train_loss": 1.4770364213634182, "train_loss_scale": 4096.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 14.36354748980777, "val_score": 59.49218738079071, "epoch": 5, "n_parameters": 677020890} {"train_lr": 0.00018446380066538962, "train_min_lr": 9.223190033269488e-06, "train_loss": 1.249427579723679, "train_loss_scale": 8130.4984984984985, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 14.833532452225327, "val_score": 62.10937440395355, "epoch": 6, "n_parameters": 677020890} {"train_lr": 0.0001785705204327593, "train_min_lr": 8.928526021637972e-06, "train_loss": 1.0643869607119232, "train_loss_scale": 8192.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 15.094122318176177, "val_score": 62.75390589237213, "epoch": 7, "n_parameters": 677020890} {"train_lr": 0.00017187331354267965, "train_min_lr": 8.593665677133979e-06, "train_loss": 0.9221940057592707, "train_loss_scale": 8192.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 14.639201391924608, "val_score": 60.95703113079071, "epoch": 8, "n_parameters": 677020890} {"train_lr": 0.00016445069862262214, "train_min_lr": 8.222534931131104e-06, "train_loss": 0.8159086400413657, "train_loss_scale": 8192.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 15.106565837745553, "val_score": 62.57812488079071, "epoch": 9, "n_parameters": 677020890} {"train_lr": 0.00015638969904596285, "train_min_lr": 7.81948495229814e-06, "train_loss": 0.7085787440921452, "train_loss_scale": 8192.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 15.28641129828788, "val_score": 61.09374964237213, "epoch": 10, "n_parameters": 677020890} {"train_lr": 0.00014778482266249588, "train_min_lr": 7.389241133124806e-06, "train_loss": 0.6360200635484747, "train_loss_scale": 8192.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 15.04913724721731, "val_score": 62.36328113079071, "epoch": 11, "n_parameters": 677020890} {"train_lr": 0.00013873695378030412, "train_min_lr": 6.936847689015204e-06, "train_loss": 0.5701365657933839, "train_loss_scale": 9840.24024024024, "train_weight_decay": 0.009999999999999919, "train_grad_norm": Infinity, "val_score": 61.99218666553497, "epoch": 12, "n_parameters": 677020890} {"train_lr": 0.0001293521703894856, "train_min_lr": 6.467608519474285e-06, "train_loss": 0.49803302868887467, "train_loss_scale": 8192.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 14.222424806417287, "val_score": 62.59765648841858, "epoch": 13, "n_parameters": 677020890} {"train_lr": 0.00011974050049470861, "train_min_lr": 5.987025024735426e-06, "train_loss": 0.44331464502546525, "train_loss_scale": 8192.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 14.169997569676992, "val_score": 62.63671863079071, "epoch": 14, "n_parameters": 677020890} {"train_lr": 0.00011001463213745562, "train_min_lr": 5.500731606872777e-06, "train_loss": 0.3969369358844585, "train_loss_scale": 8192.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 13.146547428480497, "val_score": 61.56250011920929, "epoch": 15, "n_parameters": 677020890} {"train_lr": 0.00010028859223176908, "train_min_lr": 5.014429611588457e-06, "train_loss": 0.3482672312819922, "train_loss_scale": 8192.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 12.62019040491488, "val_score": 62.07031309604645, "epoch": 16, "n_parameters": 677020890} {"train_lr": 9.06764097029405e-05, "train_min_lr": 4.533820485147025e-06, "train_loss": 0.32557909422226855, "train_loss_scale": 8192.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 13.185535986502249, "val_score": 62.38281178474426, "epoch": 17, "n_parameters": 677020890} {"train_lr": 8.129077860261774e-05, "train_min_lr": 4.064538930130887e-06, "train_loss": 0.2988820619679786, "train_loss_scale": 14514.354354354355, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 11.447971378360783, "val_score": 61.23046803474426, "epoch": 18, "n_parameters": 677020890} {"train_lr": 7.224173687408786e-05, "train_min_lr": 3.612086843704389e-06, "train_loss": 0.27654498768550856, "train_loss_scale": 16384.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 11.389693122726303, "val_score": 61.26953065395355, "epoch": 19, "n_parameters": 677020890} {"train_lr": 6.36353762580001e-05, "train_min_lr": 3.181768812900003e-06, "train_loss": 0.25095447398968285, "train_loss_scale": 16384.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 10.429948024205617, "val_score": 61.523436427116394, "epoch": 20, "n_parameters": 677020890} {"train_lr": 5.557259846370749e-05, "train_min_lr": 2.7786299231853746e-06, "train_loss": 0.23496153250381396, "train_loss_scale": 16384.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 10.62993753672362, "val_score": 62.285155057907104, "epoch": 21, "n_parameters": 677020890} {"train_lr": 4.81479321889802e-05, "train_min_lr": 2.4073966094490112e-06, "train_loss": 0.22002185065601323, "train_loss_scale": 16384.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 10.160439169084704, "val_score": 61.38671815395355, "epoch": 22, "n_parameters": 677020890} {"train_lr": 4.14484248574522e-05, "train_min_lr": 2.0724212428726083e-06, "train_loss": 0.21307115947027822, "train_loss_scale": 16384.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 11.101758199411112, "val_score": 61.679686427116394, "epoch": 23, "n_parameters": 677020890} {"train_lr": 3.55526220671677e-05, "train_min_lr": 1.7776311033583843e-06, "train_loss": 0.19930720541279418, "train_loss_scale": 20713.705705705706, "train_weight_decay": 0.009999999999999919, "train_grad_norm": NaN, "val_score": 62.34374916553497, "epoch": 24, "n_parameters": 677020890} {"train_lr": 3.052964671525884e-05, "train_min_lr": 1.5264823357629409e-06, "train_loss": 0.19287315460744206, "train_loss_scale": 16384.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 9.257866463145694, "val_score": 62.16796839237213, "epoch": 25, "n_parameters": 677020890} {"train_lr": 2.6438388595176714e-05, "train_min_lr": 1.321919429758834e-06, "train_loss": 0.1969604425232958, "train_loss_scale": 16384.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 9.523305104122505, "val_score": 62.42187452316284, "epoch": 26, "n_parameters": 677020890} {"train_lr": 2.3326813967706174e-05, "train_min_lr": 1.1663406983853087e-06, "train_loss": 0.187447168184696, "train_loss_scale": 16384.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 9.592776701615021, "val_score": 61.56249952316284, "epoch": 27, "n_parameters": 677020890} {"train_lr": 2.1231403200414615e-05, "train_min_lr": 1.0615701600207302e-06, "train_loss": 0.17364879642185327, "train_loss_scale": 16384.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 9.058554746367195, "val_score": 61.933592677116394, "epoch": 28, "n_parameters": 677020890} {"train_lr": 2.0176723068696133e-05, "train_min_lr": 1.008836153434806e-06, "train_loss": 0.17385395037922058, "train_loss_scale": 16384.0, "train_weight_decay": 0.009999999999999919, "train_grad_norm": 8.664375653317025, "val_score": 62.18749952316284, "epoch": 29, "n_parameters": 677020890}