{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 4130, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.00847457627118644, "grad_norm": 12.236435102750375, "learning_rate": 3.8740920096852305e-07, "loss": 0.8295, "loss_nan_ranks": 0, "loss_rank_avg": 0.2684570252895355, "step": 5, "valid_targets_mean": 4368.4, "valid_targets_min": 2939 }, { "epoch": 0.01694915254237288, "grad_norm": 10.058309821274516, "learning_rate": 8.716707021791768e-07, "loss": 0.8055, "loss_nan_ranks": 0, "loss_rank_avg": 0.5616639852523804, "step": 10, "valid_targets_mean": 9545.8, "valid_targets_min": 4547 }, { "epoch": 0.025423728813559324, "grad_norm": 8.52945178256474, "learning_rate": 1.3559322033898307e-06, "loss": 0.7631, "loss_nan_ranks": 0, "loss_rank_avg": 0.4021530747413635, "step": 15, "valid_targets_mean": 9586.9, "valid_targets_min": 5112 }, { "epoch": 0.03389830508474576, "grad_norm": 5.980922520646845, "learning_rate": 1.8401937046004845e-06, "loss": 0.7736, "loss_nan_ranks": 0, "loss_rank_avg": 0.41938316822052, "step": 20, "valid_targets_mean": 8228.5, "valid_targets_min": 3550 }, { "epoch": 0.0423728813559322, "grad_norm": 3.7984612636995125, "learning_rate": 2.324455205811138e-06, "loss": 0.7283, "loss_nan_ranks": 0, "loss_rank_avg": 0.4073244035243988, "step": 25, "valid_targets_mean": 10135.8, "valid_targets_min": 4168 }, { "epoch": 0.05084745762711865, "grad_norm": 2.94113455953092, "learning_rate": 2.808716707021792e-06, "loss": 0.7287, "loss_nan_ranks": 0, "loss_rank_avg": 0.3122481405735016, "step": 30, "valid_targets_mean": 8561.0, "valid_targets_min": 3843 }, { "epoch": 0.059322033898305086, "grad_norm": 2.719124371329246, "learning_rate": 3.2929782082324455e-06, "loss": 0.7333, "loss_nan_ranks": 0, "loss_rank_avg": 0.31176847219467163, "step": 35, "valid_targets_mean": 5976.4, "valid_targets_min": 3033 }, { "epoch": 0.06779661016949153, "grad_norm": 1.8367152849661372, "learning_rate": 3.7772397094430994e-06, "loss": 0.6223, "loss_nan_ranks": 0, "loss_rank_avg": 0.3117915391921997, "step": 40, "valid_targets_mean": 6918.5, "valid_targets_min": 3257 }, { "epoch": 0.07627118644067797, "grad_norm": 1.202874459401654, "learning_rate": 4.261501210653753e-06, "loss": 0.6556, "loss_nan_ranks": 0, "loss_rank_avg": 0.36333340406417847, "step": 45, "valid_targets_mean": 9124.4, "valid_targets_min": 2913 }, { "epoch": 0.0847457627118644, "grad_norm": 1.0786502836699934, "learning_rate": 4.745762711864408e-06, "loss": 0.5957, "loss_nan_ranks": 0, "loss_rank_avg": 0.32077574729919434, "step": 50, "valid_targets_mean": 9160.0, "valid_targets_min": 4550 }, { "epoch": 0.09322033898305085, "grad_norm": 0.9850973794351479, "learning_rate": 5.230024213075061e-06, "loss": 0.5574, "loss_nan_ranks": 0, "loss_rank_avg": 0.28348320722579956, "step": 55, "valid_targets_mean": 7648.8, "valid_targets_min": 2230 }, { "epoch": 0.1016949152542373, "grad_norm": 0.9506271905194752, "learning_rate": 5.7142857142857145e-06, "loss": 0.5513, "loss_nan_ranks": 0, "loss_rank_avg": 0.35213959217071533, "step": 60, "valid_targets_mean": 9959.1, "valid_targets_min": 6620 }, { "epoch": 0.11016949152542373, "grad_norm": 0.7568590634359315, "learning_rate": 6.198547215496369e-06, "loss": 0.5441, "loss_nan_ranks": 0, "loss_rank_avg": 0.32353514432907104, "step": 65, "valid_targets_mean": 8611.0, "valid_targets_min": 3485 }, { "epoch": 0.11864406779661017, "grad_norm": 0.8003434826466195, "learning_rate": 6.682808716707022e-06, "loss": 0.5294, "loss_nan_ranks": 0, "loss_rank_avg": 0.2963908612728119, "step": 70, "valid_targets_mean": 8577.6, "valid_targets_min": 4103 }, { "epoch": 0.1271186440677966, "grad_norm": 0.6819382378620414, "learning_rate": 7.1670702179176766e-06, "loss": 0.5266, "loss_nan_ranks": 0, "loss_rank_avg": 0.29446882009506226, "step": 75, "valid_targets_mean": 9525.9, "valid_targets_min": 2096 }, { "epoch": 0.13559322033898305, "grad_norm": 0.5426614937193089, "learning_rate": 7.65133171912833e-06, "loss": 0.4912, "loss_nan_ranks": 0, "loss_rank_avg": 0.1997358202934265, "step": 80, "valid_targets_mean": 6563.4, "valid_targets_min": 2943 }, { "epoch": 0.1440677966101695, "grad_norm": 0.5948300852884347, "learning_rate": 8.135593220338983e-06, "loss": 0.5251, "loss_nan_ranks": 0, "loss_rank_avg": 0.4521056115627289, "step": 85, "valid_targets_mean": 12116.9, "valid_targets_min": 3622 }, { "epoch": 0.15254237288135594, "grad_norm": 0.49709515079932287, "learning_rate": 8.619854721549637e-06, "loss": 0.5206, "loss_nan_ranks": 0, "loss_rank_avg": 0.284382164478302, "step": 90, "valid_targets_mean": 8606.2, "valid_targets_min": 3501 }, { "epoch": 0.16101694915254236, "grad_norm": 0.4713133451299385, "learning_rate": 9.10411622276029e-06, "loss": 0.474, "loss_nan_ranks": 0, "loss_rank_avg": 0.15513190627098083, "step": 95, "valid_targets_mean": 6271.8, "valid_targets_min": 3023 }, { "epoch": 0.1694915254237288, "grad_norm": 0.4457304349817586, "learning_rate": 9.588377723970946e-06, "loss": 0.4661, "loss_nan_ranks": 0, "loss_rank_avg": 0.2053360641002655, "step": 100, "valid_targets_mean": 7486.0, "valid_targets_min": 3465 }, { "epoch": 0.17796610169491525, "grad_norm": 0.44154277874061937, "learning_rate": 1.0072639225181599e-05, "loss": 0.4511, "loss_nan_ranks": 0, "loss_rank_avg": 0.20671820640563965, "step": 105, "valid_targets_mean": 6911.2, "valid_targets_min": 2853 }, { "epoch": 0.1864406779661017, "grad_norm": 0.48622015880781266, "learning_rate": 1.0556900726392252e-05, "loss": 0.4333, "loss_nan_ranks": 0, "loss_rank_avg": 0.292965292930603, "step": 110, "valid_targets_mean": 8936.8, "valid_targets_min": 1718 }, { "epoch": 0.19491525423728814, "grad_norm": 0.4945674916588067, "learning_rate": 1.1041162227602906e-05, "loss": 0.46, "loss_nan_ranks": 0, "loss_rank_avg": 0.15357142686843872, "step": 115, "valid_targets_mean": 6594.0, "valid_targets_min": 1819 }, { "epoch": 0.2033898305084746, "grad_norm": 0.5260662505419903, "learning_rate": 1.1525423728813561e-05, "loss": 0.4256, "loss_nan_ranks": 0, "loss_rank_avg": 0.2100408673286438, "step": 120, "valid_targets_mean": 6844.6, "valid_targets_min": 2819 }, { "epoch": 0.211864406779661, "grad_norm": 0.4859160469605518, "learning_rate": 1.2009685230024215e-05, "loss": 0.4549, "loss_nan_ranks": 0, "loss_rank_avg": 0.29052165150642395, "step": 125, "valid_targets_mean": 9443.6, "valid_targets_min": 2351 }, { "epoch": 0.22033898305084745, "grad_norm": 0.4887408500988149, "learning_rate": 1.2493946731234868e-05, "loss": 0.4533, "loss_nan_ranks": 0, "loss_rank_avg": 0.32517391443252563, "step": 130, "valid_targets_mean": 9598.9, "valid_targets_min": 3221 }, { "epoch": 0.2288135593220339, "grad_norm": 0.44709723187595857, "learning_rate": 1.2978208232445521e-05, "loss": 0.4038, "loss_nan_ranks": 0, "loss_rank_avg": 0.22177180647850037, "step": 135, "valid_targets_mean": 7938.1, "valid_targets_min": 1772 }, { "epoch": 0.23728813559322035, "grad_norm": 0.47189922671995305, "learning_rate": 1.3462469733656177e-05, "loss": 0.4447, "loss_nan_ranks": 0, "loss_rank_avg": 0.19433565437793732, "step": 140, "valid_targets_mean": 7033.0, "valid_targets_min": 3731 }, { "epoch": 0.2457627118644068, "grad_norm": 0.7896370250308062, "learning_rate": 1.3946731234866828e-05, "loss": 0.4819, "loss_nan_ranks": 0, "loss_rank_avg": 0.25007662177085876, "step": 145, "valid_targets_mean": 7750.5, "valid_targets_min": 3290 }, { "epoch": 0.2542372881355932, "grad_norm": 1.167473809507481, "learning_rate": 1.4430992736077482e-05, "loss": 0.3776, "loss_nan_ranks": 0, "loss_rank_avg": 0.19537419080734253, "step": 150, "valid_targets_mean": 7780.4, "valid_targets_min": 2228 }, { "epoch": 0.2627118644067797, "grad_norm": 0.4604199039648987, "learning_rate": 1.4915254237288137e-05, "loss": 0.4206, "loss_nan_ranks": 0, "loss_rank_avg": 0.20237131416797638, "step": 155, "valid_targets_mean": 6237.5, "valid_targets_min": 2797 }, { "epoch": 0.2711864406779661, "grad_norm": 1.2851421474093927, "learning_rate": 1.5399515738498792e-05, "loss": 0.3927, "loss_nan_ranks": 0, "loss_rank_avg": 0.1901024878025055, "step": 160, "valid_targets_mean": 7075.9, "valid_targets_min": 3662 }, { "epoch": 0.2796610169491525, "grad_norm": 0.4580396609863836, "learning_rate": 1.5883777239709442e-05, "loss": 0.3924, "loss_nan_ranks": 0, "loss_rank_avg": 0.146134614944458, "step": 165, "valid_targets_mean": 7100.8, "valid_targets_min": 3506 }, { "epoch": 0.288135593220339, "grad_norm": 0.4849064596017498, "learning_rate": 1.63680387409201e-05, "loss": 0.4289, "loss_nan_ranks": 0, "loss_rank_avg": 0.18006592988967896, "step": 170, "valid_targets_mean": 8865.8, "valid_targets_min": 3261 }, { "epoch": 0.2966101694915254, "grad_norm": 0.4697056355654206, "learning_rate": 1.6852300242130752e-05, "loss": 0.3988, "loss_nan_ranks": 0, "loss_rank_avg": 0.23008233308792114, "step": 175, "valid_targets_mean": 8906.1, "valid_targets_min": 3874 }, { "epoch": 0.3050847457627119, "grad_norm": 0.4186025820722969, "learning_rate": 1.7336561743341406e-05, "loss": 0.4076, "loss_nan_ranks": 0, "loss_rank_avg": 0.21983414888381958, "step": 180, "valid_targets_mean": 9217.2, "valid_targets_min": 4157 }, { "epoch": 0.3135593220338983, "grad_norm": 0.4880177558476617, "learning_rate": 1.782082324455206e-05, "loss": 0.408, "loss_nan_ranks": 0, "loss_rank_avg": 0.20033296942710876, "step": 185, "valid_targets_mean": 8644.5, "valid_targets_min": 5639 }, { "epoch": 0.3220338983050847, "grad_norm": 0.506835537780777, "learning_rate": 1.8305084745762713e-05, "loss": 0.4345, "loss_nan_ranks": 0, "loss_rank_avg": 0.15411603450775146, "step": 190, "valid_targets_mean": 5940.5, "valid_targets_min": 2975 }, { "epoch": 0.3305084745762712, "grad_norm": 0.5175806823084516, "learning_rate": 1.8789346246973366e-05, "loss": 0.3823, "loss_nan_ranks": 0, "loss_rank_avg": 0.22352342307567596, "step": 195, "valid_targets_mean": 6518.9, "valid_targets_min": 1922 }, { "epoch": 0.3389830508474576, "grad_norm": 0.39209882371312016, "learning_rate": 1.927360774818402e-05, "loss": 0.4033, "loss_nan_ranks": 0, "loss_rank_avg": 0.23113977909088135, "step": 200, "valid_targets_mean": 11211.2, "valid_targets_min": 5692 }, { "epoch": 0.3474576271186441, "grad_norm": 0.5642312831981638, "learning_rate": 1.9757869249394673e-05, "loss": 0.4274, "loss_nan_ranks": 0, "loss_rank_avg": 0.29515933990478516, "step": 205, "valid_targets_mean": 12401.2, "valid_targets_min": 5602 }, { "epoch": 0.3559322033898305, "grad_norm": 0.4694784872364969, "learning_rate": 2.0242130750605327e-05, "loss": 0.3671, "loss_nan_ranks": 0, "loss_rank_avg": 0.22254446148872375, "step": 210, "valid_targets_mean": 9149.9, "valid_targets_min": 3145 }, { "epoch": 0.3644067796610169, "grad_norm": 0.4729181140659464, "learning_rate": 2.072639225181598e-05, "loss": 0.3811, "loss_nan_ranks": 0, "loss_rank_avg": 0.1420256644487381, "step": 215, "valid_targets_mean": 6157.2, "valid_targets_min": 2493 }, { "epoch": 0.3728813559322034, "grad_norm": 0.48751693402766566, "learning_rate": 2.1210653753026637e-05, "loss": 0.3637, "loss_nan_ranks": 0, "loss_rank_avg": 0.30695676803588867, "step": 220, "valid_targets_mean": 10364.8, "valid_targets_min": 4940 }, { "epoch": 0.3813559322033898, "grad_norm": 0.4492368775328314, "learning_rate": 2.169491525423729e-05, "loss": 0.392, "loss_nan_ranks": 0, "loss_rank_avg": 0.1817527413368225, "step": 225, "valid_targets_mean": 8587.1, "valid_targets_min": 6431 }, { "epoch": 0.3898305084745763, "grad_norm": 0.5264407991637193, "learning_rate": 2.2179176755447944e-05, "loss": 0.3598, "loss_nan_ranks": 0, "loss_rank_avg": 0.144405335187912, "step": 230, "valid_targets_mean": 6391.9, "valid_targets_min": 2800 }, { "epoch": 0.3983050847457627, "grad_norm": 0.44859050212635043, "learning_rate": 2.2663438256658597e-05, "loss": 0.4306, "loss_nan_ranks": 0, "loss_rank_avg": 0.12371104955673218, "step": 235, "valid_targets_mean": 6035.9, "valid_targets_min": 2422 }, { "epoch": 0.4067796610169492, "grad_norm": 0.4487952241314178, "learning_rate": 2.3147699757869254e-05, "loss": 0.3496, "loss_nan_ranks": 0, "loss_rank_avg": 0.15325893461704254, "step": 240, "valid_targets_mean": 7694.0, "valid_targets_min": 2322 }, { "epoch": 0.4152542372881356, "grad_norm": 0.5180958481856792, "learning_rate": 2.3631961259079904e-05, "loss": 0.3907, "loss_nan_ranks": 0, "loss_rank_avg": 0.20144130289554596, "step": 245, "valid_targets_mean": 6840.8, "valid_targets_min": 2925 }, { "epoch": 0.423728813559322, "grad_norm": 0.4491176387970824, "learning_rate": 2.4116222760290558e-05, "loss": 0.3935, "loss_nan_ranks": 0, "loss_rank_avg": 0.20885750651359558, "step": 250, "valid_targets_mean": 8512.1, "valid_targets_min": 2493 }, { "epoch": 0.4322033898305085, "grad_norm": 0.4628691361446054, "learning_rate": 2.460048426150121e-05, "loss": 0.3732, "loss_nan_ranks": 0, "loss_rank_avg": 0.18055710196495056, "step": 255, "valid_targets_mean": 7962.2, "valid_targets_min": 3404 }, { "epoch": 0.4406779661016949, "grad_norm": 0.4696155991888429, "learning_rate": 2.5084745762711865e-05, "loss": 0.3845, "loss_nan_ranks": 0, "loss_rank_avg": 0.2186737358570099, "step": 260, "valid_targets_mean": 8228.9, "valid_targets_min": 4428 }, { "epoch": 0.4491525423728814, "grad_norm": 0.4797313441924088, "learning_rate": 2.556900726392252e-05, "loss": 0.3806, "loss_nan_ranks": 0, "loss_rank_avg": 0.18754912912845612, "step": 265, "valid_targets_mean": 8026.2, "valid_targets_min": 2632 }, { "epoch": 0.4576271186440678, "grad_norm": 0.500792419812694, "learning_rate": 2.6053268765133175e-05, "loss": 0.3691, "loss_nan_ranks": 0, "loss_rank_avg": 0.14188027381896973, "step": 270, "valid_targets_mean": 6896.5, "valid_targets_min": 2844 }, { "epoch": 0.4661016949152542, "grad_norm": 0.5194573027568329, "learning_rate": 2.653753026634383e-05, "loss": 0.4269, "loss_nan_ranks": 0, "loss_rank_avg": 0.25647997856140137, "step": 275, "valid_targets_mean": 10153.5, "valid_targets_min": 2859 }, { "epoch": 0.4745762711864407, "grad_norm": 0.4835165912338022, "learning_rate": 2.702179176755448e-05, "loss": 0.4008, "loss_nan_ranks": 0, "loss_rank_avg": 0.2677648067474365, "step": 280, "valid_targets_mean": 10436.8, "valid_targets_min": 2643 }, { "epoch": 0.4830508474576271, "grad_norm": 0.4697980137297522, "learning_rate": 2.7506053268765135e-05, "loss": 0.3844, "loss_nan_ranks": 0, "loss_rank_avg": 0.23836316168308258, "step": 285, "valid_targets_mean": 9596.2, "valid_targets_min": 4758 }, { "epoch": 0.4915254237288136, "grad_norm": 0.7658555007951203, "learning_rate": 2.799031476997579e-05, "loss": 0.389, "loss_nan_ranks": 0, "loss_rank_avg": 0.1868828684091568, "step": 290, "valid_targets_mean": 7418.0, "valid_targets_min": 2145 }, { "epoch": 0.5, "grad_norm": 0.47702422177750037, "learning_rate": 2.8474576271186442e-05, "loss": 0.3657, "loss_nan_ranks": 0, "loss_rank_avg": 0.20087997615337372, "step": 295, "valid_targets_mean": 7950.9, "valid_targets_min": 1969 }, { "epoch": 0.5084745762711864, "grad_norm": 0.46273864653365726, "learning_rate": 2.8958837772397096e-05, "loss": 0.3648, "loss_nan_ranks": 0, "loss_rank_avg": 0.1638944149017334, "step": 300, "valid_targets_mean": 7513.8, "valid_targets_min": 1750 }, { "epoch": 0.5169491525423728, "grad_norm": 0.47460686381697653, "learning_rate": 2.9443099273607753e-05, "loss": 0.3583, "loss_nan_ranks": 0, "loss_rank_avg": 0.22977076470851898, "step": 305, "valid_targets_mean": 10273.2, "valid_targets_min": 6552 }, { "epoch": 0.5254237288135594, "grad_norm": 0.5179070401819209, "learning_rate": 2.9927360774818406e-05, "loss": 0.3636, "loss_nan_ranks": 0, "loss_rank_avg": 0.1554882526397705, "step": 310, "valid_targets_mean": 6126.1, "valid_targets_min": 2357 }, { "epoch": 0.5338983050847458, "grad_norm": 0.4667464306864076, "learning_rate": 3.041162227602906e-05, "loss": 0.3599, "loss_nan_ranks": 0, "loss_rank_avg": 0.14054939150810242, "step": 315, "valid_targets_mean": 7663.6, "valid_targets_min": 5239 }, { "epoch": 0.5423728813559322, "grad_norm": 0.4781556906105198, "learning_rate": 3.089588377723971e-05, "loss": 0.3804, "loss_nan_ranks": 0, "loss_rank_avg": 0.19416019320487976, "step": 320, "valid_targets_mean": 7567.8, "valid_targets_min": 1645 }, { "epoch": 0.5508474576271186, "grad_norm": 0.511629903592572, "learning_rate": 3.138014527845036e-05, "loss": 0.357, "loss_nan_ranks": 0, "loss_rank_avg": 0.12012749165296555, "step": 325, "valid_targets_mean": 5964.8, "valid_targets_min": 4470 }, { "epoch": 0.559322033898305, "grad_norm": 0.4480119776210039, "learning_rate": 3.186440677966102e-05, "loss": 0.3552, "loss_nan_ranks": 0, "loss_rank_avg": 0.162928506731987, "step": 330, "valid_targets_mean": 7623.0, "valid_targets_min": 2591 }, { "epoch": 0.5677966101694916, "grad_norm": 0.4937825533870499, "learning_rate": 3.234866828087168e-05, "loss": 0.3694, "loss_nan_ranks": 0, "loss_rank_avg": 0.19250673055648804, "step": 335, "valid_targets_mean": 8913.8, "valid_targets_min": 2840 }, { "epoch": 0.576271186440678, "grad_norm": 0.4878075980066041, "learning_rate": 3.283292978208233e-05, "loss": 0.3802, "loss_nan_ranks": 0, "loss_rank_avg": 0.16013866662979126, "step": 340, "valid_targets_mean": 6744.0, "valid_targets_min": 1682 }, { "epoch": 0.5847457627118644, "grad_norm": 0.45319045459430685, "learning_rate": 3.3317191283292984e-05, "loss": 0.3863, "loss_nan_ranks": 0, "loss_rank_avg": 0.14388547837734222, "step": 345, "valid_targets_mean": 7284.5, "valid_targets_min": 1990 }, { "epoch": 0.5932203389830508, "grad_norm": 0.47236199339171486, "learning_rate": 3.3801452784503634e-05, "loss": 0.3804, "loss_nan_ranks": 0, "loss_rank_avg": 0.231609508395195, "step": 350, "valid_targets_mean": 9248.5, "valid_targets_min": 2566 }, { "epoch": 0.6016949152542372, "grad_norm": 0.5119661968795367, "learning_rate": 3.4285714285714284e-05, "loss": 0.3726, "loss_nan_ranks": 0, "loss_rank_avg": 0.21987944841384888, "step": 355, "valid_targets_mean": 8192.4, "valid_targets_min": 2871 }, { "epoch": 0.6101694915254238, "grad_norm": 0.42304412282644255, "learning_rate": 3.476997578692494e-05, "loss": 0.3661, "loss_nan_ranks": 0, "loss_rank_avg": 0.13173159956932068, "step": 360, "valid_targets_mean": 8175.8, "valid_targets_min": 5029 }, { "epoch": 0.6186440677966102, "grad_norm": 0.47803298114996845, "learning_rate": 3.52542372881356e-05, "loss": 0.3882, "loss_nan_ranks": 0, "loss_rank_avg": 0.14908023178577423, "step": 365, "valid_targets_mean": 6414.9, "valid_targets_min": 3910 }, { "epoch": 0.6271186440677966, "grad_norm": 0.4881529791768924, "learning_rate": 3.573849878934625e-05, "loss": 0.3723, "loss_nan_ranks": 0, "loss_rank_avg": 0.16491301357746124, "step": 370, "valid_targets_mean": 7414.9, "valid_targets_min": 2965 }, { "epoch": 0.635593220338983, "grad_norm": 0.5108906486160846, "learning_rate": 3.6222760290556904e-05, "loss": 0.3844, "loss_nan_ranks": 0, "loss_rank_avg": 0.22124037146568298, "step": 375, "valid_targets_mean": 7832.9, "valid_targets_min": 2970 }, { "epoch": 0.6440677966101694, "grad_norm": 0.5139550621670309, "learning_rate": 3.670702179176756e-05, "loss": 0.3794, "loss_nan_ranks": 0, "loss_rank_avg": 0.24905268847942352, "step": 380, "valid_targets_mean": 8240.8, "valid_targets_min": 5678 }, { "epoch": 0.652542372881356, "grad_norm": 0.4939392728062636, "learning_rate": 3.719128329297821e-05, "loss": 0.398, "loss_nan_ranks": 0, "loss_rank_avg": 0.1989961713552475, "step": 385, "valid_targets_mean": 9710.9, "valid_targets_min": 4394 }, { "epoch": 0.6610169491525424, "grad_norm": 0.47183364711246323, "learning_rate": 3.767554479418886e-05, "loss": 0.3727, "loss_nan_ranks": 0, "loss_rank_avg": 0.17190328240394592, "step": 390, "valid_targets_mean": 7330.9, "valid_targets_min": 2921 }, { "epoch": 0.6694915254237288, "grad_norm": 0.4406788345603544, "learning_rate": 3.815980629539952e-05, "loss": 0.3487, "loss_nan_ranks": 0, "loss_rank_avg": 0.15205857157707214, "step": 395, "valid_targets_mean": 6784.4, "valid_targets_min": 2346 }, { "epoch": 0.6779661016949152, "grad_norm": 0.4456952077678055, "learning_rate": 3.8644067796610175e-05, "loss": 0.3699, "loss_nan_ranks": 0, "loss_rank_avg": 0.1788387894630432, "step": 400, "valid_targets_mean": 7900.6, "valid_targets_min": 3235 }, { "epoch": 0.6864406779661016, "grad_norm": 0.5523324054394816, "learning_rate": 3.9128329297820825e-05, "loss": 0.3574, "loss_nan_ranks": 0, "loss_rank_avg": 0.13928887248039246, "step": 405, "valid_targets_mean": 5171.9, "valid_targets_min": 3136 }, { "epoch": 0.6949152542372882, "grad_norm": 0.5002722226670426, "learning_rate": 3.961259079903148e-05, "loss": 0.385, "loss_nan_ranks": 0, "loss_rank_avg": 0.1312628537416458, "step": 410, "valid_targets_mean": 6787.4, "valid_targets_min": 3693 }, { "epoch": 0.7033898305084746, "grad_norm": 0.42843480849686666, "learning_rate": 3.9999992856441635e-05, "loss": 0.3493, "loss_nan_ranks": 0, "loss_rank_avg": 0.1744052767753601, "step": 415, "valid_targets_mean": 7211.9, "valid_targets_min": 2393 }, { "epoch": 0.711864406779661, "grad_norm": 0.4679043644147995, "learning_rate": 3.999974283243472e-05, "loss": 0.3639, "loss_nan_ranks": 0, "loss_rank_avg": 0.1082448959350586, "step": 420, "valid_targets_mean": 6552.6, "valid_targets_min": 2437 }, { "epoch": 0.7203389830508474, "grad_norm": 0.47331069467877396, "learning_rate": 3.9999135635612606e-05, "loss": 0.4011, "loss_nan_ranks": 0, "loss_rank_avg": 0.23097260296344757, "step": 425, "valid_targets_mean": 8409.1, "valid_targets_min": 3741 }, { "epoch": 0.7288135593220338, "grad_norm": 0.5135319796540361, "learning_rate": 3.999817127681917e-05, "loss": 0.3778, "loss_nan_ranks": 0, "loss_rank_avg": 0.33611786365509033, "step": 430, "valid_targets_mean": 11845.2, "valid_targets_min": 1936 }, { "epoch": 0.7372881355932204, "grad_norm": 0.5557676245987662, "learning_rate": 3.9996849773276764e-05, "loss": 0.3458, "loss_nan_ranks": 0, "loss_rank_avg": 0.12023050338029861, "step": 435, "valid_targets_mean": 4693.2, "valid_targets_min": 3425 }, { "epoch": 0.7457627118644068, "grad_norm": 0.5410110705579056, "learning_rate": 3.9995171148585944e-05, "loss": 0.3175, "loss_nan_ranks": 0, "loss_rank_avg": 0.16153821349143982, "step": 440, "valid_targets_mean": 6421.5, "valid_targets_min": 3319 }, { "epoch": 0.7542372881355932, "grad_norm": 0.4951775086532844, "learning_rate": 3.999313543272505e-05, "loss": 0.3564, "loss_nan_ranks": 0, "loss_rank_avg": 0.1502537578344345, "step": 445, "valid_targets_mean": 7038.1, "valid_targets_min": 3514 }, { "epoch": 0.7627118644067796, "grad_norm": 0.47906530418320226, "learning_rate": 3.999074266204967e-05, "loss": 0.3263, "loss_nan_ranks": 0, "loss_rank_avg": 0.16620051860809326, "step": 450, "valid_targets_mean": 8577.1, "valid_targets_min": 3324 }, { "epoch": 0.7711864406779662, "grad_norm": 0.5177860251716547, "learning_rate": 3.998799287929199e-05, "loss": 0.3375, "loss_nan_ranks": 0, "loss_rank_avg": 0.20412178337574005, "step": 455, "valid_targets_mean": 7626.9, "valid_targets_min": 1240 }, { "epoch": 0.7796610169491526, "grad_norm": 0.46635973969392164, "learning_rate": 3.998488613356002e-05, "loss": 0.3464, "loss_nan_ranks": 0, "loss_rank_avg": 0.1993708461523056, "step": 460, "valid_targets_mean": 9630.6, "valid_targets_min": 4060 }, { "epoch": 0.788135593220339, "grad_norm": 0.48835104343419244, "learning_rate": 3.998142248033673e-05, "loss": 0.3796, "loss_nan_ranks": 0, "loss_rank_avg": 0.20394505560398102, "step": 465, "valid_targets_mean": 7548.1, "valid_targets_min": 3516 }, { "epoch": 0.7966101694915254, "grad_norm": 0.4557086785487366, "learning_rate": 3.997760198147904e-05, "loss": 0.3486, "loss_nan_ranks": 0, "loss_rank_avg": 0.15721432864665985, "step": 470, "valid_targets_mean": 6833.1, "valid_targets_min": 2772 }, { "epoch": 0.8050847457627118, "grad_norm": 0.4515063413898264, "learning_rate": 3.9973424705216774e-05, "loss": 0.3784, "loss_nan_ranks": 0, "loss_rank_avg": 0.1749514490365982, "step": 475, "valid_targets_mean": 7408.5, "valid_targets_min": 1943 }, { "epoch": 0.8135593220338984, "grad_norm": 0.4428676672373464, "learning_rate": 3.996889072615134e-05, "loss": 0.3258, "loss_nan_ranks": 0, "loss_rank_avg": 0.21249344944953918, "step": 480, "valid_targets_mean": 9819.9, "valid_targets_min": 3010 }, { "epoch": 0.8220338983050848, "grad_norm": 0.49524032365604226, "learning_rate": 3.99640001252545e-05, "loss": 0.375, "loss_nan_ranks": 0, "loss_rank_avg": 0.1323350965976715, "step": 485, "valid_targets_mean": 5834.0, "valid_targets_min": 3776 }, { "epoch": 0.8305084745762712, "grad_norm": 0.47661852289977547, "learning_rate": 3.9958752989866856e-05, "loss": 0.3669, "loss_nan_ranks": 0, "loss_rank_avg": 0.2077844887971878, "step": 490, "valid_targets_mean": 7829.8, "valid_targets_min": 3541 }, { "epoch": 0.8389830508474576, "grad_norm": 0.5368833318390628, "learning_rate": 3.995314941369631e-05, "loss": 0.3385, "loss_nan_ranks": 0, "loss_rank_avg": 0.1979312300682068, "step": 495, "valid_targets_mean": 7753.1, "valid_targets_min": 3245 }, { "epoch": 0.847457627118644, "grad_norm": 0.43413683875323356, "learning_rate": 3.994718949681642e-05, "loss": 0.3241, "loss_nan_ranks": 0, "loss_rank_avg": 0.08601364493370056, "step": 500, "valid_targets_mean": 4876.6, "valid_targets_min": 1373 }, { "epoch": 0.8559322033898306, "grad_norm": 0.45697287254458874, "learning_rate": 3.994087334566455e-05, "loss": 0.3471, "loss_nan_ranks": 0, "loss_rank_avg": 0.1718927025794983, "step": 505, "valid_targets_mean": 7721.6, "valid_targets_min": 4226 }, { "epoch": 0.864406779661017, "grad_norm": 0.47862116333913, "learning_rate": 3.9934201073040035e-05, "loss": 0.3587, "loss_nan_ranks": 0, "loss_rank_avg": 0.1376647651195526, "step": 510, "valid_targets_mean": 7147.1, "valid_targets_min": 4853 }, { "epoch": 0.8728813559322034, "grad_norm": 0.4429781490950345, "learning_rate": 3.992717279810213e-05, "loss": 0.3546, "loss_nan_ranks": 0, "loss_rank_avg": 0.17605769634246826, "step": 515, "valid_targets_mean": 7849.5, "valid_targets_min": 4396 }, { "epoch": 0.8813559322033898, "grad_norm": 0.45127457745702443, "learning_rate": 3.991978864636788e-05, "loss": 0.3421, "loss_nan_ranks": 0, "loss_rank_avg": 0.1218881830573082, "step": 520, "valid_targets_mean": 6575.2, "valid_targets_min": 2730 }, { "epoch": 0.8898305084745762, "grad_norm": 0.4345536633734186, "learning_rate": 3.9912048749709896e-05, "loss": 0.3497, "loss_nan_ranks": 0, "loss_rank_avg": 0.1432826966047287, "step": 525, "valid_targets_mean": 8336.4, "valid_targets_min": 3085 }, { "epoch": 0.8983050847457628, "grad_norm": 0.4843526513333187, "learning_rate": 3.990395324635399e-05, "loss": 0.3294, "loss_nan_ranks": 0, "loss_rank_avg": 0.18618427217006683, "step": 530, "valid_targets_mean": 8355.0, "valid_targets_min": 4107 }, { "epoch": 0.9067796610169492, "grad_norm": 0.44356795524997744, "learning_rate": 3.989550228087671e-05, "loss": 0.3497, "loss_nan_ranks": 0, "loss_rank_avg": 0.1626293659210205, "step": 535, "valid_targets_mean": 7243.9, "valid_targets_min": 2909 }, { "epoch": 0.9152542372881356, "grad_norm": 0.41561791071560467, "learning_rate": 3.988669600420275e-05, "loss": 0.3201, "loss_nan_ranks": 0, "loss_rank_avg": 0.1661594808101654, "step": 540, "valid_targets_mean": 9455.1, "valid_targets_min": 4298 }, { "epoch": 0.923728813559322, "grad_norm": 0.4358520648605049, "learning_rate": 3.9877534573602254e-05, "loss": 0.3617, "loss_nan_ranks": 0, "loss_rank_avg": 0.27095770835876465, "step": 545, "valid_targets_mean": 8973.9, "valid_targets_min": 2827 }, { "epoch": 0.9322033898305084, "grad_norm": 0.4813894750533826, "learning_rate": 3.9868018152688044e-05, "loss": 0.3558, "loss_nan_ranks": 0, "loss_rank_avg": 0.17274773120880127, "step": 550, "valid_targets_mean": 7341.4, "valid_targets_min": 1721 }, { "epoch": 0.940677966101695, "grad_norm": 0.46263973848113316, "learning_rate": 3.985814691141263e-05, "loss": 0.3598, "loss_nan_ranks": 0, "loss_rank_avg": 0.2267192006111145, "step": 555, "valid_targets_mean": 9122.1, "valid_targets_min": 3336 }, { "epoch": 0.9491525423728814, "grad_norm": 0.46520816240799234, "learning_rate": 3.984792102606524e-05, "loss": 0.3821, "loss_nan_ranks": 0, "loss_rank_avg": 0.11244647204875946, "step": 560, "valid_targets_mean": 6185.9, "valid_targets_min": 2997 }, { "epoch": 0.9576271186440678, "grad_norm": 0.5072756278635104, "learning_rate": 3.9837340679268634e-05, "loss": 0.315, "loss_nan_ranks": 0, "loss_rank_avg": 0.11192071437835693, "step": 565, "valid_targets_mean": 6087.0, "valid_targets_min": 3094 }, { "epoch": 0.9661016949152542, "grad_norm": 0.4165557159597932, "learning_rate": 3.982640605997585e-05, "loss": 0.329, "loss_nan_ranks": 0, "loss_rank_avg": 0.14271879196166992, "step": 570, "valid_targets_mean": 7421.4, "valid_targets_min": 3182 }, { "epoch": 0.9745762711864406, "grad_norm": 0.4465966835957301, "learning_rate": 3.981511736346684e-05, "loss": 0.3512, "loss_nan_ranks": 0, "loss_rank_avg": 0.1899096965789795, "step": 575, "valid_targets_mean": 8330.2, "valid_targets_min": 3990 }, { "epoch": 0.9830508474576272, "grad_norm": 0.47188153745533346, "learning_rate": 3.980347479134498e-05, "loss": 0.3326, "loss_nan_ranks": 0, "loss_rank_avg": 0.16237373650074005, "step": 580, "valid_targets_mean": 7614.1, "valid_targets_min": 3425 }, { "epoch": 0.9915254237288136, "grad_norm": 0.45659300690082466, "learning_rate": 3.9791478551533435e-05, "loss": 0.3241, "loss_nan_ranks": 0, "loss_rank_avg": 0.1724914014339447, "step": 585, "valid_targets_mean": 7735.9, "valid_targets_min": 3159 }, { "epoch": 1.0, "grad_norm": 0.4731948101985973, "learning_rate": 3.977912885827151e-05, "loss": 0.342, "loss_nan_ranks": 0, "loss_rank_avg": 0.1396312415599823, "step": 590, "valid_targets_mean": 6537.0, "valid_targets_min": 2991 }, { "epoch": 1.0084745762711864, "grad_norm": 0.4627342217897108, "learning_rate": 3.976642593211079e-05, "loss": 0.3613, "loss_nan_ranks": 0, "loss_rank_avg": 0.24919381737709045, "step": 595, "valid_targets_mean": 10379.8, "valid_targets_min": 3903 }, { "epoch": 1.0169491525423728, "grad_norm": 0.4536741195006425, "learning_rate": 3.9753369999911166e-05, "loss": 0.3309, "loss_nan_ranks": 0, "loss_rank_avg": 0.15797701478004456, "step": 600, "valid_targets_mean": 7904.0, "valid_targets_min": 3709 }, { "epoch": 1.0254237288135593, "grad_norm": 0.4589851155496452, "learning_rate": 3.973996129483684e-05, "loss": 0.3171, "loss_nan_ranks": 0, "loss_rank_avg": 0.10587269067764282, "step": 605, "valid_targets_mean": 7432.1, "valid_targets_min": 2532 }, { "epoch": 1.0338983050847457, "grad_norm": 0.47318377384255594, "learning_rate": 3.972620005635216e-05, "loss": 0.2935, "loss_nan_ranks": 0, "loss_rank_avg": 0.1729205846786499, "step": 610, "valid_targets_mean": 7595.9, "valid_targets_min": 2825 }, { "epoch": 1.042372881355932, "grad_norm": 0.4469128531341844, "learning_rate": 3.971208653021727e-05, "loss": 0.3171, "loss_nan_ranks": 0, "loss_rank_avg": 0.20472905039787292, "step": 615, "valid_targets_mean": 8200.1, "valid_targets_min": 2509 }, { "epoch": 1.0508474576271187, "grad_norm": 0.4833955669012435, "learning_rate": 3.969762096848383e-05, "loss": 0.3673, "loss_nan_ranks": 0, "loss_rank_avg": 0.15367567539215088, "step": 620, "valid_targets_mean": 7303.2, "valid_targets_min": 712 }, { "epoch": 1.0593220338983051, "grad_norm": 0.4180140372553057, "learning_rate": 3.968280362949042e-05, "loss": 0.329, "loss_nan_ranks": 0, "loss_rank_avg": 0.20632800459861755, "step": 625, "valid_targets_mean": 9386.4, "valid_targets_min": 4698 }, { "epoch": 1.0677966101694916, "grad_norm": 0.40174569986041325, "learning_rate": 3.9667634777857975e-05, "loss": 0.3588, "loss_nan_ranks": 0, "loss_rank_avg": 0.14220260083675385, "step": 630, "valid_targets_mean": 8459.8, "valid_targets_min": 3319 }, { "epoch": 1.076271186440678, "grad_norm": 0.44484170138321344, "learning_rate": 3.965211468448505e-05, "loss": 0.3388, "loss_nan_ranks": 0, "loss_rank_avg": 0.14559875428676605, "step": 635, "valid_targets_mean": 7179.8, "valid_targets_min": 3830 }, { "epoch": 1.0847457627118644, "grad_norm": 0.4395541639351123, "learning_rate": 3.963624362654299e-05, "loss": 0.3324, "loss_nan_ranks": 0, "loss_rank_avg": 0.13254770636558533, "step": 640, "valid_targets_mean": 7157.9, "valid_targets_min": 1936 }, { "epoch": 1.0932203389830508, "grad_norm": 0.4654264001987176, "learning_rate": 3.962002188747096e-05, "loss": 0.3234, "loss_nan_ranks": 0, "loss_rank_avg": 0.28930819034576416, "step": 645, "valid_targets_mean": 10538.6, "valid_targets_min": 2967 }, { "epoch": 1.1016949152542372, "grad_norm": 0.40719297523344944, "learning_rate": 3.9603449756970877e-05, "loss": 0.3219, "loss_nan_ranks": 0, "loss_rank_avg": 0.09647984802722931, "step": 650, "valid_targets_mean": 6410.5, "valid_targets_min": 2114 }, { "epoch": 1.1101694915254237, "grad_norm": 0.6812110649265294, "learning_rate": 3.95865275310023e-05, "loss": 0.3275, "loss_nan_ranks": 0, "loss_rank_avg": 0.09337997436523438, "step": 655, "valid_targets_mean": 4987.0, "valid_targets_min": 2152 }, { "epoch": 1.11864406779661, "grad_norm": 0.4778768969090781, "learning_rate": 3.9569255511777054e-05, "loss": 0.3253, "loss_nan_ranks": 0, "loss_rank_avg": 0.1386423110961914, "step": 660, "valid_targets_mean": 6117.6, "valid_targets_min": 2957 }, { "epoch": 1.1271186440677967, "grad_norm": 0.4193417013796084, "learning_rate": 3.955163400775389e-05, "loss": 0.361, "loss_nan_ranks": 0, "loss_rank_avg": 0.12261968106031418, "step": 665, "valid_targets_mean": 6347.0, "valid_targets_min": 3535 }, { "epoch": 1.1355932203389831, "grad_norm": 0.5013613951602334, "learning_rate": 3.953366333363297e-05, "loss": 0.3222, "loss_nan_ranks": 0, "loss_rank_avg": 0.12408879399299622, "step": 670, "valid_targets_mean": 6869.2, "valid_targets_min": 1409 }, { "epoch": 1.1440677966101696, "grad_norm": 0.4160706590681276, "learning_rate": 3.9515343810350236e-05, "loss": 0.3091, "loss_nan_ranks": 0, "loss_rank_avg": 0.2585446834564209, "step": 675, "valid_targets_mean": 11118.4, "valid_targets_min": 2837 }, { "epoch": 1.152542372881356, "grad_norm": 0.48357167974115245, "learning_rate": 3.949667576507168e-05, "loss": 0.3338, "loss_nan_ranks": 0, "loss_rank_avg": 0.2446514070034027, "step": 680, "valid_targets_mean": 7852.5, "valid_targets_min": 2865 }, { "epoch": 1.1610169491525424, "grad_norm": 0.5207580063819728, "learning_rate": 3.9477659531187484e-05, "loss": 0.3305, "loss_nan_ranks": 0, "loss_rank_avg": 0.2768232822418213, "step": 685, "valid_targets_mean": 9521.2, "valid_targets_min": 1901 }, { "epoch": 1.1694915254237288, "grad_norm": 0.4352619530283247, "learning_rate": 3.9458295448306134e-05, "loss": 0.3273, "loss_nan_ranks": 0, "loss_rank_avg": 0.169637992978096, "step": 690, "valid_targets_mean": 8180.2, "valid_targets_min": 3197 }, { "epoch": 1.1779661016949152, "grad_norm": 0.6375401638430952, "learning_rate": 3.943858386224825e-05, "loss": 0.3542, "loss_nan_ranks": 0, "loss_rank_avg": 0.20666490495204926, "step": 695, "valid_targets_mean": 7918.8, "valid_targets_min": 2972 }, { "epoch": 1.1864406779661016, "grad_norm": 0.5237074435643403, "learning_rate": 3.941852512504052e-05, "loss": 0.3069, "loss_nan_ranks": 0, "loss_rank_avg": 0.16815276443958282, "step": 700, "valid_targets_mean": 8423.9, "valid_targets_min": 3467 }, { "epoch": 1.194915254237288, "grad_norm": 0.46230638915825684, "learning_rate": 3.939811959490931e-05, "loss": 0.3183, "loss_nan_ranks": 0, "loss_rank_avg": 0.22283053398132324, "step": 705, "valid_targets_mean": 11047.0, "valid_targets_min": 4423 }, { "epoch": 1.2033898305084745, "grad_norm": 0.4545188486641544, "learning_rate": 3.937736763627435e-05, "loss": 0.3157, "loss_nan_ranks": 0, "loss_rank_avg": 0.19005794823169708, "step": 710, "valid_targets_mean": 8591.1, "valid_targets_min": 3981 }, { "epoch": 1.211864406779661, "grad_norm": 0.4552644672198827, "learning_rate": 3.935626961974217e-05, "loss": 0.3603, "loss_nan_ranks": 0, "loss_rank_avg": 0.14236797392368317, "step": 715, "valid_targets_mean": 6977.0, "valid_targets_min": 3031 }, { "epoch": 1.2203389830508475, "grad_norm": 0.46886754247998963, "learning_rate": 3.933482592209951e-05, "loss": 0.3314, "loss_nan_ranks": 0, "loss_rank_avg": 0.26897650957107544, "step": 720, "valid_targets_mean": 9310.5, "valid_targets_min": 3393 }, { "epoch": 1.228813559322034, "grad_norm": 0.48772266789453395, "learning_rate": 3.931303692630661e-05, "loss": 0.3101, "loss_nan_ranks": 0, "loss_rank_avg": 0.16506057977676392, "step": 725, "valid_targets_mean": 7079.0, "valid_targets_min": 2432 }, { "epoch": 1.2372881355932204, "grad_norm": 0.42871408585096393, "learning_rate": 3.92909030214903e-05, "loss": 0.3268, "loss_nan_ranks": 0, "loss_rank_avg": 0.11513777822256088, "step": 730, "valid_targets_mean": 6985.9, "valid_targets_min": 3986 }, { "epoch": 1.2457627118644068, "grad_norm": 0.44587055811958604, "learning_rate": 3.9268424602937124e-05, "loss": 0.3199, "loss_nan_ranks": 0, "loss_rank_avg": 0.17389066517353058, "step": 735, "valid_targets_mean": 8847.4, "valid_targets_min": 2642 }, { "epoch": 1.2542372881355932, "grad_norm": 0.47861212973477374, "learning_rate": 3.9245602072086246e-05, "loss": 0.3732, "loss_nan_ranks": 0, "loss_rank_avg": 0.10631030052900314, "step": 740, "valid_targets_mean": 5761.5, "valid_targets_min": 4648 }, { "epoch": 1.2627118644067796, "grad_norm": 0.49947791123701396, "learning_rate": 3.9222435836522286e-05, "loss": 0.3373, "loss_nan_ranks": 0, "loss_rank_avg": 0.1645757257938385, "step": 745, "valid_targets_mean": 9582.9, "valid_targets_min": 1652 }, { "epoch": 1.271186440677966, "grad_norm": 0.42913688486951385, "learning_rate": 3.919892630996804e-05, "loss": 0.3352, "loss_nan_ranks": 0, "loss_rank_avg": 0.14238014817237854, "step": 750, "valid_targets_mean": 6065.2, "valid_targets_min": 2457 }, { "epoch": 1.2796610169491525, "grad_norm": 0.4255980165569159, "learning_rate": 3.9175073912277107e-05, "loss": 0.305, "loss_nan_ranks": 0, "loss_rank_avg": 0.11966271698474884, "step": 755, "valid_targets_mean": 6778.5, "valid_targets_min": 3511 }, { "epoch": 1.288135593220339, "grad_norm": 0.4383294865094197, "learning_rate": 3.915087906942635e-05, "loss": 0.3196, "loss_nan_ranks": 0, "loss_rank_avg": 0.18853090703487396, "step": 760, "valid_targets_mean": 7773.5, "valid_targets_min": 2965 }, { "epoch": 1.2966101694915255, "grad_norm": 0.42624494152006837, "learning_rate": 3.912634221350834e-05, "loss": 0.3482, "loss_nan_ranks": 0, "loss_rank_avg": 0.20799216628074646, "step": 765, "valid_targets_mean": 10677.5, "valid_targets_min": 2482 }, { "epoch": 1.305084745762712, "grad_norm": 0.4740167806151876, "learning_rate": 3.910146378272361e-05, "loss": 0.316, "loss_nan_ranks": 0, "loss_rank_avg": 0.1015789806842804, "step": 770, "valid_targets_mean": 5372.8, "valid_targets_min": 2801 }, { "epoch": 1.3135593220338984, "grad_norm": 0.5006756358318566, "learning_rate": 3.9076244221372824e-05, "loss": 0.321, "loss_nan_ranks": 0, "loss_rank_avg": 0.1526796519756317, "step": 775, "valid_targets_mean": 6574.1, "valid_targets_min": 2460 }, { "epoch": 1.3220338983050848, "grad_norm": 0.4267845459550884, "learning_rate": 3.905068397984886e-05, "loss": 0.3168, "loss_nan_ranks": 0, "loss_rank_avg": 0.16761890053749084, "step": 780, "valid_targets_mean": 8788.9, "valid_targets_min": 4154 }, { "epoch": 1.3305084745762712, "grad_norm": 0.41392713104247275, "learning_rate": 3.9024783514628765e-05, "loss": 0.3568, "loss_nan_ranks": 0, "loss_rank_avg": 0.17586758732795715, "step": 785, "valid_targets_mean": 10475.6, "valid_targets_min": 3622 }, { "epoch": 1.3389830508474576, "grad_norm": 0.5337105064121502, "learning_rate": 3.899854328826559e-05, "loss": 0.3425, "loss_nan_ranks": 0, "loss_rank_avg": 0.0900270864367485, "step": 790, "valid_targets_mean": 4031.1, "valid_targets_min": 1420 }, { "epoch": 1.347457627118644, "grad_norm": 0.4488578510290259, "learning_rate": 3.897196376938013e-05, "loss": 0.318, "loss_nan_ranks": 0, "loss_rank_avg": 0.17309337854385376, "step": 795, "valid_targets_mean": 6397.8, "valid_targets_min": 2425 }, { "epoch": 1.3559322033898304, "grad_norm": 0.39620489867483555, "learning_rate": 3.8945045432652575e-05, "loss": 0.3404, "loss_nan_ranks": 0, "loss_rank_avg": 0.08745632320642471, "step": 800, "valid_targets_mean": 6055.2, "valid_targets_min": 3550 }, { "epoch": 1.3644067796610169, "grad_norm": 0.42992870791787763, "learning_rate": 3.8917788758814e-05, "loss": 0.3174, "loss_nan_ranks": 0, "loss_rank_avg": 0.13015861809253693, "step": 805, "valid_targets_mean": 7460.4, "valid_targets_min": 3055 }, { "epoch": 1.3728813559322033, "grad_norm": 0.40354106059339273, "learning_rate": 3.889019423463783e-05, "loss": 0.3149, "loss_nan_ranks": 0, "loss_rank_avg": 0.09485109150409698, "step": 810, "valid_targets_mean": 6865.6, "valid_targets_min": 2911 }, { "epoch": 1.3813559322033897, "grad_norm": 0.4686368291789137, "learning_rate": 3.8862262352931075e-05, "loss": 0.3294, "loss_nan_ranks": 0, "loss_rank_avg": 0.1537308543920517, "step": 815, "valid_targets_mean": 6440.1, "valid_targets_min": 2110 }, { "epoch": 1.3898305084745763, "grad_norm": 0.4408642589858194, "learning_rate": 3.88339936125256e-05, "loss": 0.3157, "loss_nan_ranks": 0, "loss_rank_avg": 0.17375317215919495, "step": 820, "valid_targets_mean": 8280.6, "valid_targets_min": 2743 }, { "epoch": 1.3983050847457628, "grad_norm": 0.46062681778063724, "learning_rate": 3.8805388518269184e-05, "loss": 0.2962, "loss_nan_ranks": 0, "loss_rank_avg": 0.17423167824745178, "step": 825, "valid_targets_mean": 8636.1, "valid_targets_min": 4169 }, { "epoch": 1.4067796610169492, "grad_norm": 0.4486860590784266, "learning_rate": 3.877644758101648e-05, "loss": 0.3156, "loss_nan_ranks": 0, "loss_rank_avg": 0.17933771014213562, "step": 830, "valid_targets_mean": 8570.9, "valid_targets_min": 1893 }, { "epoch": 1.4152542372881356, "grad_norm": 0.4719151934288519, "learning_rate": 3.8747171317619955e-05, "loss": 0.3143, "loss_nan_ranks": 0, "loss_rank_avg": 0.09397554397583008, "step": 835, "valid_targets_mean": 5133.0, "valid_targets_min": 2254 }, { "epoch": 1.423728813559322, "grad_norm": 0.4667473106135975, "learning_rate": 3.871756025092059e-05, "loss": 0.3479, "loss_nan_ranks": 0, "loss_rank_avg": 0.1407933086156845, "step": 840, "valid_targets_mean": 6628.8, "valid_targets_min": 2795 }, { "epoch": 1.4322033898305084, "grad_norm": 0.4412306378722383, "learning_rate": 3.868761490973859e-05, "loss": 0.307, "loss_nan_ranks": 0, "loss_rank_avg": 0.1313735395669937, "step": 845, "valid_targets_mean": 6751.1, "valid_targets_min": 3064 }, { "epoch": 1.4406779661016949, "grad_norm": 0.43177538465939785, "learning_rate": 3.8657335828863924e-05, "loss": 0.3316, "loss_nan_ranks": 0, "loss_rank_avg": 0.1634959578514099, "step": 850, "valid_targets_mean": 7480.4, "valid_targets_min": 3151 }, { "epoch": 1.4491525423728815, "grad_norm": 0.43807884753609994, "learning_rate": 3.8626723549046774e-05, "loss": 0.3268, "loss_nan_ranks": 0, "loss_rank_avg": 0.12339450418949127, "step": 855, "valid_targets_mean": 6659.2, "valid_targets_min": 2840 }, { "epoch": 1.457627118644068, "grad_norm": 0.4727987965750298, "learning_rate": 3.859577861698787e-05, "loss": 0.2922, "loss_nan_ranks": 0, "loss_rank_avg": 0.15785086154937744, "step": 860, "valid_targets_mean": 7509.2, "valid_targets_min": 3028 }, { "epoch": 1.4661016949152543, "grad_norm": 0.4384303554477187, "learning_rate": 3.856450158532875e-05, "loss": 0.323, "loss_nan_ranks": 0, "loss_rank_avg": 0.1519169807434082, "step": 865, "valid_targets_mean": 7232.5, "valid_targets_min": 3849 }, { "epoch": 1.4745762711864407, "grad_norm": 0.49727270409272106, "learning_rate": 3.853289301264187e-05, "loss": 0.3358, "loss_nan_ranks": 0, "loss_rank_avg": 0.1139516681432724, "step": 870, "valid_targets_mean": 6231.1, "valid_targets_min": 1612 }, { "epoch": 1.4830508474576272, "grad_norm": 0.4426633905595123, "learning_rate": 3.850095346342064e-05, "loss": 0.3273, "loss_nan_ranks": 0, "loss_rank_avg": 0.16769997775554657, "step": 875, "valid_targets_mean": 7338.5, "valid_targets_min": 3859 }, { "epoch": 1.4915254237288136, "grad_norm": 0.4593726038548315, "learning_rate": 3.84686835080693e-05, "loss": 0.3099, "loss_nan_ranks": 0, "loss_rank_avg": 0.11144979298114777, "step": 880, "valid_targets_mean": 6119.1, "valid_targets_min": 3785 }, { "epoch": 1.5, "grad_norm": 0.49604203241194217, "learning_rate": 3.843608372289283e-05, "loss": 0.3271, "loss_nan_ranks": 0, "loss_rank_avg": 0.15156549215316772, "step": 885, "valid_targets_mean": 7399.4, "valid_targets_min": 3299 }, { "epoch": 1.5084745762711864, "grad_norm": 0.545080093883971, "learning_rate": 3.8403154690086564e-05, "loss": 0.3361, "loss_nan_ranks": 0, "loss_rank_avg": 0.12989340722560883, "step": 890, "valid_targets_mean": 7236.0, "valid_targets_min": 3225 }, { "epoch": 1.5169491525423728, "grad_norm": 0.45075511600659357, "learning_rate": 3.836989699772582e-05, "loss": 0.3229, "loss_nan_ranks": 0, "loss_rank_avg": 0.1870659589767456, "step": 895, "valid_targets_mean": 7038.4, "valid_targets_min": 2187 }, { "epoch": 1.5254237288135593, "grad_norm": 0.47217639934643396, "learning_rate": 3.8336311239755424e-05, "loss": 0.3622, "loss_nan_ranks": 0, "loss_rank_avg": 0.15166038274765015, "step": 900, "valid_targets_mean": 7118.4, "valid_targets_min": 2202 }, { "epoch": 1.5338983050847457, "grad_norm": 0.41709638199225046, "learning_rate": 3.830239801597907e-05, "loss": 0.3125, "loss_nan_ranks": 0, "loss_rank_avg": 0.14974796772003174, "step": 905, "valid_targets_mean": 7620.0, "valid_targets_min": 2350 }, { "epoch": 1.542372881355932, "grad_norm": 0.41637607079903677, "learning_rate": 3.826815793204863e-05, "loss": 0.3013, "loss_nan_ranks": 0, "loss_rank_avg": 0.1806432008743286, "step": 910, "valid_targets_mean": 9408.8, "valid_targets_min": 4175 }, { "epoch": 1.5508474576271185, "grad_norm": 0.5361115971794117, "learning_rate": 3.823359159945332e-05, "loss": 0.3193, "loss_nan_ranks": 0, "loss_rank_avg": 0.1987413465976715, "step": 915, "valid_targets_mean": 8330.9, "valid_targets_min": 3259 }, { "epoch": 1.559322033898305, "grad_norm": 0.44132736535406036, "learning_rate": 3.8198699635508805e-05, "loss": 0.2982, "loss_nan_ranks": 0, "loss_rank_avg": 0.18994596600532532, "step": 920, "valid_targets_mean": 9074.9, "valid_targets_min": 3436 }, { "epoch": 1.5677966101694916, "grad_norm": 0.3816717467254405, "learning_rate": 3.816348266334614e-05, "loss": 0.319, "loss_nan_ranks": 0, "loss_rank_avg": 0.12687310576438904, "step": 925, "valid_targets_mean": 8785.6, "valid_targets_min": 4974 }, { "epoch": 1.576271186440678, "grad_norm": 0.4412025073597514, "learning_rate": 3.812794131190066e-05, "loss": 0.3306, "loss_nan_ranks": 0, "loss_rank_avg": 0.13384410738945007, "step": 930, "valid_targets_mean": 7849.2, "valid_targets_min": 3985 }, { "epoch": 1.5847457627118644, "grad_norm": 0.396693457802134, "learning_rate": 3.8092076215900765e-05, "loss": 0.303, "loss_nan_ranks": 0, "loss_rank_avg": 0.20873287320137024, "step": 935, "valid_targets_mean": 11243.4, "valid_targets_min": 5339 }, { "epoch": 1.5932203389830508, "grad_norm": 0.4285610045500551, "learning_rate": 3.805588801585654e-05, "loss": 0.3188, "loss_nan_ranks": 0, "loss_rank_avg": 0.08912678807973862, "step": 940, "valid_targets_mean": 4676.0, "valid_targets_min": 2847 }, { "epoch": 1.6016949152542372, "grad_norm": 0.41295836604849834, "learning_rate": 3.801937735804838e-05, "loss": 0.3439, "loss_nan_ranks": 0, "loss_rank_avg": 0.17002055048942566, "step": 945, "valid_targets_mean": 8253.2, "valid_targets_min": 2292 }, { "epoch": 1.6101694915254239, "grad_norm": 0.4110467780511449, "learning_rate": 3.798254489451539e-05, "loss": 0.3218, "loss_nan_ranks": 0, "loss_rank_avg": 0.26079848408699036, "step": 950, "valid_targets_mean": 11661.2, "valid_targets_min": 2093 }, { "epoch": 1.6186440677966103, "grad_norm": 0.5284185078380007, "learning_rate": 3.794539128304374e-05, "loss": 0.3327, "loss_nan_ranks": 0, "loss_rank_avg": 0.21993231773376465, "step": 955, "valid_targets_mean": 10140.0, "valid_targets_min": 4917 }, { "epoch": 1.6271186440677967, "grad_norm": 0.43465978137133837, "learning_rate": 3.790791718715498e-05, "loss": 0.3362, "loss_nan_ranks": 0, "loss_rank_avg": 0.16745583713054657, "step": 960, "valid_targets_mean": 7656.5, "valid_targets_min": 2997 }, { "epoch": 1.6355932203389831, "grad_norm": 0.46353679599089426, "learning_rate": 3.7870123276094134e-05, "loss": 0.3063, "loss_nan_ranks": 0, "loss_rank_avg": 0.14307042956352234, "step": 965, "valid_targets_mean": 6720.0, "valid_targets_min": 2036 }, { "epoch": 1.6440677966101696, "grad_norm": 0.42508115955425385, "learning_rate": 3.783201022481775e-05, "loss": 0.307, "loss_nan_ranks": 0, "loss_rank_avg": 0.16600486636161804, "step": 970, "valid_targets_mean": 7660.0, "valid_targets_min": 4016 }, { "epoch": 1.652542372881356, "grad_norm": 0.47460145753384014, "learning_rate": 3.7793578713981876e-05, "loss": 0.2713, "loss_nan_ranks": 0, "loss_rank_avg": 0.17931526899337769, "step": 975, "valid_targets_mean": 7207.9, "valid_targets_min": 2066 }, { "epoch": 1.6610169491525424, "grad_norm": 0.4565761001462879, "learning_rate": 3.775482942992989e-05, "loss": 0.296, "loss_nan_ranks": 0, "loss_rank_avg": 0.10052239894866943, "step": 980, "valid_targets_mean": 5350.4, "valid_targets_min": 3691 }, { "epoch": 1.6694915254237288, "grad_norm": 0.404024020976862, "learning_rate": 3.771576306468022e-05, "loss": 0.331, "loss_nan_ranks": 0, "loss_rank_avg": 0.13798417150974274, "step": 985, "valid_targets_mean": 8586.6, "valid_targets_min": 2541 }, { "epoch": 1.6779661016949152, "grad_norm": 0.46889190610408676, "learning_rate": 3.7676380315914025e-05, "loss": 0.3316, "loss_nan_ranks": 0, "loss_rank_avg": 0.09154243022203445, "step": 990, "valid_targets_mean": 5740.6, "valid_targets_min": 1962 }, { "epoch": 1.6864406779661016, "grad_norm": 0.4064487350790923, "learning_rate": 3.7636681886962724e-05, "loss": 0.3665, "loss_nan_ranks": 0, "loss_rank_avg": 0.15788796544075012, "step": 995, "valid_targets_mean": 7709.4, "valid_targets_min": 2560 }, { "epoch": 1.694915254237288, "grad_norm": 0.7897794567174825, "learning_rate": 3.759666848679539e-05, "loss": 0.304, "loss_nan_ranks": 0, "loss_rank_avg": 0.15532286465168, "step": 1000, "valid_targets_mean": 9089.0, "valid_targets_min": 5046 }, { "epoch": 1.7033898305084745, "grad_norm": 0.6035847206124464, "learning_rate": 3.755634083000617e-05, "loss": 0.3292, "loss_nan_ranks": 0, "loss_rank_avg": 0.1320587694644928, "step": 1005, "valid_targets_mean": 6896.9, "valid_targets_min": 2965 }, { "epoch": 1.711864406779661, "grad_norm": 0.41483149367263833, "learning_rate": 3.751569963680146e-05, "loss": 0.2949, "loss_nan_ranks": 0, "loss_rank_avg": 0.20763173699378967, "step": 1010, "valid_targets_mean": 9600.8, "valid_targets_min": 5071 }, { "epoch": 1.7203389830508473, "grad_norm": 0.45501656641530847, "learning_rate": 3.747474563298705e-05, "loss": 0.3288, "loss_nan_ranks": 0, "loss_rank_avg": 0.13265684247016907, "step": 1015, "valid_targets_mean": 6442.4, "valid_targets_min": 1875 }, { "epoch": 1.7288135593220337, "grad_norm": 0.5257033113939008, "learning_rate": 3.743347954995519e-05, "loss": 0.3268, "loss_nan_ranks": 0, "loss_rank_avg": 0.13818372786045074, "step": 1020, "valid_targets_mean": 6209.2, "valid_targets_min": 3843 }, { "epoch": 1.7372881355932204, "grad_norm": 0.4383597245709914, "learning_rate": 3.7391902124671516e-05, "loss": 0.3244, "loss_nan_ranks": 0, "loss_rank_avg": 0.19095399975776672, "step": 1025, "valid_targets_mean": 8865.8, "valid_targets_min": 3685 }, { "epoch": 1.7457627118644068, "grad_norm": 0.39724550405667364, "learning_rate": 3.7350014099661874e-05, "loss": 0.3066, "loss_nan_ranks": 0, "loss_rank_avg": 0.20521703362464905, "step": 1030, "valid_targets_mean": 9690.9, "valid_targets_min": 3548 }, { "epoch": 1.7542372881355932, "grad_norm": 0.39927522299758583, "learning_rate": 3.730781622299907e-05, "loss": 0.3211, "loss_nan_ranks": 0, "loss_rank_avg": 0.17346695065498352, "step": 1035, "valid_targets_mean": 8075.1, "valid_targets_min": 3805 }, { "epoch": 1.7627118644067796, "grad_norm": 0.4350255084725687, "learning_rate": 3.7265309248289516e-05, "loss": 0.3455, "loss_nan_ranks": 0, "loss_rank_avg": 0.16887761652469635, "step": 1040, "valid_targets_mean": 7783.6, "valid_targets_min": 3913 }, { "epoch": 1.7711864406779663, "grad_norm": 0.421663580685689, "learning_rate": 3.7222493934659765e-05, "loss": 0.3466, "loss_nan_ranks": 0, "loss_rank_avg": 0.1530277132987976, "step": 1045, "valid_targets_mean": 9355.5, "valid_targets_min": 4980 }, { "epoch": 1.7796610169491527, "grad_norm": 0.4369588066271297, "learning_rate": 3.717937104674296e-05, "loss": 0.2978, "loss_nan_ranks": 0, "loss_rank_avg": 0.13133104145526886, "step": 1050, "valid_targets_mean": 7752.2, "valid_targets_min": 4407 }, { "epoch": 1.788135593220339, "grad_norm": 0.4368294132363595, "learning_rate": 3.713594135466515e-05, "loss": 0.3225, "loss_nan_ranks": 0, "loss_rank_avg": 0.17027533054351807, "step": 1055, "valid_targets_mean": 8704.5, "valid_targets_min": 2855 }, { "epoch": 1.7966101694915255, "grad_norm": 0.43449669149693804, "learning_rate": 3.7092205634031595e-05, "loss": 0.3478, "loss_nan_ranks": 0, "loss_rank_avg": 0.08701007068157196, "step": 1060, "valid_targets_mean": 4998.2, "valid_targets_min": 2374 }, { "epoch": 1.805084745762712, "grad_norm": 0.39372753859603943, "learning_rate": 3.704816466591286e-05, "loss": 0.3163, "loss_nan_ranks": 0, "loss_rank_avg": 0.12855243682861328, "step": 1065, "valid_targets_mean": 7622.5, "valid_targets_min": 4093 }, { "epoch": 1.8135593220338984, "grad_norm": 0.3964647607911203, "learning_rate": 3.700381923683087e-05, "loss": 0.3364, "loss_nan_ranks": 0, "loss_rank_avg": 0.1131635457277298, "step": 1070, "valid_targets_mean": 7209.1, "valid_targets_min": 2797 }, { "epoch": 1.8220338983050848, "grad_norm": 0.4159371295645834, "learning_rate": 3.695917013874491e-05, "loss": 0.2832, "loss_nan_ranks": 0, "loss_rank_avg": 0.13864587247371674, "step": 1075, "valid_targets_mean": 7083.8, "valid_targets_min": 3551 }, { "epoch": 1.8305084745762712, "grad_norm": 0.41132981890721415, "learning_rate": 3.691421816903744e-05, "loss": 0.3373, "loss_nan_ranks": 0, "loss_rank_avg": 0.20368866622447968, "step": 1080, "valid_targets_mean": 8503.0, "valid_targets_min": 1795 }, { "epoch": 1.8389830508474576, "grad_norm": 0.43908713798714083, "learning_rate": 3.686896413049985e-05, "loss": 0.2886, "loss_nan_ranks": 0, "loss_rank_avg": 0.12140090763568878, "step": 1085, "valid_targets_mean": 6773.4, "valid_targets_min": 3364 }, { "epoch": 1.847457627118644, "grad_norm": 0.4338791941921327, "learning_rate": 3.6823408831318154e-05, "loss": 0.3105, "loss_nan_ranks": 0, "loss_rank_avg": 0.16254982352256775, "step": 1090, "valid_targets_mean": 7966.9, "valid_targets_min": 2532 }, { "epoch": 1.8559322033898304, "grad_norm": 0.41721828273489936, "learning_rate": 3.677755308505854e-05, "loss": 0.3423, "loss_nan_ranks": 0, "loss_rank_avg": 0.1637614667415619, "step": 1095, "valid_targets_mean": 7360.9, "valid_targets_min": 3864 }, { "epoch": 1.8644067796610169, "grad_norm": 0.4152523100279547, "learning_rate": 3.673139771065282e-05, "loss": 0.3229, "loss_nan_ranks": 0, "loss_rank_avg": 0.11550319194793701, "step": 1100, "valid_targets_mean": 6838.5, "valid_targets_min": 3869 }, { "epoch": 1.8728813559322033, "grad_norm": 0.37899639866690693, "learning_rate": 3.6684943532383866e-05, "loss": 0.3448, "loss_nan_ranks": 0, "loss_rank_avg": 0.18879902362823486, "step": 1105, "valid_targets_mean": 10441.6, "valid_targets_min": 3589 }, { "epoch": 1.8813559322033897, "grad_norm": 0.40369311396663893, "learning_rate": 3.663819137987081e-05, "loss": 0.3342, "loss_nan_ranks": 0, "loss_rank_avg": 0.16418354213237762, "step": 1110, "valid_targets_mean": 9130.6, "valid_targets_min": 6228 }, { "epoch": 1.8898305084745761, "grad_norm": 0.4216701104223837, "learning_rate": 3.65911420880543e-05, "loss": 0.3106, "loss_nan_ranks": 0, "loss_rank_avg": 0.2091543972492218, "step": 1115, "valid_targets_mean": 8209.8, "valid_targets_min": 3449 }, { "epoch": 1.8983050847457628, "grad_norm": 0.39934323363745766, "learning_rate": 3.654379649718153e-05, "loss": 0.3059, "loss_nan_ranks": 0, "loss_rank_avg": 0.16052965819835663, "step": 1120, "valid_targets_mean": 8141.9, "valid_targets_min": 2341 }, { "epoch": 1.9067796610169492, "grad_norm": 0.425180656486338, "learning_rate": 3.649615545279127e-05, "loss": 0.3443, "loss_nan_ranks": 0, "loss_rank_avg": 0.23255954682826996, "step": 1125, "valid_targets_mean": 8977.1, "valid_targets_min": 1589 }, { "epoch": 1.9152542372881356, "grad_norm": 0.4134843945605497, "learning_rate": 3.644821980569876e-05, "loss": 0.3293, "loss_nan_ranks": 0, "loss_rank_avg": 0.18696650862693787, "step": 1130, "valid_targets_mean": 9344.6, "valid_targets_min": 2897 }, { "epoch": 1.923728813559322, "grad_norm": 0.4247315776579201, "learning_rate": 3.639999041198051e-05, "loss": 0.3106, "loss_nan_ranks": 0, "loss_rank_avg": 0.15916836261749268, "step": 1135, "valid_targets_mean": 7757.0, "valid_targets_min": 2240 }, { "epoch": 1.9322033898305084, "grad_norm": 0.4285608095339475, "learning_rate": 3.635146813295902e-05, "loss": 0.3347, "loss_nan_ranks": 0, "loss_rank_avg": 0.12798747420310974, "step": 1140, "valid_targets_mean": 7018.9, "valid_targets_min": 3392 }, { "epoch": 1.940677966101695, "grad_norm": 0.4320951231170634, "learning_rate": 3.6302653835187366e-05, "loss": 0.3154, "loss_nan_ranks": 0, "loss_rank_avg": 0.2193724513053894, "step": 1145, "valid_targets_mean": 8454.5, "valid_targets_min": 4385 }, { "epoch": 1.9491525423728815, "grad_norm": 0.3679163355593773, "learning_rate": 3.625354839043377e-05, "loss": 0.2863, "loss_nan_ranks": 0, "loss_rank_avg": 0.2157258540391922, "step": 1150, "valid_targets_mean": 12249.4, "valid_targets_min": 4241 }, { "epoch": 1.957627118644068, "grad_norm": 0.4102455825218708, "learning_rate": 3.620415267566601e-05, "loss": 0.3306, "loss_nan_ranks": 0, "loss_rank_avg": 0.12105512619018555, "step": 1155, "valid_targets_mean": 7516.5, "valid_targets_min": 3222 }, { "epoch": 1.9661016949152543, "grad_norm": 0.4175220017891001, "learning_rate": 3.615446757303575e-05, "loss": 0.3221, "loss_nan_ranks": 0, "loss_rank_avg": 0.17339207231998444, "step": 1160, "valid_targets_mean": 8759.4, "valid_targets_min": 2960 }, { "epoch": 1.9745762711864407, "grad_norm": 0.44844776216498816, "learning_rate": 3.610449396986281e-05, "loss": 0.3084, "loss_nan_ranks": 0, "loss_rank_avg": 0.09378059208393097, "step": 1165, "valid_targets_mean": 5834.0, "valid_targets_min": 2096 }, { "epoch": 1.9830508474576272, "grad_norm": 0.44812744257447257, "learning_rate": 3.6054232758619274e-05, "loss": 0.3161, "loss_nan_ranks": 0, "loss_rank_avg": 0.1947910189628601, "step": 1170, "valid_targets_mean": 7453.2, "valid_targets_min": 2451 }, { "epoch": 1.9915254237288136, "grad_norm": 0.4242232674193107, "learning_rate": 3.600368483691361e-05, "loss": 0.3279, "loss_nan_ranks": 0, "loss_rank_avg": 0.13258054852485657, "step": 1175, "valid_targets_mean": 7682.2, "valid_targets_min": 2492 }, { "epoch": 2.0, "grad_norm": 0.45289022894013076, "learning_rate": 3.59528511074746e-05, "loss": 0.299, "loss_nan_ranks": 0, "loss_rank_avg": 0.12481173872947693, "step": 1180, "valid_targets_mean": 5148.2, "valid_targets_min": 1999 }, { "epoch": 2.0084745762711864, "grad_norm": 0.47796518296033785, "learning_rate": 3.5901732478135235e-05, "loss": 0.3136, "loss_nan_ranks": 0, "loss_rank_avg": 0.15180028975009918, "step": 1185, "valid_targets_mean": 6321.6, "valid_targets_min": 2236 }, { "epoch": 2.016949152542373, "grad_norm": 0.438352359074808, "learning_rate": 3.5850329861816475e-05, "loss": 0.2817, "loss_nan_ranks": 0, "loss_rank_avg": 0.12889432907104492, "step": 1190, "valid_targets_mean": 6916.6, "valid_targets_min": 2771 }, { "epoch": 2.0254237288135593, "grad_norm": 0.4126031654763985, "learning_rate": 3.5798644176511e-05, "loss": 0.2969, "loss_nan_ranks": 0, "loss_rank_avg": 0.09737379848957062, "step": 1195, "valid_targets_mean": 6256.8, "valid_targets_min": 3050 }, { "epoch": 2.0338983050847457, "grad_norm": 0.408111961548012, "learning_rate": 3.574667634526676e-05, "loss": 0.3122, "loss_nan_ranks": 0, "loss_rank_avg": 0.14440008997917175, "step": 1200, "valid_targets_mean": 7384.1, "valid_targets_min": 2779 }, { "epoch": 2.042372881355932, "grad_norm": 0.455628995610143, "learning_rate": 3.5694427296170514e-05, "loss": 0.3048, "loss_nan_ranks": 0, "loss_rank_avg": 0.16236944496631622, "step": 1205, "valid_targets_mean": 8072.6, "valid_targets_min": 4463 }, { "epoch": 2.0508474576271185, "grad_norm": 0.43337894990516485, "learning_rate": 3.564189796233125e-05, "loss": 0.3144, "loss_nan_ranks": 0, "loss_rank_avg": 0.22974911332130432, "step": 1210, "valid_targets_mean": 9636.9, "valid_targets_min": 3097 }, { "epoch": 2.059322033898305, "grad_norm": 0.40732481179936597, "learning_rate": 3.5589089281863547e-05, "loss": 0.2969, "loss_nan_ranks": 0, "loss_rank_avg": 0.1029449924826622, "step": 1215, "valid_targets_mean": 7567.2, "valid_targets_min": 2751 }, { "epoch": 2.0677966101694913, "grad_norm": 0.4252300433877439, "learning_rate": 3.553600219787079e-05, "loss": 0.2906, "loss_nan_ranks": 0, "loss_rank_avg": 0.19273892045021057, "step": 1220, "valid_targets_mean": 8599.9, "valid_targets_min": 3639 }, { "epoch": 2.0762711864406778, "grad_norm": 0.4546211585832868, "learning_rate": 3.5482637658428315e-05, "loss": 0.2949, "loss_nan_ranks": 0, "loss_rank_avg": 0.23350149393081665, "step": 1225, "valid_targets_mean": 9294.4, "valid_targets_min": 1933 }, { "epoch": 2.084745762711864, "grad_norm": 0.4145817713099008, "learning_rate": 3.542899661656653e-05, "loss": 0.3212, "loss_nan_ranks": 0, "loss_rank_avg": 0.1794952154159546, "step": 1230, "valid_targets_mean": 9705.6, "valid_targets_min": 4885 }, { "epoch": 2.093220338983051, "grad_norm": 0.5271058668855069, "learning_rate": 3.5375080030253826e-05, "loss": 0.3432, "loss_nan_ranks": 0, "loss_rank_avg": 0.12348256260156631, "step": 1235, "valid_targets_mean": 6719.0, "valid_targets_min": 3708 }, { "epoch": 2.1016949152542375, "grad_norm": 0.4232353398881956, "learning_rate": 3.532088886237956e-05, "loss": 0.3022, "loss_nan_ranks": 0, "loss_rank_avg": 0.10980045795440674, "step": 1240, "valid_targets_mean": 6338.2, "valid_targets_min": 3309 }, { "epoch": 2.110169491525424, "grad_norm": 0.45183791890941466, "learning_rate": 3.5266424080736765e-05, "loss": 0.3079, "loss_nan_ranks": 0, "loss_rank_avg": 0.15499433875083923, "step": 1245, "valid_targets_mean": 7531.9, "valid_targets_min": 3690 }, { "epoch": 2.1186440677966103, "grad_norm": 0.43508072611158927, "learning_rate": 3.521168665800491e-05, "loss": 0.3222, "loss_nan_ranks": 0, "loss_rank_avg": 0.2509422302246094, "step": 1250, "valid_targets_mean": 13284.1, "valid_targets_min": 5966 }, { "epoch": 2.1271186440677967, "grad_norm": 0.42735089982934016, "learning_rate": 3.515667757173254e-05, "loss": 0.2953, "loss_nan_ranks": 0, "loss_rank_avg": 0.13675671815872192, "step": 1255, "valid_targets_mean": 7142.9, "valid_targets_min": 2413 }, { "epoch": 2.135593220338983, "grad_norm": 0.40760862132146264, "learning_rate": 3.5101397804319794e-05, "loss": 0.2859, "loss_nan_ranks": 0, "loss_rank_avg": 0.17705723643302917, "step": 1260, "valid_targets_mean": 8875.0, "valid_targets_min": 3101 }, { "epoch": 2.1440677966101696, "grad_norm": 0.4900166239838904, "learning_rate": 3.5045848343000876e-05, "loss": 0.2858, "loss_nan_ranks": 0, "loss_rank_avg": 0.1725788712501526, "step": 1265, "valid_targets_mean": 7732.4, "valid_targets_min": 2984 }, { "epoch": 2.152542372881356, "grad_norm": 0.428816419240488, "learning_rate": 3.4990030179826414e-05, "loss": 0.3253, "loss_nan_ranks": 0, "loss_rank_avg": 0.20709286630153656, "step": 1270, "valid_targets_mean": 10128.1, "valid_targets_min": 4459 }, { "epoch": 2.1610169491525424, "grad_norm": 0.40014932477968135, "learning_rate": 3.493394431164576e-05, "loss": 0.2927, "loss_nan_ranks": 0, "loss_rank_avg": 0.15721966326236725, "step": 1275, "valid_targets_mean": 8368.9, "valid_targets_min": 4914 }, { "epoch": 2.169491525423729, "grad_norm": 0.460349336503394, "learning_rate": 3.4877591740089144e-05, "loss": 0.3034, "loss_nan_ranks": 0, "loss_rank_avg": 0.12180677056312561, "step": 1280, "valid_targets_mean": 6484.2, "valid_targets_min": 2984 }, { "epoch": 2.1779661016949152, "grad_norm": 0.4167414151848438, "learning_rate": 3.482097347154986e-05, "loss": 0.2945, "loss_nan_ranks": 0, "loss_rank_avg": 0.15773698687553406, "step": 1285, "valid_targets_mean": 8676.9, "valid_targets_min": 2724 }, { "epoch": 2.1864406779661016, "grad_norm": 0.4119767997336977, "learning_rate": 3.476409051716621e-05, "loss": 0.3075, "loss_nan_ranks": 0, "loss_rank_avg": 0.19150680303573608, "step": 1290, "valid_targets_mean": 9972.0, "valid_targets_min": 4367 }, { "epoch": 2.194915254237288, "grad_norm": 0.46842012389861176, "learning_rate": 3.470694389280352e-05, "loss": 0.2894, "loss_nan_ranks": 0, "loss_rank_avg": 0.13265065848827362, "step": 1295, "valid_targets_mean": 6506.4, "valid_targets_min": 2591 }, { "epoch": 2.2033898305084745, "grad_norm": 0.5070785490329287, "learning_rate": 3.464953461903593e-05, "loss": 0.2815, "loss_nan_ranks": 0, "loss_rank_avg": 0.16730618476867676, "step": 1300, "valid_targets_mean": 7640.6, "valid_targets_min": 2556 }, { "epoch": 2.211864406779661, "grad_norm": 0.44925860012957636, "learning_rate": 3.459186372112824e-05, "loss": 0.3067, "loss_nan_ranks": 0, "loss_rank_avg": 0.12842459976673126, "step": 1305, "valid_targets_mean": 6798.6, "valid_targets_min": 3979 }, { "epoch": 2.2203389830508473, "grad_norm": 0.41138242525433244, "learning_rate": 3.453393222901753e-05, "loss": 0.3239, "loss_nan_ranks": 0, "loss_rank_avg": 0.09415019303560257, "step": 1310, "valid_targets_mean": 7214.1, "valid_targets_min": 2008 }, { "epoch": 2.2288135593220337, "grad_norm": 0.41131324862852436, "learning_rate": 3.44757411772948e-05, "loss": 0.3134, "loss_nan_ranks": 0, "loss_rank_avg": 0.173304945230484, "step": 1315, "valid_targets_mean": 8934.2, "valid_targets_min": 3731 }, { "epoch": 2.23728813559322, "grad_norm": 0.47453310588934633, "learning_rate": 3.441729160518652e-05, "loss": 0.326, "loss_nan_ranks": 0, "loss_rank_avg": 0.20205450057983398, "step": 1320, "valid_targets_mean": 8631.2, "valid_targets_min": 3796 }, { "epoch": 2.2457627118644066, "grad_norm": 0.43201686834502273, "learning_rate": 3.435858455653601e-05, "loss": 0.3064, "loss_nan_ranks": 0, "loss_rank_avg": 0.13337936997413635, "step": 1325, "valid_targets_mean": 7937.0, "valid_targets_min": 2699 }, { "epoch": 2.2542372881355934, "grad_norm": 0.458779232154746, "learning_rate": 3.429962107978485e-05, "loss": 0.3096, "loss_nan_ranks": 0, "loss_rank_avg": 0.1039549931883812, "step": 1330, "valid_targets_mean": 5822.1, "valid_targets_min": 2106 }, { "epoch": 2.26271186440678, "grad_norm": 0.40314998050323314, "learning_rate": 3.424040222795412e-05, "loss": 0.3012, "loss_nan_ranks": 0, "loss_rank_avg": 0.10799141228199005, "step": 1335, "valid_targets_mean": 6850.5, "valid_targets_min": 3619 }, { "epoch": 2.2711864406779663, "grad_norm": 0.4249827679361363, "learning_rate": 3.418092905862563e-05, "loss": 0.2919, "loss_nan_ranks": 0, "loss_rank_avg": 0.1282862275838852, "step": 1340, "valid_targets_mean": 7501.6, "valid_targets_min": 4154 }, { "epoch": 2.2796610169491527, "grad_norm": 0.45225084379688923, "learning_rate": 3.412120263392301e-05, "loss": 0.2935, "loss_nan_ranks": 0, "loss_rank_avg": 0.15831294655799866, "step": 1345, "valid_targets_mean": 8395.9, "valid_targets_min": 5077 }, { "epoch": 2.288135593220339, "grad_norm": 0.4323979115648768, "learning_rate": 3.406122402049272e-05, "loss": 0.3187, "loss_nan_ranks": 0, "loss_rank_avg": 0.1440098136663437, "step": 1350, "valid_targets_mean": 8358.2, "valid_targets_min": 3033 }, { "epoch": 2.2966101694915255, "grad_norm": 0.44798843437203717, "learning_rate": 3.400099428948505e-05, "loss": 0.2964, "loss_nan_ranks": 0, "loss_rank_avg": 0.24259638786315918, "step": 1355, "valid_targets_mean": 9828.9, "valid_targets_min": 3934 }, { "epoch": 2.305084745762712, "grad_norm": 0.4118065309385498, "learning_rate": 3.394051451653496e-05, "loss": 0.2987, "loss_nan_ranks": 0, "loss_rank_avg": 0.12573987245559692, "step": 1360, "valid_targets_mean": 7931.0, "valid_targets_min": 5094 }, { "epoch": 2.3135593220338984, "grad_norm": 0.43851923519918656, "learning_rate": 3.3879785781742875e-05, "loss": 0.3164, "loss_nan_ranks": 0, "loss_rank_avg": 0.18017522990703583, "step": 1365, "valid_targets_mean": 8832.6, "valid_targets_min": 3053 }, { "epoch": 2.3220338983050848, "grad_norm": 0.49539123931874524, "learning_rate": 3.381880916965541e-05, "loss": 0.2939, "loss_nan_ranks": 0, "loss_rank_avg": 0.10733641684055328, "step": 1370, "valid_targets_mean": 5227.6, "valid_targets_min": 2791 }, { "epoch": 2.330508474576271, "grad_norm": 0.512139157052037, "learning_rate": 3.3757585769245964e-05, "loss": 0.312, "loss_nan_ranks": 0, "loss_rank_avg": 0.151132732629776, "step": 1375, "valid_targets_mean": 7262.0, "valid_targets_min": 3945 }, { "epoch": 2.3389830508474576, "grad_norm": 0.4416566028201391, "learning_rate": 3.3696116673895314e-05, "loss": 0.3211, "loss_nan_ranks": 0, "loss_rank_avg": 0.2037435919046402, "step": 1380, "valid_targets_mean": 9578.2, "valid_targets_min": 3736 }, { "epoch": 2.347457627118644, "grad_norm": 0.45082149557407764, "learning_rate": 3.363440298137207e-05, "loss": 0.3071, "loss_nan_ranks": 0, "loss_rank_avg": 0.12679685652256012, "step": 1385, "valid_targets_mean": 6039.9, "valid_targets_min": 2300 }, { "epoch": 2.3559322033898304, "grad_norm": 0.4421724624356205, "learning_rate": 3.357244579381306e-05, "loss": 0.2908, "loss_nan_ranks": 0, "loss_rank_avg": 0.14652232825756073, "step": 1390, "valid_targets_mean": 7244.0, "valid_targets_min": 1903 }, { "epoch": 2.364406779661017, "grad_norm": 0.4495061538438427, "learning_rate": 3.351024621770369e-05, "loss": 0.2983, "loss_nan_ranks": 0, "loss_rank_avg": 0.0919191762804985, "step": 1395, "valid_targets_mean": 5043.9, "valid_targets_min": 2452 }, { "epoch": 2.3728813559322033, "grad_norm": 0.45212052889171317, "learning_rate": 3.34478053638581e-05, "loss": 0.2859, "loss_nan_ranks": 0, "loss_rank_avg": 0.14459501206874847, "step": 1400, "valid_targets_mean": 7165.5, "valid_targets_min": 1936 }, { "epoch": 2.3813559322033897, "grad_norm": 0.45753710310314344, "learning_rate": 3.3385124347399415e-05, "loss": 0.2757, "loss_nan_ranks": 0, "loss_rank_avg": 0.11004475504159927, "step": 1405, "valid_targets_mean": 7322.9, "valid_targets_min": 2350 }, { "epoch": 2.389830508474576, "grad_norm": 0.4527197832006006, "learning_rate": 3.33222042877398e-05, "loss": 0.301, "loss_nan_ranks": 0, "loss_rank_avg": 0.17083138227462769, "step": 1410, "valid_targets_mean": 7809.4, "valid_targets_min": 2393 }, { "epoch": 2.3983050847457625, "grad_norm": 0.3772050754545617, "learning_rate": 3.325904630856042e-05, "loss": 0.2956, "loss_nan_ranks": 0, "loss_rank_avg": 0.18102893233299255, "step": 1415, "valid_targets_mean": 10666.2, "valid_targets_min": 3513 }, { "epoch": 2.406779661016949, "grad_norm": 0.4563452741739858, "learning_rate": 3.319565153779146e-05, "loss": 0.3467, "loss_nan_ranks": 0, "loss_rank_avg": 0.26052290201187134, "step": 1420, "valid_targets_mean": 10017.8, "valid_targets_min": 5124 }, { "epoch": 2.415254237288136, "grad_norm": 0.46401872953783496, "learning_rate": 3.31320211075919e-05, "loss": 0.3201, "loss_nan_ranks": 0, "loss_rank_avg": 0.1795731782913208, "step": 1425, "valid_targets_mean": 7820.4, "valid_targets_min": 2278 }, { "epoch": 2.423728813559322, "grad_norm": 0.4298768255585762, "learning_rate": 3.306815615432936e-05, "loss": 0.3383, "loss_nan_ranks": 0, "loss_rank_avg": 0.1531204879283905, "step": 1430, "valid_targets_mean": 8088.8, "valid_targets_min": 2989 }, { "epoch": 2.4322033898305087, "grad_norm": 0.42943975120474337, "learning_rate": 3.300405781855975e-05, "loss": 0.2942, "loss_nan_ranks": 0, "loss_rank_avg": 0.19165225327014923, "step": 1435, "valid_targets_mean": 9201.4, "valid_targets_min": 6019 }, { "epoch": 2.440677966101695, "grad_norm": 0.3977047765538059, "learning_rate": 3.2939727245006956e-05, "loss": 0.2999, "loss_nan_ranks": 0, "loss_rank_avg": 0.15969790518283844, "step": 1440, "valid_targets_mean": 8977.9, "valid_targets_min": 2996 }, { "epoch": 2.4491525423728815, "grad_norm": 0.43392603484157843, "learning_rate": 3.2875165582542347e-05, "loss": 0.3049, "loss_nan_ranks": 0, "loss_rank_avg": 0.09724732488393784, "step": 1445, "valid_targets_mean": 6136.5, "valid_targets_min": 3622 }, { "epoch": 2.457627118644068, "grad_norm": 0.39026794378770674, "learning_rate": 3.281037398416427e-05, "loss": 0.2698, "loss_nan_ranks": 0, "loss_rank_avg": 0.12890513241291046, "step": 1450, "valid_targets_mean": 6924.1, "valid_targets_min": 2394 }, { "epoch": 2.4661016949152543, "grad_norm": 0.4242919077715597, "learning_rate": 3.2745353606977506e-05, "loss": 0.3159, "loss_nan_ranks": 0, "loss_rank_avg": 0.1096186563372612, "step": 1455, "valid_targets_mean": 7928.4, "valid_targets_min": 3062 }, { "epoch": 2.4745762711864407, "grad_norm": 0.4289426904620235, "learning_rate": 3.268010561217253e-05, "loss": 0.308, "loss_nan_ranks": 0, "loss_rank_avg": 0.13930077850818634, "step": 1460, "valid_targets_mean": 8676.9, "valid_targets_min": 4315 }, { "epoch": 2.483050847457627, "grad_norm": 0.4051021933769338, "learning_rate": 3.261463116500483e-05, "loss": 0.2942, "loss_nan_ranks": 0, "loss_rank_avg": 0.10786758363246918, "step": 1465, "valid_targets_mean": 6350.8, "valid_targets_min": 2847 }, { "epoch": 2.4915254237288136, "grad_norm": 0.4019638092945469, "learning_rate": 3.254893143477408e-05, "loss": 0.2916, "loss_nan_ranks": 0, "loss_rank_avg": 0.20479941368103027, "step": 1470, "valid_targets_mean": 10263.6, "valid_targets_min": 2865 }, { "epoch": 2.5, "grad_norm": 0.4299334544244074, "learning_rate": 3.248300759480323e-05, "loss": 0.3183, "loss_nan_ranks": 0, "loss_rank_avg": 0.2492760419845581, "step": 1475, "valid_targets_mean": 10219.6, "valid_targets_min": 5175 }, { "epoch": 2.5084745762711864, "grad_norm": 0.4023371948985823, "learning_rate": 3.241686082241761e-05, "loss": 0.2857, "loss_nan_ranks": 0, "loss_rank_avg": 0.1464785933494568, "step": 1480, "valid_targets_mean": 8838.9, "valid_targets_min": 2493 }, { "epoch": 2.516949152542373, "grad_norm": 0.41294672992405235, "learning_rate": 3.235049229892384e-05, "loss": 0.2655, "loss_nan_ranks": 0, "loss_rank_avg": 0.12958091497421265, "step": 1485, "valid_targets_mean": 7342.2, "valid_targets_min": 4829 }, { "epoch": 2.5254237288135593, "grad_norm": 0.3831925532498252, "learning_rate": 3.2283903209588795e-05, "loss": 0.3178, "loss_nan_ranks": 0, "loss_rank_avg": 0.1335603892803192, "step": 1490, "valid_targets_mean": 7712.6, "valid_targets_min": 2385 }, { "epoch": 2.5338983050847457, "grad_norm": 0.4157070224630618, "learning_rate": 3.221709474361838e-05, "loss": 0.3008, "loss_nan_ranks": 0, "loss_rank_avg": 0.12635986506938934, "step": 1495, "valid_targets_mean": 6957.0, "valid_targets_min": 2932 }, { "epoch": 2.542372881355932, "grad_norm": 0.4224344033837063, "learning_rate": 3.215006809413633e-05, "loss": 0.3194, "loss_nan_ranks": 0, "loss_rank_avg": 0.1392759382724762, "step": 1500, "valid_targets_mean": 6384.5, "valid_targets_min": 2434 }, { "epoch": 2.5508474576271185, "grad_norm": 0.43012730740401234, "learning_rate": 3.20828244581629e-05, "loss": 0.2878, "loss_nan_ranks": 0, "loss_rank_avg": 0.1791025698184967, "step": 1505, "valid_targets_mean": 7117.2, "valid_targets_min": 1495 }, { "epoch": 2.559322033898305, "grad_norm": 0.4845914897087292, "learning_rate": 3.2015365036593466e-05, "loss": 0.3306, "loss_nan_ranks": 0, "loss_rank_avg": 0.1442946195602417, "step": 1510, "valid_targets_mean": 9361.6, "valid_targets_min": 4450 }, { "epoch": 2.5677966101694913, "grad_norm": 0.4020720093483181, "learning_rate": 3.194769103417709e-05, "loss": 0.2901, "loss_nan_ranks": 0, "loss_rank_avg": 0.2034224271774292, "step": 1515, "valid_targets_mean": 8227.0, "valid_targets_min": 2913 }, { "epoch": 2.576271186440678, "grad_norm": 0.47515037487881684, "learning_rate": 3.1879803659495015e-05, "loss": 0.2974, "loss_nan_ranks": 0, "loss_rank_avg": 0.09358513355255127, "step": 1520, "valid_targets_mean": 5848.9, "valid_targets_min": 2633 }, { "epoch": 2.584745762711864, "grad_norm": 0.4525136249871132, "learning_rate": 3.181170412493906e-05, "loss": 0.2957, "loss_nan_ranks": 0, "loss_rank_avg": 0.14096501469612122, "step": 1525, "valid_targets_mean": 5804.8, "valid_targets_min": 2873 }, { "epoch": 2.593220338983051, "grad_norm": 0.44499842842422144, "learning_rate": 3.1743393646689996e-05, "loss": 0.2689, "loss_nan_ranks": 0, "loss_rank_avg": 0.13607238233089447, "step": 1530, "valid_targets_mean": 7015.5, "valid_targets_min": 3650 }, { "epoch": 2.601694915254237, "grad_norm": 0.39010435281227923, "learning_rate": 3.1674873444695804e-05, "loss": 0.2838, "loss_nan_ranks": 0, "loss_rank_avg": 0.15358000993728638, "step": 1535, "valid_targets_mean": 8212.6, "valid_targets_min": 4561 }, { "epoch": 2.610169491525424, "grad_norm": 0.38705505466621165, "learning_rate": 3.1606144742649875e-05, "loss": 0.2974, "loss_nan_ranks": 0, "loss_rank_avg": 0.18068253993988037, "step": 1540, "valid_targets_mean": 9366.8, "valid_targets_min": 3442 }, { "epoch": 2.6186440677966103, "grad_norm": 0.4645250007783615, "learning_rate": 3.15372087679692e-05, "loss": 0.2697, "loss_nan_ranks": 0, "loss_rank_avg": 0.16335920989513397, "step": 1545, "valid_targets_mean": 7294.8, "valid_targets_min": 2880 }, { "epoch": 2.6271186440677967, "grad_norm": 0.5969381310791982, "learning_rate": 3.1468066751772415e-05, "loss": 0.2987, "loss_nan_ranks": 0, "loss_rank_avg": 0.20474021136760712, "step": 1550, "valid_targets_mean": 9866.2, "valid_targets_min": 3896 }, { "epoch": 2.635593220338983, "grad_norm": 0.39986488663805625, "learning_rate": 3.1398719928857834e-05, "loss": 0.2852, "loss_nan_ranks": 0, "loss_rank_avg": 0.16469399631023407, "step": 1555, "valid_targets_mean": 9266.1, "valid_targets_min": 2559 }, { "epoch": 2.6440677966101696, "grad_norm": 0.42603497362335596, "learning_rate": 3.132916953768137e-05, "loss": 0.2842, "loss_nan_ranks": 0, "loss_rank_avg": 0.15886007249355316, "step": 1560, "valid_targets_mean": 7792.9, "valid_targets_min": 2695 }, { "epoch": 2.652542372881356, "grad_norm": 0.4477773300510562, "learning_rate": 3.1259416820334446e-05, "loss": 0.2917, "loss_nan_ranks": 0, "loss_rank_avg": 0.1468237042427063, "step": 1565, "valid_targets_mean": 6308.1, "valid_targets_min": 2530 }, { "epoch": 2.6610169491525424, "grad_norm": 0.413038718975138, "learning_rate": 3.118946302252181e-05, "loss": 0.2752, "loss_nan_ranks": 0, "loss_rank_avg": 0.11161170154809952, "step": 1570, "valid_targets_mean": 5875.2, "valid_targets_min": 3706 }, { "epoch": 2.669491525423729, "grad_norm": 0.40102607092450826, "learning_rate": 3.1119309393539256e-05, "loss": 0.2763, "loss_nan_ranks": 0, "loss_rank_avg": 0.1047399640083313, "step": 1575, "valid_targets_mean": 6100.2, "valid_targets_min": 2617 }, { "epoch": 2.6779661016949152, "grad_norm": 0.4487526831600451, "learning_rate": 3.104895718625136e-05, "loss": 0.2875, "loss_nan_ranks": 0, "loss_rank_avg": 0.19679084420204163, "step": 1580, "valid_targets_mean": 9194.9, "valid_targets_min": 3588 }, { "epoch": 2.6864406779661016, "grad_norm": 0.4319081942251288, "learning_rate": 3.097840765706908e-05, "loss": 0.3087, "loss_nan_ranks": 0, "loss_rank_avg": 0.16104386746883392, "step": 1585, "valid_targets_mean": 7758.5, "valid_targets_min": 2699 }, { "epoch": 2.694915254237288, "grad_norm": 0.4362156095926864, "learning_rate": 3.0907662065927297e-05, "loss": 0.2998, "loss_nan_ranks": 0, "loss_rank_avg": 0.17210246622562408, "step": 1590, "valid_targets_mean": 7771.1, "valid_targets_min": 4059 }, { "epoch": 2.7033898305084745, "grad_norm": 0.3805861970091732, "learning_rate": 3.083672167626237e-05, "loss": 0.3063, "loss_nan_ranks": 0, "loss_rank_avg": 0.1351141780614853, "step": 1595, "valid_targets_mean": 8147.1, "valid_targets_min": 3440 }, { "epoch": 2.711864406779661, "grad_norm": 0.41117431133265786, "learning_rate": 3.0765587754989516e-05, "loss": 0.2884, "loss_nan_ranks": 0, "loss_rank_avg": 0.2080633044242859, "step": 1600, "valid_targets_mean": 10313.1, "valid_targets_min": 4746 }, { "epoch": 2.7203389830508473, "grad_norm": 0.4193393539029648, "learning_rate": 3.069426157248022e-05, "loss": 0.2883, "loss_nan_ranks": 0, "loss_rank_avg": 0.1242239847779274, "step": 1605, "valid_targets_mean": 7685.4, "valid_targets_min": 2538 }, { "epoch": 2.7288135593220337, "grad_norm": 0.40390165294921654, "learning_rate": 3.062274440253953e-05, "loss": 0.3238, "loss_nan_ranks": 0, "loss_rank_avg": 0.1672280728816986, "step": 1610, "valid_targets_mean": 8736.0, "valid_targets_min": 2510 }, { "epoch": 2.7372881355932206, "grad_norm": 0.4597361076436166, "learning_rate": 3.0551037522383325e-05, "loss": 0.3077, "loss_nan_ranks": 0, "loss_rank_avg": 0.13972532749176025, "step": 1615, "valid_targets_mean": 6083.9, "valid_targets_min": 2965 }, { "epoch": 2.7457627118644066, "grad_norm": 0.3801055818275529, "learning_rate": 3.0479142212615457e-05, "loss": 0.3031, "loss_nan_ranks": 0, "loss_rank_avg": 0.14896857738494873, "step": 1620, "valid_targets_mean": 8904.1, "valid_targets_min": 2302 }, { "epoch": 2.7542372881355934, "grad_norm": 0.37492323834267705, "learning_rate": 3.0407059757204968e-05, "loss": 0.3108, "loss_nan_ranks": 0, "loss_rank_avg": 0.11933213472366333, "step": 1625, "valid_targets_mean": 7426.5, "valid_targets_min": 2795 }, { "epoch": 2.7627118644067794, "grad_norm": 0.39976463787165845, "learning_rate": 3.033479144346308e-05, "loss": 0.3374, "loss_nan_ranks": 0, "loss_rank_avg": 0.16365092992782593, "step": 1630, "valid_targets_mean": 8906.2, "valid_targets_min": 4011 }, { "epoch": 2.7711864406779663, "grad_norm": 0.3997723207190587, "learning_rate": 3.0262338562020246e-05, "loss": 0.3026, "loss_nan_ranks": 0, "loss_rank_avg": 0.11927295476198196, "step": 1635, "valid_targets_mean": 6491.0, "valid_targets_min": 2532 }, { "epoch": 2.7796610169491527, "grad_norm": 0.36564215466073935, "learning_rate": 3.018970240680308e-05, "loss": 0.3071, "loss_nan_ranks": 0, "loss_rank_avg": 0.19709117710590363, "step": 1640, "valid_targets_mean": 11646.2, "valid_targets_min": 4338 }, { "epoch": 2.788135593220339, "grad_norm": 0.40505026371761105, "learning_rate": 3.011688427501126e-05, "loss": 0.3058, "loss_nan_ranks": 0, "loss_rank_avg": 0.19479559361934662, "step": 1645, "valid_targets_mean": 10186.4, "valid_targets_min": 4347 }, { "epoch": 2.7966101694915255, "grad_norm": 0.39795771334611546, "learning_rate": 3.0043885467094382e-05, "loss": 0.3121, "loss_nan_ranks": 0, "loss_rank_avg": 0.09027592837810516, "step": 1650, "valid_targets_mean": 5524.0, "valid_targets_min": 2597 }, { "epoch": 2.805084745762712, "grad_norm": 0.4041662599563723, "learning_rate": 2.9970707286728676e-05, "loss": 0.2997, "loss_nan_ranks": 0, "loss_rank_avg": 0.1600339710712433, "step": 1655, "valid_targets_mean": 7957.8, "valid_targets_min": 3054 }, { "epoch": 2.8135593220338984, "grad_norm": 0.437401544209369, "learning_rate": 2.9897351040793786e-05, "loss": 0.2776, "loss_nan_ranks": 0, "loss_rank_avg": 0.11536328494548798, "step": 1660, "valid_targets_mean": 5436.1, "valid_targets_min": 2823 }, { "epoch": 2.8220338983050848, "grad_norm": 0.37522109968246403, "learning_rate": 2.9823818039349407e-05, "loss": 0.2783, "loss_nan_ranks": 0, "loss_rank_avg": 0.15367770195007324, "step": 1665, "valid_targets_mean": 8713.4, "valid_targets_min": 2676 }, { "epoch": 2.830508474576271, "grad_norm": 0.3849792093810754, "learning_rate": 2.9750109595611884e-05, "loss": 0.2882, "loss_nan_ranks": 0, "loss_rank_avg": 0.14932164549827576, "step": 1670, "valid_targets_mean": 8313.9, "valid_targets_min": 2584 }, { "epoch": 2.8389830508474576, "grad_norm": 0.4863619459847622, "learning_rate": 2.967622702593074e-05, "loss": 0.2853, "loss_nan_ranks": 0, "loss_rank_avg": 0.1424635946750641, "step": 1675, "valid_targets_mean": 6796.4, "valid_targets_min": 2567 }, { "epoch": 2.847457627118644, "grad_norm": 0.396918930200827, "learning_rate": 2.9602171649765235e-05, "loss": 0.3067, "loss_nan_ranks": 0, "loss_rank_avg": 0.14382398128509521, "step": 1680, "valid_targets_mean": 9150.9, "valid_targets_min": 4866 }, { "epoch": 2.8559322033898304, "grad_norm": 0.4963487698731554, "learning_rate": 2.9527944789660732e-05, "loss": 0.2893, "loss_nan_ranks": 0, "loss_rank_avg": 0.13725848495960236, "step": 1685, "valid_targets_mean": 8448.1, "valid_targets_min": 3413 }, { "epoch": 2.864406779661017, "grad_norm": 0.4856540030020508, "learning_rate": 2.9453547771225088e-05, "loss": 0.2873, "loss_nan_ranks": 0, "loss_rank_avg": 0.13087928295135498, "step": 1690, "valid_targets_mean": 6625.8, "valid_targets_min": 2060 }, { "epoch": 2.8728813559322033, "grad_norm": 0.4718602599329464, "learning_rate": 2.9378981923105026e-05, "loss": 0.2803, "loss_nan_ranks": 0, "loss_rank_avg": 0.12425769120454788, "step": 1695, "valid_targets_mean": 6502.9, "valid_targets_min": 3374 }, { "epoch": 2.8813559322033897, "grad_norm": 0.429811308643893, "learning_rate": 2.930424857696236e-05, "loss": 0.3189, "loss_nan_ranks": 0, "loss_rank_avg": 0.11679084599018097, "step": 1700, "valid_targets_mean": 6725.0, "valid_targets_min": 3680 }, { "epoch": 2.889830508474576, "grad_norm": 0.6106285244411059, "learning_rate": 2.922934906745024e-05, "loss": 0.3187, "loss_nan_ranks": 0, "loss_rank_avg": 0.17136754095554352, "step": 1705, "valid_targets_mean": 8815.4, "valid_targets_min": 3296 }, { "epoch": 2.898305084745763, "grad_norm": 0.40881667558157, "learning_rate": 2.9154284732189285e-05, "loss": 0.3147, "loss_nan_ranks": 0, "loss_rank_avg": 0.103614941239357, "step": 1710, "valid_targets_mean": 7344.6, "valid_targets_min": 3896 }, { "epoch": 2.906779661016949, "grad_norm": 0.40167051142083, "learning_rate": 2.907905691174374e-05, "loss": 0.2885, "loss_nan_ranks": 0, "loss_rank_avg": 0.15157365798950195, "step": 1715, "valid_targets_mean": 7305.6, "valid_targets_min": 2406 }, { "epoch": 2.915254237288136, "grad_norm": 0.44454100171373195, "learning_rate": 2.90036669495975e-05, "loss": 0.3193, "loss_nan_ranks": 0, "loss_rank_avg": 0.2535397410392761, "step": 1720, "valid_targets_mean": 10899.9, "valid_targets_min": 4113 }, { "epoch": 2.923728813559322, "grad_norm": 0.40742031882359336, "learning_rate": 2.8928116192130127e-05, "loss": 0.3201, "loss_nan_ranks": 0, "loss_rank_avg": 0.15399280190467834, "step": 1725, "valid_targets_mean": 8970.1, "valid_targets_min": 4604 }, { "epoch": 2.9322033898305087, "grad_norm": 0.3808270536515648, "learning_rate": 2.8852405988592802e-05, "loss": 0.2801, "loss_nan_ranks": 0, "loss_rank_avg": 0.125367671251297, "step": 1730, "valid_targets_mean": 6888.9, "valid_targets_min": 3687 }, { "epoch": 2.940677966101695, "grad_norm": 0.38551744389083203, "learning_rate": 2.8776537691084247e-05, "loss": 0.2971, "loss_nan_ranks": 0, "loss_rank_avg": 0.2000572681427002, "step": 1735, "valid_targets_mean": 9901.8, "valid_targets_min": 5423 }, { "epoch": 2.9491525423728815, "grad_norm": 0.3958071016569807, "learning_rate": 2.8700512654526543e-05, "loss": 0.303, "loss_nan_ranks": 0, "loss_rank_avg": 0.1151888519525528, "step": 1740, "valid_targets_mean": 6846.0, "valid_targets_min": 3356 }, { "epoch": 2.957627118644068, "grad_norm": 0.4049169362567717, "learning_rate": 2.8624332236640975e-05, "loss": 0.2857, "loss_nan_ranks": 0, "loss_rank_avg": 0.15298178791999817, "step": 1745, "valid_targets_mean": 8275.1, "valid_targets_min": 3234 }, { "epoch": 2.9661016949152543, "grad_norm": 0.40926795857010767, "learning_rate": 2.854799779792375e-05, "loss": 0.2807, "loss_nan_ranks": 0, "loss_rank_avg": 0.122572161257267, "step": 1750, "valid_targets_mean": 6125.0, "valid_targets_min": 1440 }, { "epoch": 2.9745762711864407, "grad_norm": 0.4120145141696389, "learning_rate": 2.8471510701621708e-05, "loss": 0.2838, "loss_nan_ranks": 0, "loss_rank_avg": 0.14707563817501068, "step": 1755, "valid_targets_mean": 8006.0, "valid_targets_min": 2888 }, { "epoch": 2.983050847457627, "grad_norm": 0.4336376958519921, "learning_rate": 2.8394872313707998e-05, "loss": 0.3134, "loss_nan_ranks": 0, "loss_rank_avg": 0.2632421851158142, "step": 1760, "valid_targets_mean": 9177.8, "valid_targets_min": 2312 }, { "epoch": 2.9915254237288136, "grad_norm": 0.44528199555148923, "learning_rate": 2.8318084002857654e-05, "loss": 0.3, "loss_nan_ranks": 0, "loss_rank_avg": 0.14627692103385925, "step": 1765, "valid_targets_mean": 6893.6, "valid_targets_min": 4435 }, { "epoch": 3.0, "grad_norm": 0.4240883829673781, "learning_rate": 2.824114714042317e-05, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.1557423323392868, "step": 1770, "valid_targets_mean": 6871.1, "valid_targets_min": 2648 }, { "epoch": 3.0084745762711864, "grad_norm": 0.3897900675954003, "learning_rate": 2.8164063100409992e-05, "loss": 0.306, "loss_nan_ranks": 0, "loss_rank_avg": 0.17762136459350586, "step": 1775, "valid_targets_mean": 11193.6, "valid_targets_min": 5241 }, { "epoch": 3.016949152542373, "grad_norm": 0.47647182837107177, "learning_rate": 2.8086833259452006e-05, "loss": 0.2565, "loss_nan_ranks": 0, "loss_rank_avg": 0.1492662876844406, "step": 1780, "valid_targets_mean": 7162.5, "valid_targets_min": 2970 }, { "epoch": 3.0254237288135593, "grad_norm": 0.48623120655281904, "learning_rate": 2.8009458996786934e-05, "loss": 0.2875, "loss_nan_ranks": 0, "loss_rank_avg": 0.12112700194120407, "step": 1785, "valid_targets_mean": 7915.6, "valid_targets_min": 4167 }, { "epoch": 3.0338983050847457, "grad_norm": 0.48482652840024115, "learning_rate": 2.7931941694231705e-05, "loss": 0.3197, "loss_nan_ranks": 0, "loss_rank_avg": 0.19166266918182373, "step": 1790, "valid_targets_mean": 9350.4, "valid_targets_min": 3952 }, { "epoch": 3.042372881355932, "grad_norm": 0.43430659240936026, "learning_rate": 2.7854282736157777e-05, "loss": 0.2766, "loss_nan_ranks": 0, "loss_rank_avg": 0.10274215042591095, "step": 1795, "valid_targets_mean": 6751.6, "valid_targets_min": 3033 }, { "epoch": 3.0508474576271185, "grad_norm": 0.42824230463335977, "learning_rate": 2.777648350946642e-05, "loss": 0.3051, "loss_nan_ranks": 0, "loss_rank_avg": 0.14262977242469788, "step": 1800, "valid_targets_mean": 7915.8, "valid_targets_min": 4544 }, { "epoch": 3.059322033898305, "grad_norm": 0.39171848978515866, "learning_rate": 2.7698545403563934e-05, "loss": 0.2846, "loss_nan_ranks": 0, "loss_rank_avg": 0.17258086800575256, "step": 1805, "valid_targets_mean": 10852.6, "valid_targets_min": 4410 }, { "epoch": 3.0677966101694913, "grad_norm": 0.42586366102628226, "learning_rate": 2.7620469810336854e-05, "loss": 0.2595, "loss_nan_ranks": 0, "loss_rank_avg": 0.10813435912132263, "step": 1810, "valid_targets_mean": 7451.9, "valid_targets_min": 3605 }, { "epoch": 3.0762711864406778, "grad_norm": 0.5024156841387737, "learning_rate": 2.754225812412708e-05, "loss": 0.286, "loss_nan_ranks": 0, "loss_rank_avg": 0.2416592836380005, "step": 1815, "valid_targets_mean": 10524.9, "valid_targets_min": 3310 }, { "epoch": 3.084745762711864, "grad_norm": 0.4048547245262977, "learning_rate": 2.7463911741706982e-05, "loss": 0.3173, "loss_nan_ranks": 0, "loss_rank_avg": 0.207644984126091, "step": 1820, "valid_targets_mean": 12621.1, "valid_targets_min": 5029 }, { "epoch": 3.093220338983051, "grad_norm": 0.4307490078277596, "learning_rate": 2.738543206225445e-05, "loss": 0.3163, "loss_nan_ranks": 0, "loss_rank_avg": 0.1587986946105957, "step": 1825, "valid_targets_mean": 7724.6, "valid_targets_min": 3033 }, { "epoch": 3.1016949152542375, "grad_norm": 0.3979456347157598, "learning_rate": 2.7306820487327906e-05, "loss": 0.2543, "loss_nan_ranks": 0, "loss_rank_avg": 0.09165980666875839, "step": 1830, "valid_targets_mean": 6352.9, "valid_targets_min": 3636 }, { "epoch": 3.110169491525424, "grad_norm": 0.41012860288675734, "learning_rate": 2.7228078420841277e-05, "loss": 0.2854, "loss_nan_ranks": 0, "loss_rank_avg": 0.15160031616687775, "step": 1835, "valid_targets_mean": 8778.5, "valid_targets_min": 4517 }, { "epoch": 3.1186440677966103, "grad_norm": 0.3676896512476812, "learning_rate": 2.714920726903892e-05, "loss": 0.2595, "loss_nan_ranks": 0, "loss_rank_avg": 0.12810014188289642, "step": 1840, "valid_targets_mean": 9615.2, "valid_targets_min": 2341 }, { "epoch": 3.1271186440677967, "grad_norm": 0.4376407960674012, "learning_rate": 2.7070208440470525e-05, "loss": 0.2995, "loss_nan_ranks": 0, "loss_rank_avg": 0.10664518177509308, "step": 1845, "valid_targets_mean": 6728.5, "valid_targets_min": 1635 }, { "epoch": 3.135593220338983, "grad_norm": 0.4408544143757849, "learning_rate": 2.699108334596592e-05, "loss": 0.2933, "loss_nan_ranks": 0, "loss_rank_avg": 0.13383883237838745, "step": 1850, "valid_targets_mean": 6220.6, "valid_targets_min": 1893 }, { "epoch": 3.1440677966101696, "grad_norm": 0.4171325307219931, "learning_rate": 2.6911833398609923e-05, "loss": 0.2504, "loss_nan_ranks": 0, "loss_rank_avg": 0.13895325362682343, "step": 1855, "valid_targets_mean": 7073.8, "valid_targets_min": 3127 }, { "epoch": 3.152542372881356, "grad_norm": 0.38458629105978887, "learning_rate": 2.683246001371706e-05, "loss": 0.2848, "loss_nan_ranks": 0, "loss_rank_avg": 0.15742285549640656, "step": 1860, "valid_targets_mean": 8551.6, "valid_targets_min": 3754 }, { "epoch": 3.1610169491525424, "grad_norm": 0.43171473858147835, "learning_rate": 2.6752964608806338e-05, "loss": 0.2832, "loss_nan_ranks": 0, "loss_rank_avg": 0.16160979866981506, "step": 1865, "valid_targets_mean": 8368.9, "valid_targets_min": 2778 }, { "epoch": 3.169491525423729, "grad_norm": 0.4050340176255496, "learning_rate": 2.6673348603575884e-05, "loss": 0.2756, "loss_nan_ranks": 0, "loss_rank_avg": 0.11083655059337616, "step": 1870, "valid_targets_mean": 7184.9, "valid_targets_min": 2213 }, { "epoch": 3.1779661016949152, "grad_norm": 0.387647020584462, "learning_rate": 2.6593613419877615e-05, "loss": 0.2906, "loss_nan_ranks": 0, "loss_rank_avg": 0.143922820687294, "step": 1875, "valid_targets_mean": 7900.6, "valid_targets_min": 3621 }, { "epoch": 3.1864406779661016, "grad_norm": 0.42761047108532324, "learning_rate": 2.6513760481691842e-05, "loss": 0.3078, "loss_nan_ranks": 0, "loss_rank_avg": 0.20920830965042114, "step": 1880, "valid_targets_mean": 10595.6, "valid_targets_min": 4433 }, { "epoch": 3.194915254237288, "grad_norm": 0.41992267855603493, "learning_rate": 2.6433791215101848e-05, "loss": 0.2867, "loss_nan_ranks": 0, "loss_rank_avg": 0.16483736038208008, "step": 1885, "valid_targets_mean": 8851.0, "valid_targets_min": 2382 }, { "epoch": 3.2033898305084745, "grad_norm": 0.4957805375483976, "learning_rate": 2.6353707048268397e-05, "loss": 0.3328, "loss_nan_ranks": 0, "loss_rank_avg": 0.19370196759700775, "step": 1890, "valid_targets_mean": 6473.1, "valid_targets_min": 2295 }, { "epoch": 3.211864406779661, "grad_norm": 0.44788686707718267, "learning_rate": 2.6273509411404234e-05, "loss": 0.2979, "loss_nan_ranks": 0, "loss_rank_avg": 0.1875634789466858, "step": 1895, "valid_targets_mean": 8210.6, "valid_targets_min": 2503 }, { "epoch": 3.2203389830508473, "grad_norm": 0.4152706213229902, "learning_rate": 2.6193199736748572e-05, "loss": 0.2844, "loss_nan_ranks": 0, "loss_rank_avg": 0.1070324182510376, "step": 1900, "valid_targets_mean": 6541.2, "valid_targets_min": 3099 }, { "epoch": 3.2288135593220337, "grad_norm": 0.4205334323132011, "learning_rate": 2.611277945854148e-05, "loss": 0.3005, "loss_nan_ranks": 0, "loss_rank_avg": 0.12432655692100525, "step": 1905, "valid_targets_mean": 7172.9, "valid_targets_min": 2347 }, { "epoch": 3.23728813559322, "grad_norm": 0.42085706446217025, "learning_rate": 2.603225001299829e-05, "loss": 0.2999, "loss_nan_ranks": 0, "loss_rank_avg": 0.1846511960029602, "step": 1910, "valid_targets_mean": 9515.6, "valid_targets_min": 2967 }, { "epoch": 3.2457627118644066, "grad_norm": 0.45800092129429243, "learning_rate": 2.595161283828392e-05, "loss": 0.3104, "loss_nan_ranks": 0, "loss_rank_avg": 0.10589482635259628, "step": 1915, "valid_targets_mean": 5909.1, "valid_targets_min": 2628 }, { "epoch": 3.2542372881355934, "grad_norm": 0.4274729974353385, "learning_rate": 2.5870869374487227e-05, "loss": 0.2692, "loss_nan_ranks": 0, "loss_rank_avg": 0.1856462061405182, "step": 1920, "valid_targets_mean": 8283.9, "valid_targets_min": 4400 }, { "epoch": 3.26271186440678, "grad_norm": 0.45054085287704343, "learning_rate": 2.579002106359527e-05, "loss": 0.2954, "loss_nan_ranks": 0, "loss_rank_avg": 0.16199690103530884, "step": 1925, "valid_targets_mean": 6181.9, "valid_targets_min": 2319 }, { "epoch": 3.2711864406779663, "grad_norm": 0.40980194755456195, "learning_rate": 2.5709069349467562e-05, "loss": 0.3383, "loss_nan_ranks": 0, "loss_rank_avg": 0.13299697637557983, "step": 1930, "valid_targets_mean": 8032.4, "valid_targets_min": 2865 }, { "epoch": 3.2796610169491527, "grad_norm": 0.3829926624037664, "learning_rate": 2.562801567781026e-05, "loss": 0.2986, "loss_nan_ranks": 0, "loss_rank_avg": 0.10366646200418472, "step": 1935, "valid_targets_mean": 8115.5, "valid_targets_min": 3637 }, { "epoch": 3.288135593220339, "grad_norm": 0.42359013428814046, "learning_rate": 2.554686149615038e-05, "loss": 0.2566, "loss_nan_ranks": 0, "loss_rank_avg": 0.12953156232833862, "step": 1940, "valid_targets_mean": 8511.0, "valid_targets_min": 5177 }, { "epoch": 3.2966101694915255, "grad_norm": 0.39940930819276965, "learning_rate": 2.5465608253809944e-05, "loss": 0.2642, "loss_nan_ranks": 0, "loss_rank_avg": 0.10232742875814438, "step": 1945, "valid_targets_mean": 7172.9, "valid_targets_min": 1999 }, { "epoch": 3.305084745762712, "grad_norm": 0.43955208594397505, "learning_rate": 2.5384257401880077e-05, "loss": 0.2692, "loss_nan_ranks": 0, "loss_rank_avg": 0.1324247121810913, "step": 1950, "valid_targets_mean": 7481.0, "valid_targets_min": 3559 }, { "epoch": 3.3135593220338984, "grad_norm": 0.4759603073565482, "learning_rate": 2.530281039319509e-05, "loss": 0.2531, "loss_nan_ranks": 0, "loss_rank_avg": 0.1068073958158493, "step": 1955, "valid_targets_mean": 5274.9, "valid_targets_min": 2989 }, { "epoch": 3.3220338983050848, "grad_norm": 0.39533664131007507, "learning_rate": 2.5221268682306565e-05, "loss": 0.2614, "loss_nan_ranks": 0, "loss_rank_avg": 0.12157115340232849, "step": 1960, "valid_targets_mean": 8086.8, "valid_targets_min": 3023 }, { "epoch": 3.330508474576271, "grad_norm": 0.4025452212806949, "learning_rate": 2.5139633725457345e-05, "loss": 0.3042, "loss_nan_ranks": 0, "loss_rank_avg": 0.1479698270559311, "step": 1965, "valid_targets_mean": 8655.5, "valid_targets_min": 3906 }, { "epoch": 3.3389830508474576, "grad_norm": 0.42521063572004575, "learning_rate": 2.505790698055554e-05, "loss": 0.2786, "loss_nan_ranks": 0, "loss_rank_avg": 0.11045683920383453, "step": 1970, "valid_targets_mean": 7279.1, "valid_targets_min": 5657 }, { "epoch": 3.347457627118644, "grad_norm": 0.48755661717841947, "learning_rate": 2.49760899071485e-05, "loss": 0.2911, "loss_nan_ranks": 0, "loss_rank_avg": 0.17295318841934204, "step": 1975, "valid_targets_mean": 7348.9, "valid_targets_min": 2427 }, { "epoch": 3.3559322033898304, "grad_norm": 0.4254688178029983, "learning_rate": 2.4894183966396735e-05, "loss": 0.2686, "loss_nan_ranks": 0, "loss_rank_avg": 0.09378187358379364, "step": 1980, "valid_targets_mean": 5475.5, "valid_targets_min": 2778 }, { "epoch": 3.364406779661017, "grad_norm": 0.367434521784498, "learning_rate": 2.4812190621047822e-05, "loss": 0.294, "loss_nan_ranks": 0, "loss_rank_avg": 0.10478046536445618, "step": 1985, "valid_targets_mean": 8775.1, "valid_targets_min": 4384 }, { "epoch": 3.3728813559322033, "grad_norm": 0.4189507633838683, "learning_rate": 2.4730111335410298e-05, "loss": 0.304, "loss_nan_ranks": 0, "loss_rank_avg": 0.17582011222839355, "step": 1990, "valid_targets_mean": 7836.2, "valid_targets_min": 1645 }, { "epoch": 3.3813559322033897, "grad_norm": 0.400233301929351, "learning_rate": 2.4647947575327468e-05, "loss": 0.2775, "loss_nan_ranks": 0, "loss_rank_avg": 0.09607855975627899, "step": 1995, "valid_targets_mean": 5813.9, "valid_targets_min": 3494 }, { "epoch": 3.389830508474576, "grad_norm": 0.4336791016592384, "learning_rate": 2.4565700808151297e-05, "loss": 0.2513, "loss_nan_ranks": 0, "loss_rank_avg": 0.10696402192115784, "step": 2000, "valid_targets_mean": 6734.2, "valid_targets_min": 3928 }, { "epoch": 3.3983050847457625, "grad_norm": 0.41428448011026164, "learning_rate": 2.4483372502716124e-05, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.0847843810915947, "step": 2005, "valid_targets_mean": 5492.8, "valid_targets_min": 3844 }, { "epoch": 3.406779661016949, "grad_norm": 0.40964037100046546, "learning_rate": 2.44009641293125e-05, "loss": 0.2883, "loss_nan_ranks": 0, "loss_rank_avg": 0.14137449860572815, "step": 2010, "valid_targets_mean": 7062.4, "valid_targets_min": 2779 }, { "epoch": 3.415254237288136, "grad_norm": 0.38682559049197435, "learning_rate": 2.431847715966087e-05, "loss": 0.2797, "loss_nan_ranks": 0, "loss_rank_avg": 0.0912858098745346, "step": 2015, "valid_targets_mean": 6138.2, "valid_targets_min": 2715 }, { "epoch": 3.423728813559322, "grad_norm": 0.48692004450222665, "learning_rate": 2.423591306688534e-05, "loss": 0.2708, "loss_nan_ranks": 0, "loss_rank_avg": 0.11212123930454254, "step": 2020, "valid_targets_mean": 6439.9, "valid_targets_min": 2940 }, { "epoch": 3.4322033898305087, "grad_norm": 0.5255657570421769, "learning_rate": 2.4153273325487346e-05, "loss": 0.279, "loss_nan_ranks": 0, "loss_rank_avg": 0.1764291524887085, "step": 2025, "valid_targets_mean": 8640.4, "valid_targets_min": 2608 }, { "epoch": 3.440677966101695, "grad_norm": 0.4266344445319651, "learning_rate": 2.407055941131932e-05, "loss": 0.2662, "loss_nan_ranks": 0, "loss_rank_avg": 0.18718381226062775, "step": 2030, "valid_targets_mean": 7492.9, "valid_targets_min": 2960 }, { "epoch": 3.4491525423728815, "grad_norm": 0.4211828179123291, "learning_rate": 2.3987772801558328e-05, "loss": 0.2858, "loss_nan_ranks": 0, "loss_rank_avg": 0.21861864626407623, "step": 2035, "valid_targets_mean": 8366.5, "valid_targets_min": 3066 }, { "epoch": 3.457627118644068, "grad_norm": 0.4160233489369109, "learning_rate": 2.3904914974679705e-05, "loss": 0.2831, "loss_nan_ranks": 0, "loss_rank_avg": 0.10223515331745148, "step": 2040, "valid_targets_mean": 6495.2, "valid_targets_min": 3637 }, { "epoch": 3.4661016949152543, "grad_norm": 0.40882160997249284, "learning_rate": 2.3821987410430646e-05, "loss": 0.2652, "loss_nan_ranks": 0, "loss_rank_avg": 0.12576085329055786, "step": 2045, "valid_targets_mean": 7358.2, "valid_targets_min": 2607 }, { "epoch": 3.4745762711864407, "grad_norm": 0.36672520626623, "learning_rate": 2.3738991589803783e-05, "loss": 0.2965, "loss_nan_ranks": 0, "loss_rank_avg": 0.20486734807491302, "step": 2050, "valid_targets_mean": 12180.8, "valid_targets_min": 7787 }, { "epoch": 3.483050847457627, "grad_norm": 0.3853682329233998, "learning_rate": 2.36559289950107e-05, "loss": 0.2794, "loss_nan_ranks": 0, "loss_rank_avg": 0.18601134419441223, "step": 2055, "valid_targets_mean": 9524.1, "valid_targets_min": 3073 }, { "epoch": 3.4915254237288136, "grad_norm": 0.3801472492117076, "learning_rate": 2.357280110945552e-05, "loss": 0.2966, "loss_nan_ranks": 0, "loss_rank_avg": 0.15141558647155762, "step": 2060, "valid_targets_mean": 9554.1, "valid_targets_min": 4884 }, { "epoch": 3.5, "grad_norm": 0.38281552006385716, "learning_rate": 2.3489609417708383e-05, "loss": 0.3091, "loss_nan_ranks": 0, "loss_rank_avg": 0.07897169888019562, "step": 2065, "valid_targets_mean": 6056.4, "valid_targets_min": 2487 }, { "epoch": 3.5084745762711864, "grad_norm": 0.4084426268312189, "learning_rate": 2.340635540547892e-05, "loss": 0.2594, "loss_nan_ranks": 0, "loss_rank_avg": 0.09317970275878906, "step": 2070, "valid_targets_mean": 6611.2, "valid_targets_min": 2457 }, { "epoch": 3.516949152542373, "grad_norm": 0.43668463366477434, "learning_rate": 2.3323040559589755e-05, "loss": 0.2841, "loss_nan_ranks": 0, "loss_rank_avg": 0.1499471664428711, "step": 2075, "valid_targets_mean": 7579.8, "valid_targets_min": 2966 }, { "epoch": 3.5254237288135593, "grad_norm": 0.3983631104396672, "learning_rate": 2.3239666367949917e-05, "loss": 0.2827, "loss_nan_ranks": 0, "loss_rank_avg": 0.1473519206047058, "step": 2080, "valid_targets_mean": 7799.1, "valid_targets_min": 3621 }, { "epoch": 3.5338983050847457, "grad_norm": 0.4120452974947437, "learning_rate": 2.3156234319528295e-05, "loss": 0.2647, "loss_nan_ranks": 0, "loss_rank_avg": 0.0906115174293518, "step": 2085, "valid_targets_mean": 6207.0, "valid_targets_min": 2847 }, { "epoch": 3.542372881355932, "grad_norm": 0.44363425545735335, "learning_rate": 2.3072745904327015e-05, "loss": 0.2936, "loss_nan_ranks": 0, "loss_rank_avg": 0.09172677993774414, "step": 2090, "valid_targets_mean": 6414.6, "valid_targets_min": 5234 }, { "epoch": 3.5508474576271185, "grad_norm": 0.38869052034458823, "learning_rate": 2.298920261335488e-05, "loss": 0.2575, "loss_nan_ranks": 0, "loss_rank_avg": 0.09527749568223953, "step": 2095, "valid_targets_mean": 6330.2, "valid_targets_min": 2577 }, { "epoch": 3.559322033898305, "grad_norm": 0.36643178759344713, "learning_rate": 2.2905605938600685e-05, "loss": 0.2891, "loss_nan_ranks": 0, "loss_rank_avg": 0.20668168365955353, "step": 2100, "valid_targets_mean": 12464.9, "valid_targets_min": 6539 }, { "epoch": 3.5677966101694913, "grad_norm": 0.3959504607284564, "learning_rate": 2.2821957373006617e-05, "loss": 0.262, "loss_nan_ranks": 0, "loss_rank_avg": 0.18114525079727173, "step": 2105, "valid_targets_mean": 10751.5, "valid_targets_min": 6678 }, { "epoch": 3.576271186440678, "grad_norm": 0.41062663468779714, "learning_rate": 2.273825841044156e-05, "loss": 0.2941, "loss_nan_ranks": 0, "loss_rank_avg": 0.15731394290924072, "step": 2110, "valid_targets_mean": 8485.2, "valid_targets_min": 2609 }, { "epoch": 3.584745762711864, "grad_norm": 0.374346290872505, "learning_rate": 2.2654510545674442e-05, "loss": 0.2772, "loss_nan_ranks": 0, "loss_rank_avg": 0.1397765576839447, "step": 2115, "valid_targets_mean": 8244.4, "valid_targets_min": 3700 }, { "epoch": 3.593220338983051, "grad_norm": 0.39875361896903927, "learning_rate": 2.257071527434753e-05, "loss": 0.2967, "loss_nan_ranks": 0, "loss_rank_avg": 0.14811114966869354, "step": 2120, "valid_targets_mean": 7846.0, "valid_targets_min": 3187 }, { "epoch": 3.601694915254237, "grad_norm": 0.39347828360733145, "learning_rate": 2.2486874092949708e-05, "loss": 0.2814, "loss_nan_ranks": 0, "loss_rank_avg": 0.12575045228004456, "step": 2125, "valid_targets_mean": 8018.4, "valid_targets_min": 3985 }, { "epoch": 3.610169491525424, "grad_norm": 0.4164173242177716, "learning_rate": 2.2402988498789767e-05, "loss": 0.2911, "loss_nan_ranks": 0, "loss_rank_avg": 0.10205131769180298, "step": 2130, "valid_targets_mean": 7143.9, "valid_targets_min": 2676 }, { "epoch": 3.6186440677966103, "grad_norm": 0.4125444447963192, "learning_rate": 2.2319059989969668e-05, "loss": 0.2925, "loss_nan_ranks": 0, "loss_rank_avg": 0.16392400860786438, "step": 2135, "valid_targets_mean": 7902.1, "valid_targets_min": 3675 }, { "epoch": 3.6271186440677967, "grad_norm": 0.40524649599732243, "learning_rate": 2.2235090065357773e-05, "loss": 0.2945, "loss_nan_ranks": 0, "loss_rank_avg": 0.18411213159561157, "step": 2140, "valid_targets_mean": 8892.9, "valid_targets_min": 4234 }, { "epoch": 3.635593220338983, "grad_norm": 0.4088874114510119, "learning_rate": 2.215108022456208e-05, "loss": 0.3024, "loss_nan_ranks": 0, "loss_rank_avg": 0.14849057793617249, "step": 2145, "valid_targets_mean": 8279.2, "valid_targets_min": 4495 }, { "epoch": 3.6440677966101696, "grad_norm": 0.4831151083725686, "learning_rate": 2.2067031967903443e-05, "loss": 0.2542, "loss_nan_ranks": 0, "loss_rank_avg": 0.13207237422466278, "step": 2150, "valid_targets_mean": 9388.2, "valid_targets_min": 4290 }, { "epoch": 3.652542372881356, "grad_norm": 0.3733280663746573, "learning_rate": 2.1982946796388788e-05, "loss": 0.3061, "loss_nan_ranks": 0, "loss_rank_avg": 0.17002075910568237, "step": 2155, "valid_targets_mean": 11468.6, "valid_targets_min": 4610 }, { "epoch": 3.6610169491525424, "grad_norm": 0.4173341617806821, "learning_rate": 2.1898826211684297e-05, "loss": 0.2735, "loss_nan_ranks": 0, "loss_rank_avg": 0.1557663381099701, "step": 2160, "valid_targets_mean": 8174.9, "valid_targets_min": 3753 }, { "epoch": 3.669491525423729, "grad_norm": 0.4186670500997302, "learning_rate": 2.1814671716088593e-05, "loss": 0.3066, "loss_nan_ranks": 0, "loss_rank_avg": 0.08113788068294525, "step": 2165, "valid_targets_mean": 6345.8, "valid_targets_min": 2595 }, { "epoch": 3.6779661016949152, "grad_norm": 0.4101685556228967, "learning_rate": 2.17304848125059e-05, "loss": 0.2923, "loss_nan_ranks": 0, "loss_rank_avg": 0.16531658172607422, "step": 2170, "valid_targets_mean": 8883.8, "valid_targets_min": 4246 }, { "epoch": 3.6864406779661016, "grad_norm": 0.41763151825852196, "learning_rate": 2.1646267004419218e-05, "loss": 0.2746, "loss_nan_ranks": 0, "loss_rank_avg": 0.1397768259048462, "step": 2175, "valid_targets_mean": 7207.2, "valid_targets_min": 2605 }, { "epoch": 3.694915254237288, "grad_norm": 0.440242674224947, "learning_rate": 2.1562019795863463e-05, "loss": 0.2954, "loss_nan_ranks": 0, "loss_rank_avg": 0.22693797945976257, "step": 2180, "valid_targets_mean": 9268.8, "valid_targets_min": 4187 }, { "epoch": 3.7033898305084745, "grad_norm": 0.44197333796797894, "learning_rate": 2.147774469139863e-05, "loss": 0.2516, "loss_nan_ranks": 0, "loss_rank_avg": 0.10422711074352264, "step": 2185, "valid_targets_mean": 6519.4, "valid_targets_min": 3589 }, { "epoch": 3.711864406779661, "grad_norm": 0.40539121412831586, "learning_rate": 2.1393443196082867e-05, "loss": 0.283, "loss_nan_ranks": 0, "loss_rank_avg": 0.2202359437942505, "step": 2190, "valid_targets_mean": 11366.1, "valid_targets_min": 4141 }, { "epoch": 3.7203389830508473, "grad_norm": 0.430547381803079, "learning_rate": 2.1309116815445665e-05, "loss": 0.2757, "loss_nan_ranks": 0, "loss_rank_avg": 0.09388360381126404, "step": 2195, "valid_targets_mean": 5664.4, "valid_targets_min": 3034 }, { "epoch": 3.7288135593220337, "grad_norm": 0.42608356334048153, "learning_rate": 2.1224767055460922e-05, "loss": 0.2968, "loss_nan_ranks": 0, "loss_rank_avg": 0.10148052871227264, "step": 2200, "valid_targets_mean": 6436.9, "valid_targets_min": 3169 }, { "epoch": 3.7372881355932206, "grad_norm": 0.4210448690634892, "learning_rate": 2.114039542252008e-05, "loss": 0.2988, "loss_nan_ranks": 0, "loss_rank_avg": 0.1500019133090973, "step": 2205, "valid_targets_mean": 7466.1, "valid_targets_min": 3197 }, { "epoch": 3.7457627118644066, "grad_norm": 0.8119317714900413, "learning_rate": 2.1056003423405178e-05, "loss": 0.3019, "loss_nan_ranks": 0, "loss_rank_avg": 0.22710689902305603, "step": 2210, "valid_targets_mean": 8778.1, "valid_targets_min": 2972 }, { "epoch": 3.7542372881355934, "grad_norm": 0.4821378308753357, "learning_rate": 2.0971592565262005e-05, "loss": 0.2924, "loss_nan_ranks": 0, "loss_rank_avg": 0.19904181361198425, "step": 2215, "valid_targets_mean": 10680.4, "valid_targets_min": 6006 }, { "epoch": 3.7627118644067794, "grad_norm": 0.4372433360996204, "learning_rate": 2.088716435557313e-05, "loss": 0.2795, "loss_nan_ranks": 0, "loss_rank_avg": 0.10062790662050247, "step": 2220, "valid_targets_mean": 7107.2, "valid_targets_min": 3544 }, { "epoch": 3.7711864406779663, "grad_norm": 0.37024338787318023, "learning_rate": 2.0802720302131016e-05, "loss": 0.3064, "loss_nan_ranks": 0, "loss_rank_avg": 0.1332758069038391, "step": 2225, "valid_targets_mean": 8794.9, "valid_targets_min": 1389 }, { "epoch": 3.7796610169491527, "grad_norm": 0.41076254617672314, "learning_rate": 2.0718261913011055e-05, "loss": 0.2873, "loss_nan_ranks": 0, "loss_rank_avg": 0.15456616878509521, "step": 2230, "valid_targets_mean": 7351.8, "valid_targets_min": 3400 }, { "epoch": 3.788135593220339, "grad_norm": 0.42262471917169897, "learning_rate": 2.063379069654468e-05, "loss": 0.2419, "loss_nan_ranks": 0, "loss_rank_avg": 0.09343097358942032, "step": 2235, "valid_targets_mean": 5882.2, "valid_targets_min": 1584 }, { "epoch": 3.7966101694915255, "grad_norm": 0.4069130983703195, "learning_rate": 2.0549308161292405e-05, "loss": 0.3008, "loss_nan_ranks": 0, "loss_rank_avg": 0.1469895988702774, "step": 2240, "valid_targets_mean": 7706.8, "valid_targets_min": 2311 }, { "epoch": 3.805084745762712, "grad_norm": 0.4321629041786689, "learning_rate": 2.0464815816016866e-05, "loss": 0.2685, "loss_nan_ranks": 0, "loss_rank_avg": 0.11798998713493347, "step": 2245, "valid_targets_mean": 6210.6, "valid_targets_min": 3443 }, { "epoch": 3.8135593220338984, "grad_norm": 0.3846555018208555, "learning_rate": 2.0380315169655905e-05, "loss": 0.3082, "loss_nan_ranks": 0, "loss_rank_avg": 0.15529337525367737, "step": 2250, "valid_targets_mean": 8531.0, "valid_targets_min": 3768 }, { "epoch": 3.8220338983050848, "grad_norm": 0.43425368654131496, "learning_rate": 2.0295807731295628e-05, "loss": 0.2841, "loss_nan_ranks": 0, "loss_rank_avg": 0.16532611846923828, "step": 2255, "valid_targets_mean": 10186.9, "valid_targets_min": 5887 }, { "epoch": 3.830508474576271, "grad_norm": 0.4060353944725796, "learning_rate": 2.021129501014342e-05, "loss": 0.2618, "loss_nan_ranks": 0, "loss_rank_avg": 0.20302706956863403, "step": 2260, "valid_targets_mean": 9178.1, "valid_targets_min": 3145 }, { "epoch": 3.8389830508474576, "grad_norm": 0.4419753942797279, "learning_rate": 2.0126778515501e-05, "loss": 0.2847, "loss_nan_ranks": 0, "loss_rank_avg": 0.1332482248544693, "step": 2265, "valid_targets_mean": 6810.1, "valid_targets_min": 2611 }, { "epoch": 3.847457627118644, "grad_norm": 0.3860661265841699, "learning_rate": 2.0042259756737508e-05, "loss": 0.3056, "loss_nan_ranks": 0, "loss_rank_avg": 0.12230737507343292, "step": 2270, "valid_targets_mean": 7196.2, "valid_targets_min": 2703 }, { "epoch": 3.8559322033898304, "grad_norm": 0.4232795474780064, "learning_rate": 1.99577402432625e-05, "loss": 0.2909, "loss_nan_ranks": 0, "loss_rank_avg": 0.14375734329223633, "step": 2275, "valid_targets_mean": 7267.1, "valid_targets_min": 3181 }, { "epoch": 3.864406779661017, "grad_norm": 0.4224770166929963, "learning_rate": 1.9873221484499006e-05, "loss": 0.2665, "loss_nan_ranks": 0, "loss_rank_avg": 0.17108933627605438, "step": 2280, "valid_targets_mean": 8647.1, "valid_targets_min": 2676 }, { "epoch": 3.8728813559322033, "grad_norm": 0.38764218963486163, "learning_rate": 1.978870498985659e-05, "loss": 0.2931, "loss_nan_ranks": 0, "loss_rank_avg": 0.1058858335018158, "step": 2285, "valid_targets_mean": 6942.6, "valid_targets_min": 2277 }, { "epoch": 3.8813559322033897, "grad_norm": 0.4395517223806546, "learning_rate": 1.9704192268704372e-05, "loss": 0.2693, "loss_nan_ranks": 0, "loss_rank_avg": 0.10128942131996155, "step": 2290, "valid_targets_mean": 5997.0, "valid_targets_min": 1707 }, { "epoch": 3.889830508474576, "grad_norm": 0.37259316195160275, "learning_rate": 1.96196848303441e-05, "loss": 0.2855, "loss_nan_ranks": 0, "loss_rank_avg": 0.18444445729255676, "step": 2295, "valid_targets_mean": 9367.5, "valid_targets_min": 4451 }, { "epoch": 3.898305084745763, "grad_norm": 0.44009690363461895, "learning_rate": 1.953518418398314e-05, "loss": 0.2737, "loss_nan_ranks": 0, "loss_rank_avg": 0.14901164174079895, "step": 2300, "valid_targets_mean": 6996.6, "valid_targets_min": 2612 }, { "epoch": 3.906779661016949, "grad_norm": 0.4064339811743784, "learning_rate": 1.94506918387076e-05, "loss": 0.2818, "loss_nan_ranks": 0, "loss_rank_avg": 0.15096023678779602, "step": 2305, "valid_targets_mean": 8826.8, "valid_targets_min": 3590 }, { "epoch": 3.915254237288136, "grad_norm": 0.4395725069154411, "learning_rate": 1.9366209303455322e-05, "loss": 0.2886, "loss_nan_ranks": 0, "loss_rank_avg": 0.14768223464488983, "step": 2310, "valid_targets_mean": 8623.0, "valid_targets_min": 5117 }, { "epoch": 3.923728813559322, "grad_norm": 0.3938918935844931, "learning_rate": 1.928173808698895e-05, "loss": 0.2872, "loss_nan_ranks": 0, "loss_rank_avg": 0.08866434544324875, "step": 2315, "valid_targets_mean": 6831.0, "valid_targets_min": 4091 }, { "epoch": 3.9322033898305087, "grad_norm": 0.38259904582950616, "learning_rate": 1.919727969786899e-05, "loss": 0.283, "loss_nan_ranks": 0, "loss_rank_avg": 0.14592121541500092, "step": 2320, "valid_targets_mean": 8793.0, "valid_targets_min": 2865 }, { "epoch": 3.940677966101695, "grad_norm": 0.3874042376620344, "learning_rate": 1.911283564442687e-05, "loss": 0.2718, "loss_nan_ranks": 0, "loss_rank_avg": 0.15052124857902527, "step": 2325, "valid_targets_mean": 8260.5, "valid_targets_min": 2791 }, { "epoch": 3.9491525423728815, "grad_norm": 0.48083269380960864, "learning_rate": 1.9028407434737998e-05, "loss": 0.2774, "loss_nan_ranks": 0, "loss_rank_avg": 0.15742509067058563, "step": 2330, "valid_targets_mean": 6578.2, "valid_targets_min": 712 }, { "epoch": 3.957627118644068, "grad_norm": 0.3922858402598884, "learning_rate": 1.894399657659483e-05, "loss": 0.2829, "loss_nan_ranks": 0, "loss_rank_avg": 0.1299702376127243, "step": 2335, "valid_targets_mean": 8018.9, "valid_targets_min": 4466 }, { "epoch": 3.9661016949152543, "grad_norm": 0.4193645141156418, "learning_rate": 1.8859604577479927e-05, "loss": 0.2677, "loss_nan_ranks": 0, "loss_rank_avg": 0.1529259979724884, "step": 2340, "valid_targets_mean": 7416.6, "valid_targets_min": 2801 }, { "epoch": 3.9745762711864407, "grad_norm": 0.4485830985098884, "learning_rate": 1.877523294453908e-05, "loss": 0.2741, "loss_nan_ranks": 0, "loss_rank_avg": 0.11698532849550247, "step": 2345, "valid_targets_mean": 5913.9, "valid_targets_min": 2271 }, { "epoch": 3.983050847457627, "grad_norm": 0.39041637106352106, "learning_rate": 1.869088318455434e-05, "loss": 0.2821, "loss_nan_ranks": 0, "loss_rank_avg": 0.12944526970386505, "step": 2350, "valid_targets_mean": 7937.2, "valid_targets_min": 4038 }, { "epoch": 3.9915254237288136, "grad_norm": 0.4206277849161821, "learning_rate": 1.8606556803917136e-05, "loss": 0.233, "loss_nan_ranks": 0, "loss_rank_avg": 0.12252271175384521, "step": 2355, "valid_targets_mean": 7135.5, "valid_targets_min": 2557 }, { "epoch": 4.0, "grad_norm": 0.42395282370877047, "learning_rate": 1.8522255308601378e-05, "loss": 0.2707, "loss_nan_ranks": 0, "loss_rank_avg": 0.14860565960407257, "step": 2360, "valid_targets_mean": 6954.8, "valid_targets_min": 1915 }, { "epoch": 4.008474576271187, "grad_norm": 0.4394981579743167, "learning_rate": 1.8437980204136537e-05, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.1371266394853592, "step": 2365, "valid_targets_mean": 6881.1, "valid_targets_min": 3617 }, { "epoch": 4.016949152542373, "grad_norm": 0.39865371969450675, "learning_rate": 1.8353732995580786e-05, "loss": 0.2458, "loss_nan_ranks": 0, "loss_rank_avg": 0.1319272816181183, "step": 2370, "valid_targets_mean": 7666.8, "valid_targets_min": 3523 }, { "epoch": 4.02542372881356, "grad_norm": 0.4335576658492927, "learning_rate": 1.826951518749411e-05, "loss": 0.279, "loss_nan_ranks": 0, "loss_rank_avg": 0.15865981578826904, "step": 2375, "valid_targets_mean": 9701.0, "valid_targets_min": 4588 }, { "epoch": 4.033898305084746, "grad_norm": 0.37429007480712123, "learning_rate": 1.8185328283911417e-05, "loss": 0.2631, "loss_nan_ranks": 0, "loss_rank_avg": 0.11880265921354294, "step": 2380, "valid_targets_mean": 8349.1, "valid_targets_min": 3445 }, { "epoch": 4.0423728813559325, "grad_norm": 0.4653775490052777, "learning_rate": 1.8101173788315707e-05, "loss": 0.2996, "loss_nan_ranks": 0, "loss_rank_avg": 0.17142072319984436, "step": 2385, "valid_targets_mean": 8055.1, "valid_targets_min": 2989 }, { "epoch": 4.0508474576271185, "grad_norm": 0.38759263121062476, "learning_rate": 1.8017053203611215e-05, "loss": 0.2565, "loss_nan_ranks": 0, "loss_rank_avg": 0.13516907393932343, "step": 2390, "valid_targets_mean": 8046.6, "valid_targets_min": 3542 }, { "epoch": 4.059322033898305, "grad_norm": 0.40174040501426045, "learning_rate": 1.7932968032096564e-05, "loss": 0.2761, "loss_nan_ranks": 0, "loss_rank_avg": 0.07665864378213882, "step": 2395, "valid_targets_mean": 5400.4, "valid_targets_min": 2670 }, { "epoch": 4.067796610169491, "grad_norm": 0.40431475588899, "learning_rate": 1.7848919775437924e-05, "loss": 0.2665, "loss_nan_ranks": 0, "loss_rank_avg": 0.11547114700078964, "step": 2400, "valid_targets_mean": 7075.5, "valid_targets_min": 2911 }, { "epoch": 4.076271186440678, "grad_norm": 0.41851164508496586, "learning_rate": 1.776490993464223e-05, "loss": 0.2873, "loss_nan_ranks": 0, "loss_rank_avg": 0.13930678367614746, "step": 2405, "valid_targets_mean": 8866.9, "valid_targets_min": 4799 }, { "epoch": 4.084745762711864, "grad_norm": 0.42772766629398995, "learning_rate": 1.768094001003033e-05, "loss": 0.2575, "loss_nan_ranks": 0, "loss_rank_avg": 0.12916797399520874, "step": 2410, "valid_targets_mean": 7858.2, "valid_targets_min": 4104 }, { "epoch": 4.093220338983051, "grad_norm": 0.42053509359988245, "learning_rate": 1.759701150121024e-05, "loss": 0.2457, "loss_nan_ranks": 0, "loss_rank_avg": 0.12978839874267578, "step": 2415, "valid_targets_mean": 7875.4, "valid_targets_min": 2319 }, { "epoch": 4.101694915254237, "grad_norm": 0.5009497034489835, "learning_rate": 1.7513125907050302e-05, "loss": 0.2897, "loss_nan_ranks": 0, "loss_rank_avg": 0.22473761439323425, "step": 2420, "valid_targets_mean": 6372.8, "valid_targets_min": 2271 }, { "epoch": 4.110169491525424, "grad_norm": 0.43870007930354155, "learning_rate": 1.742928472565248e-05, "loss": 0.27, "loss_nan_ranks": 0, "loss_rank_avg": 0.09245385229587555, "step": 2425, "valid_targets_mean": 5360.8, "valid_targets_min": 2382 }, { "epoch": 4.11864406779661, "grad_norm": 0.44775043625125593, "learning_rate": 1.7345489454325564e-05, "loss": 0.2703, "loss_nan_ranks": 0, "loss_rank_avg": 0.0709337666630745, "step": 2430, "valid_targets_mean": 5598.9, "valid_targets_min": 2645 }, { "epoch": 4.127118644067797, "grad_norm": 0.39217639662993736, "learning_rate": 1.7261741589558448e-05, "loss": 0.288, "loss_nan_ranks": 0, "loss_rank_avg": 0.0978158563375473, "step": 2435, "valid_targets_mean": 7005.9, "valid_targets_min": 3151 }, { "epoch": 4.135593220338983, "grad_norm": 0.4552504409470467, "learning_rate": 1.717804262699339e-05, "loss": 0.2712, "loss_nan_ranks": 0, "loss_rank_avg": 0.1586516797542572, "step": 2440, "valid_targets_mean": 8164.1, "valid_targets_min": 4684 }, { "epoch": 4.1440677966101696, "grad_norm": 0.6110641883530884, "learning_rate": 1.7094394061399318e-05, "loss": 0.2571, "loss_nan_ranks": 0, "loss_rank_avg": 0.11182674765586853, "step": 2445, "valid_targets_mean": 6517.5, "valid_targets_min": 3535 }, { "epoch": 4.1525423728813555, "grad_norm": 0.4189713731531144, "learning_rate": 1.701079738664512e-05, "loss": 0.2609, "loss_nan_ranks": 0, "loss_rank_avg": 0.1106354147195816, "step": 2450, "valid_targets_mean": 7306.5, "valid_targets_min": 2984 }, { "epoch": 4.161016949152542, "grad_norm": 0.4353514390157063, "learning_rate": 1.6927254095672992e-05, "loss": 0.2641, "loss_nan_ranks": 0, "loss_rank_avg": 0.10617899894714355, "step": 2455, "valid_targets_mean": 5812.9, "valid_targets_min": 2453 }, { "epoch": 4.169491525423728, "grad_norm": 0.4219809852768852, "learning_rate": 1.6843765680471715e-05, "loss": 0.2742, "loss_nan_ranks": 0, "loss_rank_avg": 0.11135134100914001, "step": 2460, "valid_targets_mean": 7021.0, "valid_targets_min": 3043 }, { "epoch": 4.177966101694915, "grad_norm": 0.5654406681363515, "learning_rate": 1.6760333632050086e-05, "loss": 0.2835, "loss_nan_ranks": 0, "loss_rank_avg": 0.11446435004472733, "step": 2465, "valid_targets_mean": 6612.6, "valid_targets_min": 3022 }, { "epoch": 4.186440677966102, "grad_norm": 0.47653784967954316, "learning_rate": 1.667695944041025e-05, "loss": 0.2723, "loss_nan_ranks": 0, "loss_rank_avg": 0.11347555369138718, "step": 2470, "valid_targets_mean": 7101.2, "valid_targets_min": 2948 }, { "epoch": 4.194915254237288, "grad_norm": 0.4662821933614443, "learning_rate": 1.6593644594521082e-05, "loss": 0.2996, "loss_nan_ranks": 0, "loss_rank_avg": 0.13076099753379822, "step": 2475, "valid_targets_mean": 7465.9, "valid_targets_min": 2341 }, { "epoch": 4.203389830508475, "grad_norm": 0.4080427666049444, "learning_rate": 1.6510390582291624e-05, "loss": 0.2611, "loss_nan_ranks": 0, "loss_rank_avg": 0.18516531586647034, "step": 2480, "valid_targets_mean": 9916.2, "valid_targets_min": 5024 }, { "epoch": 4.211864406779661, "grad_norm": 0.42008095154266495, "learning_rate": 1.6427198890544483e-05, "loss": 0.2685, "loss_nan_ranks": 0, "loss_rank_avg": 0.14330461621284485, "step": 2485, "valid_targets_mean": 8390.0, "valid_targets_min": 2523 }, { "epoch": 4.220338983050848, "grad_norm": 0.41276959099838073, "learning_rate": 1.634407100498931e-05, "loss": 0.264, "loss_nan_ranks": 0, "loss_rank_avg": 0.11455489695072174, "step": 2490, "valid_targets_mean": 7962.2, "valid_targets_min": 4119 }, { "epoch": 4.228813559322034, "grad_norm": 0.43611233307799147, "learning_rate": 1.626100841019623e-05, "loss": 0.2634, "loss_nan_ranks": 0, "loss_rank_avg": 0.11222334951162338, "step": 2495, "valid_targets_mean": 6606.1, "valid_targets_min": 3702 }, { "epoch": 4.237288135593221, "grad_norm": 0.5784961476511713, "learning_rate": 1.6178012589569358e-05, "loss": 0.2881, "loss_nan_ranks": 0, "loss_rank_avg": 0.20426484942436218, "step": 2500, "valid_targets_mean": 9576.0, "valid_targets_min": 4395 }, { "epoch": 4.245762711864407, "grad_norm": 0.41472930754303877, "learning_rate": 1.60950850253203e-05, "loss": 0.2774, "loss_nan_ranks": 0, "loss_rank_avg": 0.18941691517829895, "step": 2505, "valid_targets_mean": 9656.6, "valid_targets_min": 4846 }, { "epoch": 4.254237288135593, "grad_norm": 0.39746772521027784, "learning_rate": 1.601222719844168e-05, "loss": 0.2598, "loss_nan_ranks": 0, "loss_rank_avg": 0.10123373568058014, "step": 2510, "valid_targets_mean": 8234.5, "valid_targets_min": 4070 }, { "epoch": 4.262711864406779, "grad_norm": 0.40487688980861414, "learning_rate": 1.5929440588680688e-05, "loss": 0.239, "loss_nan_ranks": 0, "loss_rank_avg": 0.1368967741727829, "step": 2515, "valid_targets_mean": 9803.1, "valid_targets_min": 3305 }, { "epoch": 4.271186440677966, "grad_norm": 0.38573108303487735, "learning_rate": 1.5846726674512654e-05, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.09613785147666931, "step": 2520, "valid_targets_mean": 7835.9, "valid_targets_min": 3348 }, { "epoch": 4.279661016949152, "grad_norm": 0.43145138808268946, "learning_rate": 1.576408693311466e-05, "loss": 0.2675, "loss_nan_ranks": 0, "loss_rank_avg": 0.18399053812026978, "step": 2525, "valid_targets_mean": 9229.1, "valid_targets_min": 3336 }, { "epoch": 4.288135593220339, "grad_norm": 0.4562660091012742, "learning_rate": 1.5681522840339143e-05, "loss": 0.2722, "loss_nan_ranks": 0, "loss_rank_avg": 0.1121688187122345, "step": 2530, "valid_targets_mean": 6697.4, "valid_targets_min": 1611 }, { "epoch": 4.296610169491525, "grad_norm": 0.5087600350546465, "learning_rate": 1.5599035870687515e-05, "loss": 0.2855, "loss_nan_ranks": 0, "loss_rank_avg": 0.12653526663780212, "step": 2535, "valid_targets_mean": 6205.5, "valid_targets_min": 2504 }, { "epoch": 4.305084745762712, "grad_norm": 0.438881885643239, "learning_rate": 1.5516627497283882e-05, "loss": 0.2753, "loss_nan_ranks": 0, "loss_rank_avg": 0.19421055912971497, "step": 2540, "valid_targets_mean": 9667.5, "valid_targets_min": 2638 }, { "epoch": 4.313559322033898, "grad_norm": 0.45645782507464455, "learning_rate": 1.5434299191848713e-05, "loss": 0.2795, "loss_nan_ranks": 0, "loss_rank_avg": 0.1491662859916687, "step": 2545, "valid_targets_mean": 7809.4, "valid_targets_min": 2630 }, { "epoch": 4.322033898305085, "grad_norm": 0.4353487772661872, "learning_rate": 1.5352052424672535e-05, "loss": 0.2644, "loss_nan_ranks": 0, "loss_rank_avg": 0.13219210505485535, "step": 2550, "valid_targets_mean": 6678.6, "valid_targets_min": 1032 }, { "epoch": 4.330508474576272, "grad_norm": 0.4386593211818938, "learning_rate": 1.5269888664589712e-05, "loss": 0.2586, "loss_nan_ranks": 0, "loss_rank_avg": 0.09329979121685028, "step": 2555, "valid_targets_mean": 6891.2, "valid_targets_min": 3901 }, { "epoch": 4.338983050847458, "grad_norm": 0.45062923880238476, "learning_rate": 1.5187809378952182e-05, "loss": 0.2555, "loss_nan_ranks": 0, "loss_rank_avg": 0.10724156349897385, "step": 2560, "valid_targets_mean": 6354.0, "valid_targets_min": 1847 }, { "epoch": 4.3474576271186445, "grad_norm": 0.4720009798967789, "learning_rate": 1.5105816033603266e-05, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.09511254727840424, "step": 2565, "valid_targets_mean": 6438.9, "valid_targets_min": 3573 }, { "epoch": 4.3559322033898304, "grad_norm": 0.47501420296893465, "learning_rate": 1.5023910092851509e-05, "loss": 0.2692, "loss_nan_ranks": 0, "loss_rank_avg": 0.14761820435523987, "step": 2570, "valid_targets_mean": 7794.8, "valid_targets_min": 4409 }, { "epoch": 4.364406779661017, "grad_norm": 0.46228965195292865, "learning_rate": 1.4942093019444468e-05, "loss": 0.2713, "loss_nan_ranks": 0, "loss_rank_avg": 0.21561656892299652, "step": 2575, "valid_targets_mean": 7940.1, "valid_targets_min": 2271 }, { "epoch": 4.372881355932203, "grad_norm": 0.4310289841712482, "learning_rate": 1.4860366274542663e-05, "loss": 0.2577, "loss_nan_ranks": 0, "loss_rank_avg": 0.15172511339187622, "step": 2580, "valid_targets_mean": 6876.4, "valid_targets_min": 3609 }, { "epoch": 4.38135593220339, "grad_norm": 0.3817393899077175, "learning_rate": 1.4778731317693442e-05, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.1488693356513977, "step": 2585, "valid_targets_mean": 10913.8, "valid_targets_min": 2336 }, { "epoch": 4.389830508474576, "grad_norm": 0.4396698768007295, "learning_rate": 1.4697189606804914e-05, "loss": 0.2492, "loss_nan_ranks": 0, "loss_rank_avg": 0.11185161769390106, "step": 2590, "valid_targets_mean": 7252.6, "valid_targets_min": 4278 }, { "epoch": 4.398305084745763, "grad_norm": 0.4425465024994567, "learning_rate": 1.4615742598119927e-05, "loss": 0.2621, "loss_nan_ranks": 0, "loss_rank_avg": 0.10830656439065933, "step": 2595, "valid_targets_mean": 7119.5, "valid_targets_min": 2530 }, { "epoch": 4.406779661016949, "grad_norm": 0.4071900412191274, "learning_rate": 1.4534391746190056e-05, "loss": 0.2762, "loss_nan_ranks": 0, "loss_rank_avg": 0.10529286414384842, "step": 2600, "valid_targets_mean": 7428.5, "valid_targets_min": 2578 }, { "epoch": 4.415254237288136, "grad_norm": 0.40288822455342677, "learning_rate": 1.4453138503849622e-05, "loss": 0.3073, "loss_nan_ranks": 0, "loss_rank_avg": 0.11631416529417038, "step": 2605, "valid_targets_mean": 7269.8, "valid_targets_min": 3017 }, { "epoch": 4.423728813559322, "grad_norm": 0.42750798117550126, "learning_rate": 1.4371984322189754e-05, "loss": 0.2646, "loss_nan_ranks": 0, "loss_rank_avg": 0.14900711178779602, "step": 2610, "valid_targets_mean": 8732.9, "valid_targets_min": 4282 }, { "epoch": 4.432203389830509, "grad_norm": 0.44095759717826927, "learning_rate": 1.4290930650532448e-05, "loss": 0.2676, "loss_nan_ranks": 0, "loss_rank_avg": 0.1209695041179657, "step": 2615, "valid_targets_mean": 6879.2, "valid_targets_min": 3422 }, { "epoch": 4.440677966101695, "grad_norm": 0.424552739901633, "learning_rate": 1.4209978936404731e-05, "loss": 0.2878, "loss_nan_ranks": 0, "loss_rank_avg": 0.1218380331993103, "step": 2620, "valid_targets_mean": 6677.4, "valid_targets_min": 3274 }, { "epoch": 4.4491525423728815, "grad_norm": 0.39167231606947506, "learning_rate": 1.4129130625512776e-05, "loss": 0.2973, "loss_nan_ranks": 0, "loss_rank_avg": 0.12196886539459229, "step": 2625, "valid_targets_mean": 9059.2, "valid_targets_min": 3095 }, { "epoch": 4.4576271186440675, "grad_norm": 0.3954677586985334, "learning_rate": 1.4048387161716086e-05, "loss": 0.2739, "loss_nan_ranks": 0, "loss_rank_avg": 0.13891199231147766, "step": 2630, "valid_targets_mean": 8787.0, "valid_targets_min": 4182 }, { "epoch": 4.466101694915254, "grad_norm": 0.3922770972346297, "learning_rate": 1.3967749987001717e-05, "loss": 0.2644, "loss_nan_ranks": 0, "loss_rank_avg": 0.15331467986106873, "step": 2635, "valid_targets_mean": 8593.4, "valid_targets_min": 2049 }, { "epoch": 4.47457627118644, "grad_norm": 0.416498484310529, "learning_rate": 1.3887220541458521e-05, "loss": 0.2726, "loss_nan_ranks": 0, "loss_rank_avg": 0.14011646807193756, "step": 2640, "valid_targets_mean": 6794.2, "valid_targets_min": 1697 }, { "epoch": 4.483050847457627, "grad_norm": 0.3977702816938163, "learning_rate": 1.380680026325143e-05, "loss": 0.236, "loss_nan_ranks": 0, "loss_rank_avg": 0.10949341207742691, "step": 2645, "valid_targets_mean": 7184.6, "valid_targets_min": 1466 }, { "epoch": 4.491525423728813, "grad_norm": 0.43575966118057613, "learning_rate": 1.3726490588595776e-05, "loss": 0.267, "loss_nan_ranks": 0, "loss_rank_avg": 0.16025930643081665, "step": 2650, "valid_targets_mean": 8080.8, "valid_targets_min": 4200 }, { "epoch": 4.5, "grad_norm": 0.4929537665321967, "learning_rate": 1.3646292951731615e-05, "loss": 0.2622, "loss_nan_ranks": 0, "loss_rank_avg": 0.12223613262176514, "step": 2655, "valid_targets_mean": 7641.6, "valid_targets_min": 2772 }, { "epoch": 4.508474576271187, "grad_norm": 0.4542816770985378, "learning_rate": 1.3566208784898157e-05, "loss": 0.2684, "loss_nan_ranks": 0, "loss_rank_avg": 0.10347205400466919, "step": 2660, "valid_targets_mean": 7062.9, "valid_targets_min": 3917 }, { "epoch": 4.516949152542373, "grad_norm": 0.6154023708778347, "learning_rate": 1.348623951830816e-05, "loss": 0.2597, "loss_nan_ranks": 0, "loss_rank_avg": 0.12198853492736816, "step": 2665, "valid_targets_mean": 6628.5, "valid_targets_min": 2337 }, { "epoch": 4.52542372881356, "grad_norm": 0.4401656665983104, "learning_rate": 1.3406386580122389e-05, "loss": 0.2879, "loss_nan_ranks": 0, "loss_rank_avg": 0.06955887377262115, "step": 2670, "valid_targets_mean": 4901.9, "valid_targets_min": 2179 }, { "epoch": 4.533898305084746, "grad_norm": 0.407257406794763, "learning_rate": 1.332665139642412e-05, "loss": 0.2733, "loss_nan_ranks": 0, "loss_rank_avg": 0.21901419758796692, "step": 2675, "valid_targets_mean": 10808.1, "valid_targets_min": 3359 }, { "epoch": 4.5423728813559325, "grad_norm": 0.4171993331704572, "learning_rate": 1.3247035391193664e-05, "loss": 0.268, "loss_nan_ranks": 0, "loss_rank_avg": 0.08096012473106384, "step": 2680, "valid_targets_mean": 6991.5, "valid_targets_min": 3342 }, { "epoch": 4.5508474576271185, "grad_norm": 0.4216667198517297, "learning_rate": 1.3167539986282938e-05, "loss": 0.2414, "loss_nan_ranks": 0, "loss_rank_avg": 0.12701958417892456, "step": 2685, "valid_targets_mean": 7187.9, "valid_targets_min": 3835 }, { "epoch": 4.559322033898305, "grad_norm": 0.4007002554100059, "learning_rate": 1.3088166601390087e-05, "loss": 0.2757, "loss_nan_ranks": 0, "loss_rank_avg": 0.13677562773227692, "step": 2690, "valid_targets_mean": 8478.9, "valid_targets_min": 3949 }, { "epoch": 4.567796610169491, "grad_norm": 0.44906505243084627, "learning_rate": 1.3008916654034085e-05, "loss": 0.3112, "loss_nan_ranks": 0, "loss_rank_avg": 0.12453994154930115, "step": 2695, "valid_targets_mean": 6475.2, "valid_targets_min": 2863 }, { "epoch": 4.576271186440678, "grad_norm": 0.4695955316852692, "learning_rate": 1.2929791559529484e-05, "loss": 0.2944, "loss_nan_ranks": 0, "loss_rank_avg": 0.1315167248249054, "step": 2700, "valid_targets_mean": 8320.2, "valid_targets_min": 4323 }, { "epoch": 4.584745762711864, "grad_norm": 0.480923032502113, "learning_rate": 1.2850792730961082e-05, "loss": 0.2867, "loss_nan_ranks": 0, "loss_rank_avg": 0.10258597880601883, "step": 2705, "valid_targets_mean": 6287.9, "valid_targets_min": 2432 }, { "epoch": 4.593220338983051, "grad_norm": 0.4053593691587642, "learning_rate": 1.2771921579158728e-05, "loss": 0.2853, "loss_nan_ranks": 0, "loss_rank_avg": 0.20100140571594238, "step": 2710, "valid_targets_mean": 11134.0, "valid_targets_min": 5394 }, { "epoch": 4.601694915254237, "grad_norm": 0.5133696354264329, "learning_rate": 1.26931795126721e-05, "loss": 0.2653, "loss_nan_ranks": 0, "loss_rank_avg": 0.19328990578651428, "step": 2715, "valid_targets_mean": 8126.9, "valid_targets_min": 2713 }, { "epoch": 4.610169491525424, "grad_norm": 0.40346643930406395, "learning_rate": 1.2614567937745554e-05, "loss": 0.2749, "loss_nan_ranks": 0, "loss_rank_avg": 0.12850111722946167, "step": 2720, "valid_targets_mean": 8410.1, "valid_targets_min": 3309 }, { "epoch": 4.61864406779661, "grad_norm": 0.4112102027826456, "learning_rate": 1.2536088258293018e-05, "loss": 0.2723, "loss_nan_ranks": 0, "loss_rank_avg": 0.11901889741420746, "step": 2725, "valid_targets_mean": 7852.2, "valid_targets_min": 3343 }, { "epoch": 4.627118644067797, "grad_norm": 0.43842191631154037, "learning_rate": 1.2457741875872928e-05, "loss": 0.2652, "loss_nan_ranks": 0, "loss_rank_avg": 0.12838314473628998, "step": 2730, "valid_targets_mean": 8761.0, "valid_targets_min": 3660 }, { "epoch": 4.635593220338983, "grad_norm": 0.4232260475024782, "learning_rate": 1.2379530189663156e-05, "loss": 0.2686, "loss_nan_ranks": 0, "loss_rank_avg": 0.16140376031398773, "step": 2735, "valid_targets_mean": 7674.8, "valid_targets_min": 1973 }, { "epoch": 4.6440677966101696, "grad_norm": 0.4001326172915943, "learning_rate": 1.2301454596436076e-05, "loss": 0.2578, "loss_nan_ranks": 0, "loss_rank_avg": 0.1508510857820511, "step": 2740, "valid_targets_mean": 8669.1, "valid_targets_min": 3636 }, { "epoch": 4.652542372881356, "grad_norm": 0.46641967025775893, "learning_rate": 1.222351649053359e-05, "loss": 0.2457, "loss_nan_ranks": 0, "loss_rank_avg": 0.08667419850826263, "step": 2745, "valid_targets_mean": 6366.4, "valid_targets_min": 2728 }, { "epoch": 4.661016949152542, "grad_norm": 0.41058878739853244, "learning_rate": 1.2145717263842228e-05, "loss": 0.2752, "loss_nan_ranks": 0, "loss_rank_avg": 0.14657464623451233, "step": 2750, "valid_targets_mean": 10316.6, "valid_targets_min": 4889 }, { "epoch": 4.669491525423728, "grad_norm": 0.43047052682197245, "learning_rate": 1.2068058305768298e-05, "loss": 0.2773, "loss_nan_ranks": 0, "loss_rank_avg": 0.17472457885742188, "step": 2755, "valid_targets_mean": 8935.2, "valid_targets_min": 1559 }, { "epoch": 4.677966101694915, "grad_norm": 0.48052761275513234, "learning_rate": 1.1990541003213072e-05, "loss": 0.2782, "loss_nan_ranks": 0, "loss_rank_avg": 0.1159568727016449, "step": 2760, "valid_targets_mean": 5699.4, "valid_targets_min": 1794 }, { "epoch": 4.686440677966102, "grad_norm": 0.42086376935943387, "learning_rate": 1.1913166740547999e-05, "loss": 0.2616, "loss_nan_ranks": 0, "loss_rank_avg": 0.15755105018615723, "step": 2765, "valid_targets_mean": 8291.0, "valid_targets_min": 2110 }, { "epoch": 4.694915254237288, "grad_norm": 0.4261819528196372, "learning_rate": 1.1835936899590017e-05, "loss": 0.2767, "loss_nan_ranks": 0, "loss_rank_avg": 0.12719427049160004, "step": 2770, "valid_targets_mean": 7391.2, "valid_targets_min": 3754 }, { "epoch": 4.703389830508475, "grad_norm": 0.41188015404081924, "learning_rate": 1.1758852859576842e-05, "loss": 0.2791, "loss_nan_ranks": 0, "loss_rank_avg": 0.09580564498901367, "step": 2775, "valid_targets_mean": 6902.0, "valid_targets_min": 4403 }, { "epoch": 4.711864406779661, "grad_norm": 0.42367310030699584, "learning_rate": 1.1681915997142354e-05, "loss": 0.2698, "loss_nan_ranks": 0, "loss_rank_avg": 0.1462278664112091, "step": 2780, "valid_targets_mean": 8892.1, "valid_targets_min": 2956 }, { "epoch": 4.720338983050848, "grad_norm": 0.3983024142470498, "learning_rate": 1.1605127686292009e-05, "loss": 0.2685, "loss_nan_ranks": 0, "loss_rank_avg": 0.18142619729042053, "step": 2785, "valid_targets_mean": 11195.0, "valid_targets_min": 4341 }, { "epoch": 4.728813559322034, "grad_norm": 0.43308748942127245, "learning_rate": 1.15284892983783e-05, "loss": 0.2784, "loss_nan_ranks": 0, "loss_rank_avg": 0.11833596974611282, "step": 2790, "valid_targets_mean": 7267.1, "valid_targets_min": 3360 }, { "epoch": 4.737288135593221, "grad_norm": 0.42170297161536185, "learning_rate": 1.1452002202076256e-05, "loss": 0.289, "loss_nan_ranks": 0, "loss_rank_avg": 0.1312982141971588, "step": 2795, "valid_targets_mean": 8055.4, "valid_targets_min": 2530 }, { "epoch": 4.745762711864407, "grad_norm": 0.3919530604528147, "learning_rate": 1.1375667763359031e-05, "loss": 0.2649, "loss_nan_ranks": 0, "loss_rank_avg": 0.14995722472667694, "step": 2800, "valid_targets_mean": 8652.5, "valid_targets_min": 3923 }, { "epoch": 4.754237288135593, "grad_norm": 0.4210088857440684, "learning_rate": 1.1299487345473457e-05, "loss": 0.2776, "loss_nan_ranks": 0, "loss_rank_avg": 0.10921230912208557, "step": 2805, "valid_targets_mean": 7063.4, "valid_targets_min": 3390 }, { "epoch": 4.762711864406779, "grad_norm": 0.46524547077364725, "learning_rate": 1.1223462308915767e-05, "loss": 0.2773, "loss_nan_ranks": 0, "loss_rank_avg": 0.16076411306858063, "step": 2810, "valid_targets_mean": 7103.1, "valid_targets_min": 2713 }, { "epoch": 4.771186440677966, "grad_norm": 0.3987547098085568, "learning_rate": 1.1147594011407203e-05, "loss": 0.2921, "loss_nan_ranks": 0, "loss_rank_avg": 0.15100906789302826, "step": 2815, "valid_targets_mean": 9900.6, "valid_targets_min": 4761 }, { "epoch": 4.779661016949152, "grad_norm": 0.4867606351030108, "learning_rate": 1.1071883807869886e-05, "loss": 0.2769, "loss_nan_ranks": 0, "loss_rank_avg": 0.1709168553352356, "step": 2820, "valid_targets_mean": 7995.1, "valid_targets_min": 3848 }, { "epoch": 4.788135593220339, "grad_norm": 0.4243770648885672, "learning_rate": 1.0996333050402503e-05, "loss": 0.29, "loss_nan_ranks": 0, "loss_rank_avg": 0.11102272570133209, "step": 2825, "valid_targets_mean": 6283.8, "valid_targets_min": 3432 }, { "epoch": 4.796610169491525, "grad_norm": 0.37807523819250266, "learning_rate": 1.0920943088256266e-05, "loss": 0.2929, "loss_nan_ranks": 0, "loss_rank_avg": 0.17590108513832092, "step": 2830, "valid_targets_mean": 11326.0, "valid_targets_min": 3696 }, { "epoch": 4.805084745762712, "grad_norm": 0.5285744602943411, "learning_rate": 1.0845715267810716e-05, "loss": 0.2683, "loss_nan_ranks": 0, "loss_rank_avg": 0.16316203773021698, "step": 2835, "valid_targets_mean": 6556.4, "valid_targets_min": 1843 }, { "epoch": 4.813559322033898, "grad_norm": 0.409867873854923, "learning_rate": 1.0770650932549768e-05, "loss": 0.2768, "loss_nan_ranks": 0, "loss_rank_avg": 0.16258347034454346, "step": 2840, "valid_targets_mean": 9091.2, "valid_targets_min": 3104 }, { "epoch": 4.822033898305085, "grad_norm": 0.4612130048394203, "learning_rate": 1.0695751423037639e-05, "loss": 0.2593, "loss_nan_ranks": 0, "loss_rank_avg": 0.14501486718654633, "step": 2845, "valid_targets_mean": 9458.6, "valid_targets_min": 5624 }, { "epoch": 4.830508474576272, "grad_norm": 0.4165122048257007, "learning_rate": 1.0621018076894984e-05, "loss": 0.2691, "loss_nan_ranks": 0, "loss_rank_avg": 0.1871585100889206, "step": 2850, "valid_targets_mean": 9650.6, "valid_targets_min": 2319 }, { "epoch": 4.838983050847458, "grad_norm": 0.4447768666450171, "learning_rate": 1.0546452228774919e-05, "loss": 0.2932, "loss_nan_ranks": 0, "loss_rank_avg": 0.2016182541847229, "step": 2855, "valid_targets_mean": 9618.0, "valid_targets_min": 2098 }, { "epoch": 4.847457627118644, "grad_norm": 0.45706910235659043, "learning_rate": 1.047205521033928e-05, "loss": 0.2659, "loss_nan_ranks": 0, "loss_rank_avg": 0.07524390518665314, "step": 2860, "valid_targets_mean": 5177.8, "valid_targets_min": 1795 }, { "epoch": 4.8559322033898304, "grad_norm": 0.4082417794116573, "learning_rate": 1.0397828350234765e-05, "loss": 0.2715, "loss_nan_ranks": 0, "loss_rank_avg": 0.07515836507081985, "step": 2865, "valid_targets_mean": 5618.4, "valid_targets_min": 3548 }, { "epoch": 4.864406779661017, "grad_norm": 0.43699485002864896, "learning_rate": 1.032377297406926e-05, "loss": 0.2669, "loss_nan_ranks": 0, "loss_rank_avg": 0.15624886751174927, "step": 2870, "valid_targets_mean": 8017.9, "valid_targets_min": 3896 }, { "epoch": 4.872881355932203, "grad_norm": 0.4475219215390075, "learning_rate": 1.0249890404388121e-05, "loss": 0.2769, "loss_nan_ranks": 0, "loss_rank_avg": 0.13607046008110046, "step": 2875, "valid_targets_mean": 7762.4, "valid_targets_min": 2731 }, { "epoch": 4.88135593220339, "grad_norm": 0.4010893872939635, "learning_rate": 1.0176181960650595e-05, "loss": 0.2606, "loss_nan_ranks": 0, "loss_rank_avg": 0.2050163745880127, "step": 2880, "valid_targets_mean": 10443.4, "valid_targets_min": 4967 }, { "epoch": 4.889830508474576, "grad_norm": 0.43399489366456434, "learning_rate": 1.0102648959206212e-05, "loss": 0.2465, "loss_nan_ranks": 0, "loss_rank_avg": 0.09470526874065399, "step": 2885, "valid_targets_mean": 6960.6, "valid_targets_min": 1501 }, { "epoch": 4.898305084745763, "grad_norm": 0.409246582546555, "learning_rate": 1.0029292713271334e-05, "loss": 0.265, "loss_nan_ranks": 0, "loss_rank_avg": 0.16161762177944183, "step": 2890, "valid_targets_mean": 7954.8, "valid_targets_min": 3290 }, { "epoch": 4.906779661016949, "grad_norm": 0.43312261146531655, "learning_rate": 9.956114532905625e-06, "loss": 0.3058, "loss_nan_ranks": 0, "loss_rank_avg": 0.12446765601634979, "step": 2895, "valid_targets_mean": 7838.4, "valid_targets_min": 4758 }, { "epoch": 4.915254237288136, "grad_norm": 0.4301864357851658, "learning_rate": 9.883115724988743e-06, "loss": 0.2753, "loss_nan_ranks": 0, "loss_rank_avg": 0.12632432579994202, "step": 2900, "valid_targets_mean": 7188.4, "valid_targets_min": 2425 }, { "epoch": 4.923728813559322, "grad_norm": 0.5636109539825138, "learning_rate": 9.810297593196922e-06, "loss": 0.2839, "loss_nan_ranks": 0, "loss_rank_avg": 0.1164482980966568, "step": 2905, "valid_targets_mean": 7041.4, "valid_targets_min": 1517 }, { "epoch": 4.932203389830509, "grad_norm": 0.41163855796829296, "learning_rate": 9.73766143797976e-06, "loss": 0.2975, "loss_nan_ranks": 0, "loss_rank_avg": 0.18512123823165894, "step": 2910, "valid_targets_mean": 9377.4, "valid_targets_min": 3063 }, { "epoch": 4.940677966101695, "grad_norm": 0.3999145511854064, "learning_rate": 9.665208556536918e-06, "loss": 0.255, "loss_nan_ranks": 0, "loss_rank_avg": 0.15674389898777008, "step": 2915, "valid_targets_mean": 10361.1, "valid_targets_min": 2778 }, { "epoch": 4.9491525423728815, "grad_norm": 0.41681357372277467, "learning_rate": 9.592940242795035e-06, "loss": 0.2692, "loss_nan_ranks": 0, "loss_rank_avg": 0.1276121735572815, "step": 2920, "valid_targets_mean": 7945.4, "valid_targets_min": 4230 }, { "epoch": 4.9576271186440675, "grad_norm": 0.4103109872648721, "learning_rate": 9.520857787384548e-06, "loss": 0.2913, "loss_nan_ranks": 0, "loss_rank_avg": 0.2234308123588562, "step": 2925, "valid_targets_mean": 10142.1, "valid_targets_min": 4081 }, { "epoch": 4.966101694915254, "grad_norm": 0.4773090185998591, "learning_rate": 9.44896247761669e-06, "loss": 0.2859, "loss_nan_ranks": 0, "loss_rank_avg": 0.11663774400949478, "step": 2930, "valid_targets_mean": 7561.9, "valid_targets_min": 2388 }, { "epoch": 4.97457627118644, "grad_norm": 0.4519877157560931, "learning_rate": 9.377255597460469e-06, "loss": 0.2697, "loss_nan_ranks": 0, "loss_rank_avg": 0.14655426144599915, "step": 2935, "valid_targets_mean": 7012.6, "valid_targets_min": 2452 }, { "epoch": 4.983050847457627, "grad_norm": 0.46442379360691927, "learning_rate": 9.305738427519782e-06, "loss": 0.2943, "loss_nan_ranks": 0, "loss_rank_avg": 0.10421495884656906, "step": 2940, "valid_targets_mean": 5663.6, "valid_targets_min": 2072 }, { "epoch": 4.991525423728813, "grad_norm": 0.38014541504707516, "learning_rate": 9.234412245010482e-06, "loss": 0.2418, "loss_nan_ranks": 0, "loss_rank_avg": 0.16515886783599854, "step": 2945, "valid_targets_mean": 9815.4, "valid_targets_min": 2340 }, { "epoch": 5.0, "grad_norm": 0.40418734474649126, "learning_rate": 9.163278323737635e-06, "loss": 0.2861, "loss_nan_ranks": 0, "loss_rank_avg": 0.17972296476364136, "step": 2950, "valid_targets_mean": 9544.8, "valid_targets_min": 3286 }, { "epoch": 5.008474576271187, "grad_norm": 0.38884902460392823, "learning_rate": 9.092337934072703e-06, "loss": 0.27, "loss_nan_ranks": 0, "loss_rank_avg": 0.12223666906356812, "step": 2955, "valid_targets_mean": 8354.1, "valid_targets_min": 3525 }, { "epoch": 5.016949152542373, "grad_norm": 0.4358731046466529, "learning_rate": 9.021592342930928e-06, "loss": 0.2311, "loss_nan_ranks": 0, "loss_rank_avg": 0.10257917642593384, "step": 2960, "valid_targets_mean": 8100.0, "valid_targets_min": 4173 }, { "epoch": 5.02542372881356, "grad_norm": 0.43373781383804855, "learning_rate": 8.951042813748645e-06, "loss": 0.2664, "loss_nan_ranks": 0, "loss_rank_avg": 0.18158259987831116, "step": 2965, "valid_targets_mean": 10387.9, "valid_targets_min": 5211 }, { "epoch": 5.033898305084746, "grad_norm": 0.5249679818676168, "learning_rate": 8.880690606460754e-06, "loss": 0.2915, "loss_nan_ranks": 0, "loss_rank_avg": 0.10569009184837341, "step": 2970, "valid_targets_mean": 6634.9, "valid_targets_min": 2482 }, { "epoch": 5.0423728813559325, "grad_norm": 0.42560397590925436, "learning_rate": 8.8105369774782e-06, "loss": 0.2722, "loss_nan_ranks": 0, "loss_rank_avg": 0.157941997051239, "step": 2975, "valid_targets_mean": 8599.6, "valid_targets_min": 2981 }, { "epoch": 5.0508474576271185, "grad_norm": 0.4355648091689131, "learning_rate": 8.74058317966556e-06, "loss": 0.2488, "loss_nan_ranks": 0, "loss_rank_avg": 0.08466358482837677, "step": 2980, "valid_targets_mean": 5620.9, "valid_targets_min": 3876 }, { "epoch": 5.059322033898305, "grad_norm": 0.4188697143373527, "learning_rate": 8.670830462318633e-06, "loss": 0.2516, "loss_nan_ranks": 0, "loss_rank_avg": 0.06649868935346603, "step": 2985, "valid_targets_mean": 5346.4, "valid_targets_min": 2357 }, { "epoch": 5.067796610169491, "grad_norm": 0.43278797414764, "learning_rate": 8.60128007114217e-06, "loss": 0.2706, "loss_nan_ranks": 0, "loss_rank_avg": 0.1381576806306839, "step": 2990, "valid_targets_mean": 8565.6, "valid_targets_min": 1759 }, { "epoch": 5.076271186440678, "grad_norm": 0.40143576428343275, "learning_rate": 8.531933248227582e-06, "loss": 0.2392, "loss_nan_ranks": 0, "loss_rank_avg": 0.10228410363197327, "step": 2995, "valid_targets_mean": 5543.6, "valid_targets_min": 2229 }, { "epoch": 5.084745762711864, "grad_norm": 0.4286280311865031, "learning_rate": 8.462791232030803e-06, "loss": 0.2759, "loss_nan_ranks": 0, "loss_rank_avg": 0.13835610449314117, "step": 3000, "valid_targets_mean": 8272.5, "valid_targets_min": 4373 }, { "epoch": 5.093220338983051, "grad_norm": 0.41785258691109217, "learning_rate": 8.393855257350132e-06, "loss": 0.2515, "loss_nan_ranks": 0, "loss_rank_avg": 0.11477389186620712, "step": 3005, "valid_targets_mean": 8371.8, "valid_targets_min": 4218 }, { "epoch": 5.101694915254237, "grad_norm": 0.42839185232988447, "learning_rate": 8.325126555304208e-06, "loss": 0.2614, "loss_nan_ranks": 0, "loss_rank_avg": 0.1777895838022232, "step": 3010, "valid_targets_mean": 9394.4, "valid_targets_min": 4110 }, { "epoch": 5.110169491525424, "grad_norm": 0.4337647626076782, "learning_rate": 8.256606353310003e-06, "loss": 0.2472, "loss_nan_ranks": 0, "loss_rank_avg": 0.14281994104385376, "step": 3015, "valid_targets_mean": 9484.0, "valid_targets_min": 3434 }, { "epoch": 5.11864406779661, "grad_norm": 0.4295355742774288, "learning_rate": 8.188295875060943e-06, "loss": 0.2746, "loss_nan_ranks": 0, "loss_rank_avg": 0.0776737704873085, "step": 3020, "valid_targets_mean": 4949.9, "valid_targets_min": 3294 }, { "epoch": 5.127118644067797, "grad_norm": 0.3676364308403277, "learning_rate": 8.12019634050499e-06, "loss": 0.2271, "loss_nan_ranks": 0, "loss_rank_avg": 0.08112052828073502, "step": 3025, "valid_targets_mean": 7908.5, "valid_targets_min": 4680 }, { "epoch": 5.135593220338983, "grad_norm": 0.4454936935125421, "learning_rate": 8.052308965822916e-06, "loss": 0.2468, "loss_nan_ranks": 0, "loss_rank_avg": 0.1395069807767868, "step": 3030, "valid_targets_mean": 7846.9, "valid_targets_min": 4498 }, { "epoch": 5.1440677966101696, "grad_norm": 0.4122037084305391, "learning_rate": 7.984634963406537e-06, "loss": 0.2499, "loss_nan_ranks": 0, "loss_rank_avg": 0.14162138104438782, "step": 3035, "valid_targets_mean": 8179.1, "valid_targets_min": 4548 }, { "epoch": 5.1525423728813555, "grad_norm": 0.463084879888614, "learning_rate": 7.917175541837101e-06, "loss": 0.2842, "loss_nan_ranks": 0, "loss_rank_avg": 0.09783188998699188, "step": 3040, "valid_targets_mean": 5998.4, "valid_targets_min": 2460 }, { "epoch": 5.161016949152542, "grad_norm": 0.4748887059748165, "learning_rate": 7.849931905863672e-06, "loss": 0.2885, "loss_nan_ranks": 0, "loss_rank_avg": 0.12707798182964325, "step": 3045, "valid_targets_mean": 6415.8, "valid_targets_min": 3785 }, { "epoch": 5.169491525423728, "grad_norm": 0.45526749296808317, "learning_rate": 7.78290525638163e-06, "loss": 0.2575, "loss_nan_ranks": 0, "loss_rank_avg": 0.18409213423728943, "step": 3050, "valid_targets_mean": 11028.6, "valid_targets_min": 3734 }, { "epoch": 5.177966101694915, "grad_norm": 0.4462181398544631, "learning_rate": 7.71609679041121e-06, "loss": 0.2503, "loss_nan_ranks": 0, "loss_rank_avg": 0.15138982236385345, "step": 3055, "valid_targets_mean": 7039.2, "valid_targets_min": 3502 }, { "epoch": 5.186440677966102, "grad_norm": 0.3963924524169505, "learning_rate": 7.649507701076164e-06, "loss": 0.2633, "loss_nan_ranks": 0, "loss_rank_avg": 0.17887073755264282, "step": 3060, "valid_targets_mean": 10073.6, "valid_targets_min": 2114 }, { "epoch": 5.194915254237288, "grad_norm": 0.5348841144000112, "learning_rate": 7.583139177582395e-06, "loss": 0.2634, "loss_nan_ranks": 0, "loss_rank_avg": 0.2061377465724945, "step": 3065, "valid_targets_mean": 7855.2, "valid_targets_min": 3111 }, { "epoch": 5.203389830508475, "grad_norm": 0.41577883860215764, "learning_rate": 7.516992405196772e-06, "loss": 0.2662, "loss_nan_ranks": 0, "loss_rank_avg": 0.13540074229240417, "step": 3070, "valid_targets_mean": 8547.1, "valid_targets_min": 4854 }, { "epoch": 5.211864406779661, "grad_norm": 0.4271021340563035, "learning_rate": 7.45106856522593e-06, "loss": 0.2686, "loss_nan_ranks": 0, "loss_rank_avg": 0.10686710476875305, "step": 3075, "valid_targets_mean": 5644.2, "valid_targets_min": 2827 }, { "epoch": 5.220338983050848, "grad_norm": 0.4303321911070651, "learning_rate": 7.385368834995168e-06, "loss": 0.2305, "loss_nan_ranks": 0, "loss_rank_avg": 0.07251991331577301, "step": 3080, "valid_targets_mean": 5377.9, "valid_targets_min": 2896 }, { "epoch": 5.228813559322034, "grad_norm": 0.4414950670458604, "learning_rate": 7.319894387827473e-06, "loss": 0.2513, "loss_nan_ranks": 0, "loss_rank_avg": 0.12613925337791443, "step": 3085, "valid_targets_mean": 7042.0, "valid_targets_min": 3869 }, { "epoch": 5.237288135593221, "grad_norm": 0.42597819657193176, "learning_rate": 7.254646393022502e-06, "loss": 0.2804, "loss_nan_ranks": 0, "loss_rank_avg": 0.1456468105316162, "step": 3090, "valid_targets_mean": 8970.8, "valid_targets_min": 2240 }, { "epoch": 5.245762711864407, "grad_norm": 0.3910096201156548, "learning_rate": 7.189626015835733e-06, "loss": 0.2832, "loss_nan_ranks": 0, "loss_rank_avg": 0.14637431502342224, "step": 3095, "valid_targets_mean": 9771.9, "valid_targets_min": 2504 }, { "epoch": 5.254237288135593, "grad_norm": 0.4720410475372794, "learning_rate": 7.124834417457664e-06, "loss": 0.2499, "loss_nan_ranks": 0, "loss_rank_avg": 0.10337448865175247, "step": 3100, "valid_targets_mean": 6589.2, "valid_targets_min": 2630 }, { "epoch": 5.262711864406779, "grad_norm": 0.4165414378767662, "learning_rate": 7.060272754993051e-06, "loss": 0.2528, "loss_nan_ranks": 0, "loss_rank_avg": 0.10730390250682831, "step": 3105, "valid_targets_mean": 7689.1, "valid_targets_min": 3877 }, { "epoch": 5.271186440677966, "grad_norm": 0.4773925338374391, "learning_rate": 6.9959421814402494e-06, "loss": 0.2686, "loss_nan_ranks": 0, "loss_rank_avg": 0.09607205539941788, "step": 3110, "valid_targets_mean": 6103.0, "valid_targets_min": 2958 }, { "epoch": 5.279661016949152, "grad_norm": 0.405934436370515, "learning_rate": 6.931843845670647e-06, "loss": 0.2782, "loss_nan_ranks": 0, "loss_rank_avg": 0.18584570288658142, "step": 3115, "valid_targets_mean": 11376.5, "valid_targets_min": 6700 }, { "epoch": 5.288135593220339, "grad_norm": 0.40944718673488073, "learning_rate": 6.867978892408101e-06, "loss": 0.2812, "loss_nan_ranks": 0, "loss_rank_avg": 0.06526018679141998, "step": 3120, "valid_targets_mean": 5554.6, "valid_targets_min": 1909 }, { "epoch": 5.296610169491525, "grad_norm": 0.3969787353916221, "learning_rate": 6.804348462208548e-06, "loss": 0.251, "loss_nan_ranks": 0, "loss_rank_avg": 0.14641955494880676, "step": 3125, "valid_targets_mean": 10160.4, "valid_targets_min": 4904 }, { "epoch": 5.305084745762712, "grad_norm": 0.40381438825051413, "learning_rate": 6.7409536914395866e-06, "loss": 0.255, "loss_nan_ranks": 0, "loss_rank_avg": 0.12536650896072388, "step": 3130, "valid_targets_mean": 8634.0, "valid_targets_min": 6440 }, { "epoch": 5.313559322033898, "grad_norm": 0.4407810032396024, "learning_rate": 6.677795712260206e-06, "loss": 0.2689, "loss_nan_ranks": 0, "loss_rank_avg": 0.10065967589616776, "step": 3135, "valid_targets_mean": 6554.6, "valid_targets_min": 3413 }, { "epoch": 5.322033898305085, "grad_norm": 0.43225307653715944, "learning_rate": 6.6148756526005855e-06, "loss": 0.2621, "loss_nan_ranks": 0, "loss_rank_avg": 0.17093005776405334, "step": 3140, "valid_targets_mean": 7674.1, "valid_targets_min": 2705 }, { "epoch": 5.330508474576272, "grad_norm": 0.42168841714997635, "learning_rate": 6.552194636141909e-06, "loss": 0.2444, "loss_nan_ranks": 0, "loss_rank_avg": 0.1504831612110138, "step": 3145, "valid_targets_mean": 8807.0, "valid_targets_min": 3609 }, { "epoch": 5.338983050847458, "grad_norm": 0.4721877133160371, "learning_rate": 6.489753782296315e-06, "loss": 0.2603, "loss_nan_ranks": 0, "loss_rank_avg": 0.1312541961669922, "step": 3150, "valid_targets_mean": 6869.5, "valid_targets_min": 2014 }, { "epoch": 5.3474576271186445, "grad_norm": 0.5627993433253363, "learning_rate": 6.427554206186939e-06, "loss": 0.2598, "loss_nan_ranks": 0, "loss_rank_avg": 0.12869901955127716, "step": 3155, "valid_targets_mean": 8781.0, "valid_targets_min": 3073 }, { "epoch": 5.3559322033898304, "grad_norm": 0.5975905344692939, "learning_rate": 6.3655970186279314e-06, "loss": 0.279, "loss_nan_ranks": 0, "loss_rank_avg": 0.15334156155586243, "step": 3160, "valid_targets_mean": 7974.1, "valid_targets_min": 4571 }, { "epoch": 5.364406779661017, "grad_norm": 0.4399240043257231, "learning_rate": 6.30388332610469e-06, "loss": 0.2482, "loss_nan_ranks": 0, "loss_rank_avg": 0.09615137428045273, "step": 3165, "valid_targets_mean": 6191.0, "valid_targets_min": 2960 }, { "epoch": 5.372881355932203, "grad_norm": 0.43555573486472715, "learning_rate": 6.242414230754044e-06, "loss": 0.2651, "loss_nan_ranks": 0, "loss_rank_avg": 0.1269509643316269, "step": 3170, "valid_targets_mean": 7501.0, "valid_targets_min": 2635 }, { "epoch": 5.38135593220339, "grad_norm": 0.4707060650067185, "learning_rate": 6.181190830344601e-06, "loss": 0.2865, "loss_nan_ranks": 0, "loss_rank_avg": 0.14338397979736328, "step": 3175, "valid_targets_mean": 6411.2, "valid_targets_min": 3296 }, { "epoch": 5.389830508474576, "grad_norm": 0.42574272563993854, "learning_rate": 6.120214218257128e-06, "loss": 0.2553, "loss_nan_ranks": 0, "loss_rank_avg": 0.20924800634384155, "step": 3180, "valid_targets_mean": 9852.9, "valid_targets_min": 4562 }, { "epoch": 5.398305084745763, "grad_norm": 0.39823088488510644, "learning_rate": 6.059485483465048e-06, "loss": 0.2489, "loss_nan_ranks": 0, "loss_rank_avg": 0.12313079833984375, "step": 3185, "valid_targets_mean": 7619.0, "valid_targets_min": 3737 }, { "epoch": 5.406779661016949, "grad_norm": 0.9536002287476373, "learning_rate": 5.999005710514956e-06, "loss": 0.2446, "loss_nan_ranks": 0, "loss_rank_avg": 0.09335184842348099, "step": 3190, "valid_targets_mean": 5375.0, "valid_targets_min": 1635 }, { "epoch": 5.415254237288136, "grad_norm": 0.431612528522527, "learning_rate": 5.938775979507287e-06, "loss": 0.2625, "loss_nan_ranks": 0, "loss_rank_avg": 0.13442601263523102, "step": 3195, "valid_targets_mean": 7720.2, "valid_targets_min": 2911 }, { "epoch": 5.423728813559322, "grad_norm": 0.44860126013223406, "learning_rate": 5.878797366076994e-06, "loss": 0.2427, "loss_nan_ranks": 0, "loss_rank_avg": 0.12965793907642365, "step": 3200, "valid_targets_mean": 6444.4, "valid_targets_min": 2340 }, { "epoch": 5.432203389830509, "grad_norm": 0.42018341577045487, "learning_rate": 5.819070941374368e-06, "loss": 0.2481, "loss_nan_ranks": 0, "loss_rank_avg": 0.14158044755458832, "step": 3205, "valid_targets_mean": 8188.9, "valid_targets_min": 3917 }, { "epoch": 5.440677966101695, "grad_norm": 0.48422403137134756, "learning_rate": 5.759597772045882e-06, "loss": 0.2805, "loss_nan_ranks": 0, "loss_rank_avg": 0.1876494586467743, "step": 3210, "valid_targets_mean": 9145.9, "valid_targets_min": 5285 }, { "epoch": 5.4491525423728815, "grad_norm": 0.46211420065830605, "learning_rate": 5.700378920215159e-06, "loss": 0.2735, "loss_nan_ranks": 0, "loss_rank_avg": 0.21201786398887634, "step": 3215, "valid_targets_mean": 7421.4, "valid_targets_min": 2476 }, { "epoch": 5.4576271186440675, "grad_norm": 0.4264912650604428, "learning_rate": 5.641415443463994e-06, "loss": 0.2615, "loss_nan_ranks": 0, "loss_rank_avg": 0.1297842115163803, "step": 3220, "valid_targets_mean": 7719.5, "valid_targets_min": 1584 }, { "epoch": 5.466101694915254, "grad_norm": 0.5482676590741974, "learning_rate": 5.5827083948134876e-06, "loss": 0.2821, "loss_nan_ranks": 0, "loss_rank_avg": 0.11752267181873322, "step": 3225, "valid_targets_mean": 6575.1, "valid_targets_min": 1240 }, { "epoch": 5.47457627118644, "grad_norm": 0.5019414160677941, "learning_rate": 5.524258822705202e-06, "loss": 0.2297, "loss_nan_ranks": 0, "loss_rank_avg": 0.12094447016716003, "step": 3230, "valid_targets_mean": 7180.8, "valid_targets_min": 4446 }, { "epoch": 5.483050847457627, "grad_norm": 0.4037586289857663, "learning_rate": 5.466067770982482e-06, "loss": 0.2937, "loss_nan_ranks": 0, "loss_rank_avg": 0.10668241232633591, "step": 3235, "valid_targets_mean": 6875.6, "valid_targets_min": 2801 }, { "epoch": 5.491525423728813, "grad_norm": 0.4432879666748049, "learning_rate": 5.4081362788717625e-06, "loss": 0.2908, "loss_nan_ranks": 0, "loss_rank_avg": 0.09486261010169983, "step": 3240, "valid_targets_mean": 5720.0, "valid_targets_min": 2827 }, { "epoch": 5.5, "grad_norm": 0.41525930005316086, "learning_rate": 5.350465380964076e-06, "loss": 0.2694, "loss_nan_ranks": 0, "loss_rank_avg": 0.12814128398895264, "step": 3245, "valid_targets_mean": 8286.4, "valid_targets_min": 3278 }, { "epoch": 5.508474576271187, "grad_norm": 0.3967241521552427, "learning_rate": 5.293056107196488e-06, "loss": 0.2819, "loss_nan_ranks": 0, "loss_rank_avg": 0.10649764537811279, "step": 3250, "valid_targets_mean": 9235.5, "valid_targets_min": 3054 }, { "epoch": 5.516949152542373, "grad_norm": 0.4104500751756487, "learning_rate": 5.235909482833797e-06, "loss": 0.2718, "loss_nan_ranks": 0, "loss_rank_avg": 0.07652749121189117, "step": 3255, "valid_targets_mean": 5837.8, "valid_targets_min": 3543 }, { "epoch": 5.52542372881356, "grad_norm": 0.4548802593937043, "learning_rate": 5.179026528450146e-06, "loss": 0.2637, "loss_nan_ranks": 0, "loss_rank_avg": 0.10874311625957489, "step": 3260, "valid_targets_mean": 6713.8, "valid_targets_min": 3128 }, { "epoch": 5.533898305084746, "grad_norm": 0.42626630165063617, "learning_rate": 5.1224082599108584e-06, "loss": 0.2444, "loss_nan_ranks": 0, "loss_rank_avg": 0.11963523179292679, "step": 3265, "valid_targets_mean": 7900.5, "valid_targets_min": 4232 }, { "epoch": 5.5423728813559325, "grad_norm": 0.42226966542492606, "learning_rate": 5.066055688354246e-06, "loss": 0.2764, "loss_nan_ranks": 0, "loss_rank_avg": 0.1330696940422058, "step": 3270, "valid_targets_mean": 7405.2, "valid_targets_min": 3859 }, { "epoch": 5.5508474576271185, "grad_norm": 0.41559115903205107, "learning_rate": 5.0099698201735855e-06, "loss": 0.2615, "loss_nan_ranks": 0, "loss_rank_avg": 0.18021991848945618, "step": 3275, "valid_targets_mean": 9442.4, "valid_targets_min": 2425 }, { "epoch": 5.559322033898305, "grad_norm": 0.4473698575482938, "learning_rate": 4.954151656999122e-06, "loss": 0.2595, "loss_nan_ranks": 0, "loss_rank_avg": 0.18893000483512878, "step": 3280, "valid_targets_mean": 8873.5, "valid_targets_min": 2503 }, { "epoch": 5.567796610169491, "grad_norm": 0.4126655990570961, "learning_rate": 4.898602195680214e-06, "loss": 0.257, "loss_nan_ranks": 0, "loss_rank_avg": 0.17205744981765747, "step": 3285, "valid_targets_mean": 10166.2, "valid_targets_min": 2566 }, { "epoch": 5.576271186440678, "grad_norm": 0.4436803493070262, "learning_rate": 4.843322428267465e-06, "loss": 0.2574, "loss_nan_ranks": 0, "loss_rank_avg": 0.1269497573375702, "step": 3290, "valid_targets_mean": 7204.2, "valid_targets_min": 2145 }, { "epoch": 5.584745762711864, "grad_norm": 0.41757091681380304, "learning_rate": 4.788313341995096e-06, "loss": 0.3007, "loss_nan_ranks": 0, "loss_rank_avg": 0.12728919088840485, "step": 3295, "valid_targets_mean": 7854.6, "valid_targets_min": 3467 }, { "epoch": 5.593220338983051, "grad_norm": 0.4333169695340451, "learning_rate": 4.733575919263238e-06, "loss": 0.2715, "loss_nan_ranks": 0, "loss_rank_avg": 0.197248175740242, "step": 3300, "valid_targets_mean": 9669.5, "valid_targets_min": 2530 }, { "epoch": 5.601694915254237, "grad_norm": 0.4217198882582936, "learning_rate": 4.679111137620442e-06, "loss": 0.2766, "loss_nan_ranks": 0, "loss_rank_avg": 0.0994122177362442, "step": 3305, "valid_targets_mean": 7220.2, "valid_targets_min": 2826 }, { "epoch": 5.610169491525424, "grad_norm": 0.45922876277681324, "learning_rate": 4.624919969746171e-06, "loss": 0.2755, "loss_nan_ranks": 0, "loss_rank_avg": 0.143977552652359, "step": 3310, "valid_targets_mean": 7108.6, "valid_targets_min": 3254 }, { "epoch": 5.61864406779661, "grad_norm": 0.4497468341605269, "learning_rate": 4.571003383433481e-06, "loss": 0.2898, "loss_nan_ranks": 0, "loss_rank_avg": 0.15260854363441467, "step": 3315, "valid_targets_mean": 7907.2, "valid_targets_min": 2748 }, { "epoch": 5.627118644067797, "grad_norm": 0.45353082867834693, "learning_rate": 4.517362341571687e-06, "loss": 0.2759, "loss_nan_ranks": 0, "loss_rank_avg": 0.1295567750930786, "step": 3320, "valid_targets_mean": 7593.5, "valid_targets_min": 2355 }, { "epoch": 5.635593220338983, "grad_norm": 0.4119838194637205, "learning_rate": 4.463997802129221e-06, "loss": 0.3005, "loss_nan_ranks": 0, "loss_rank_avg": 0.1388033777475357, "step": 3325, "valid_targets_mean": 8385.2, "valid_targets_min": 4455 }, { "epoch": 5.6440677966101696, "grad_norm": 0.4140759472855946, "learning_rate": 4.410910718136454e-06, "loss": 0.2646, "loss_nan_ranks": 0, "loss_rank_avg": 0.15042278170585632, "step": 3330, "valid_targets_mean": 9002.2, "valid_targets_min": 2717 }, { "epoch": 5.652542372881356, "grad_norm": 0.4400439343964711, "learning_rate": 4.3581020376687566e-06, "loss": 0.2625, "loss_nan_ranks": 0, "loss_rank_avg": 0.10155346989631653, "step": 3335, "valid_targets_mean": 7740.9, "valid_targets_min": 3495 }, { "epoch": 5.661016949152542, "grad_norm": 0.45980924813766, "learning_rate": 4.305572703829495e-06, "loss": 0.2508, "loss_nan_ranks": 0, "loss_rank_avg": 0.11865295469760895, "step": 3340, "valid_targets_mean": 8350.5, "valid_targets_min": 4097 }, { "epoch": 5.669491525423728, "grad_norm": 0.47385129359550743, "learning_rate": 4.253323654733248e-06, "loss": 0.2662, "loss_nan_ranks": 0, "loss_rank_avg": 0.10272833704948425, "step": 3345, "valid_targets_mean": 6288.5, "valid_targets_min": 2754 }, { "epoch": 5.677966101694915, "grad_norm": 0.42022120557595954, "learning_rate": 4.201355823488999e-06, "loss": 0.2676, "loss_nan_ranks": 0, "loss_rank_avg": 0.14795033633708954, "step": 3350, "valid_targets_mean": 7618.1, "valid_targets_min": 2832 }, { "epoch": 5.686440677966102, "grad_norm": 0.43924218046367447, "learning_rate": 4.149670138183526e-06, "loss": 0.2512, "loss_nan_ranks": 0, "loss_rank_avg": 0.08661969006061554, "step": 3355, "valid_targets_mean": 6429.2, "valid_targets_min": 1434 }, { "epoch": 5.694915254237288, "grad_norm": 0.4633969763685704, "learning_rate": 4.098267521864772e-06, "loss": 0.2385, "loss_nan_ranks": 0, "loss_rank_avg": 0.1861276477575302, "step": 3360, "valid_targets_mean": 9499.4, "valid_targets_min": 2276 }, { "epoch": 5.703389830508475, "grad_norm": 0.45898066026283985, "learning_rate": 4.047148892525403e-06, "loss": 0.229, "loss_nan_ranks": 0, "loss_rank_avg": 0.1299194097518921, "step": 3365, "valid_targets_mean": 6270.8, "valid_targets_min": 2471 }, { "epoch": 5.711864406779661, "grad_norm": 0.43083386950054814, "learning_rate": 3.996315163086391e-06, "loss": 0.2581, "loss_nan_ranks": 0, "loss_rank_avg": 0.15286263823509216, "step": 3370, "valid_targets_mean": 8112.6, "valid_targets_min": 1794 }, { "epoch": 5.720338983050848, "grad_norm": 0.467520944139597, "learning_rate": 3.945767241380732e-06, "loss": 0.2898, "loss_nan_ranks": 0, "loss_rank_avg": 0.18376997113227844, "step": 3375, "valid_targets_mean": 7821.9, "valid_targets_min": 1652 }, { "epoch": 5.728813559322034, "grad_norm": 0.41645203978501605, "learning_rate": 3.895506030137195e-06, "loss": 0.2476, "loss_nan_ranks": 0, "loss_rank_avg": 0.12087373435497284, "step": 3380, "valid_targets_mean": 7218.1, "valid_targets_min": 3939 }, { "epoch": 5.737288135593221, "grad_norm": 0.41823635458160535, "learning_rate": 3.845532426964252e-06, "loss": 0.2501, "loss_nan_ranks": 0, "loss_rank_avg": 0.10257397592067719, "step": 3385, "valid_targets_mean": 6861.1, "valid_targets_min": 3023 }, { "epoch": 5.745762711864407, "grad_norm": 0.43232642787196573, "learning_rate": 3.79584732433399e-06, "loss": 0.2825, "loss_nan_ranks": 0, "loss_rank_avg": 0.12480692565441132, "step": 3390, "valid_targets_mean": 7853.9, "valid_targets_min": 2572 }, { "epoch": 5.754237288135593, "grad_norm": 0.49325336882654114, "learning_rate": 3.746451609566233e-06, "loss": 0.267, "loss_nan_ranks": 0, "loss_rank_avg": 0.24762919545173645, "step": 3395, "valid_targets_mean": 9721.4, "valid_targets_min": 5420 }, { "epoch": 5.762711864406779, "grad_norm": 0.4212695658266242, "learning_rate": 3.697346164812643e-06, "loss": 0.2424, "loss_nan_ranks": 0, "loss_rank_avg": 0.11336623877286911, "step": 3400, "valid_targets_mean": 7380.5, "valid_targets_min": 3715 }, { "epoch": 5.771186440677966, "grad_norm": 0.4588086641728118, "learning_rate": 3.6485318670409896e-06, "loss": 0.2611, "loss_nan_ranks": 0, "loss_rank_avg": 0.10371188074350357, "step": 3405, "valid_targets_mean": 6874.6, "valid_targets_min": 2581 }, { "epoch": 5.779661016949152, "grad_norm": 0.44398724002047824, "learning_rate": 3.6000095880194905e-06, "loss": 0.2979, "loss_nan_ranks": 0, "loss_rank_avg": 0.11031177639961243, "step": 3410, "valid_targets_mean": 7567.9, "valid_targets_min": 4255 }, { "epoch": 5.788135593220339, "grad_norm": 0.42924629006736004, "learning_rate": 3.5517801943012443e-06, "loss": 0.2643, "loss_nan_ranks": 0, "loss_rank_avg": 0.1974351704120636, "step": 3415, "valid_targets_mean": 9567.6, "valid_targets_min": 4475 }, { "epoch": 5.796610169491525, "grad_norm": 0.46016588572316125, "learning_rate": 3.5038445472087324e-06, "loss": 0.2755, "loss_nan_ranks": 0, "loss_rank_avg": 0.13061898946762085, "step": 3420, "valid_targets_mean": 7301.4, "valid_targets_min": 2394 }, { "epoch": 5.805084745762712, "grad_norm": 0.4058426308160901, "learning_rate": 3.456203502818476e-06, "loss": 0.2596, "loss_nan_ranks": 0, "loss_rank_avg": 0.11977847665548325, "step": 3425, "valid_targets_mean": 7847.4, "valid_targets_min": 3901 }, { "epoch": 5.813559322033898, "grad_norm": 0.48970336832788647, "learning_rate": 3.408857911945702e-06, "loss": 0.2906, "loss_nan_ranks": 0, "loss_rank_avg": 0.18240872025489807, "step": 3430, "valid_targets_mean": 9729.4, "valid_targets_min": 2322 }, { "epoch": 5.822033898305085, "grad_norm": 0.39563623240144213, "learning_rate": 3.36180862012919e-06, "loss": 0.265, "loss_nan_ranks": 0, "loss_rank_avg": 0.20780718326568604, "step": 3435, "valid_targets_mean": 11158.8, "valid_targets_min": 3305 }, { "epoch": 5.830508474576272, "grad_norm": 0.49787796279197905, "learning_rate": 3.3150564676161402e-06, "loss": 0.2354, "loss_nan_ranks": 0, "loss_rank_avg": 0.10818520188331604, "step": 3440, "valid_targets_mean": 5966.9, "valid_targets_min": 3336 }, { "epoch": 5.838983050847458, "grad_norm": 0.43084579663109984, "learning_rate": 3.268602289347185e-06, "loss": 0.2569, "loss_nan_ranks": 0, "loss_rank_avg": 0.19690270721912384, "step": 3445, "valid_targets_mean": 11298.9, "valid_targets_min": 7754 }, { "epoch": 5.847457627118644, "grad_norm": 0.4218069624746767, "learning_rate": 3.222446914941468e-06, "loss": 0.2746, "loss_nan_ranks": 0, "loss_rank_avg": 0.17221492528915405, "step": 3450, "valid_targets_mean": 8413.1, "valid_targets_min": 3225 }, { "epoch": 5.8559322033898304, "grad_norm": 0.4671618570113744, "learning_rate": 3.176591168681851e-06, "loss": 0.2577, "loss_nan_ranks": 0, "loss_rank_avg": 0.13562491536140442, "step": 3455, "valid_targets_mean": 7066.1, "valid_targets_min": 2472 }, { "epoch": 5.864406779661017, "grad_norm": 0.4590320225196124, "learning_rate": 3.131035869500152e-06, "loss": 0.2468, "loss_nan_ranks": 0, "loss_rank_avg": 0.09656020998954773, "step": 3460, "valid_targets_mean": 5605.9, "valid_targets_min": 3660 }, { "epoch": 5.872881355932203, "grad_norm": 0.4238092707837205, "learning_rate": 3.085781830962564e-06, "loss": 0.26, "loss_nan_ranks": 0, "loss_rank_avg": 0.11015133559703827, "step": 3465, "valid_targets_mean": 6491.9, "valid_targets_min": 2791 }, { "epoch": 5.88135593220339, "grad_norm": 0.4388528153492548, "learning_rate": 3.0408298612550878e-06, "loss": 0.2349, "loss_nan_ranks": 0, "loss_rank_avg": 0.17622537910938263, "step": 3470, "valid_targets_mean": 8512.5, "valid_targets_min": 2873 }, { "epoch": 5.889830508474576, "grad_norm": 0.4306978345104024, "learning_rate": 2.996180763169132e-06, "loss": 0.2504, "loss_nan_ranks": 0, "loss_rank_avg": 0.09644504636526108, "step": 3475, "valid_targets_mean": 5898.6, "valid_targets_min": 1697 }, { "epoch": 5.898305084745763, "grad_norm": 0.4429192567068347, "learning_rate": 2.95183533408715e-06, "loss": 0.2562, "loss_nan_ranks": 0, "loss_rank_avg": 0.09832319617271423, "step": 3480, "valid_targets_mean": 6330.5, "valid_targets_min": 4248 }, { "epoch": 5.906779661016949, "grad_norm": 0.5042107811710015, "learning_rate": 2.907794365968413e-06, "loss": 0.2604, "loss_nan_ranks": 0, "loss_rank_avg": 0.14449542760849, "step": 3485, "valid_targets_mean": 7709.2, "valid_targets_min": 4466 }, { "epoch": 5.915254237288136, "grad_norm": 0.38111377370566013, "learning_rate": 2.864058645334853e-06, "loss": 0.2441, "loss_nan_ranks": 0, "loss_rank_avg": 0.1592138707637787, "step": 3490, "valid_targets_mean": 9714.1, "valid_targets_min": 4445 }, { "epoch": 5.923728813559322, "grad_norm": 0.4523598810623572, "learning_rate": 2.820628953257052e-06, "loss": 0.2723, "loss_nan_ranks": 0, "loss_rank_avg": 0.11317625641822815, "step": 3495, "valid_targets_mean": 6696.9, "valid_targets_min": 1438 }, { "epoch": 5.932203389830509, "grad_norm": 0.38284023698249975, "learning_rate": 2.7775060653402387e-06, "loss": 0.2726, "loss_nan_ranks": 0, "loss_rank_avg": 0.1514039784669876, "step": 3500, "valid_targets_mean": 9845.6, "valid_targets_min": 4052 }, { "epoch": 5.940677966101695, "grad_norm": 0.4164588979342514, "learning_rate": 2.7346907517104894e-06, "loss": 0.2939, "loss_nan_ranks": 0, "loss_rank_avg": 0.209864541888237, "step": 3505, "valid_targets_mean": 11032.0, "valid_targets_min": 5443 }, { "epoch": 5.9491525423728815, "grad_norm": 0.3835673805693966, "learning_rate": 2.692183777000932e-06, "loss": 0.2667, "loss_nan_ranks": 0, "loss_rank_avg": 0.12400268763303757, "step": 3510, "valid_targets_mean": 9057.1, "valid_targets_min": 2882 }, { "epoch": 5.9576271186440675, "grad_norm": 0.48693557523835473, "learning_rate": 2.64998590033813e-06, "loss": 0.2685, "loss_nan_ranks": 0, "loss_rank_avg": 0.09107373654842377, "step": 3515, "valid_targets_mean": 5536.4, "valid_targets_min": 1342 }, { "epoch": 5.966101694915254, "grad_norm": 0.46983127864689195, "learning_rate": 2.608097875328488e-06, "loss": 0.2467, "loss_nan_ranks": 0, "loss_rank_avg": 0.08910076320171356, "step": 3520, "valid_targets_mean": 4977.9, "valid_targets_min": 1896 }, { "epoch": 5.97457627118644, "grad_norm": 0.45050680482743777, "learning_rate": 2.5665204500448137e-06, "loss": 0.2483, "loss_nan_ranks": 0, "loss_rank_avg": 0.06933078914880753, "step": 3525, "valid_targets_mean": 4338.5, "valid_targets_min": 1973 }, { "epoch": 5.983050847457627, "grad_norm": 0.449771116335777, "learning_rate": 2.525254367012955e-06, "loss": 0.2675, "loss_nan_ranks": 0, "loss_rank_avg": 0.17051050066947937, "step": 3530, "valid_targets_mean": 8545.4, "valid_targets_min": 3602 }, { "epoch": 5.991525423728813, "grad_norm": 0.46300251369792844, "learning_rate": 2.4843003631985486e-06, "loss": 0.2955, "loss_nan_ranks": 0, "loss_rank_avg": 0.07504920661449432, "step": 3535, "valid_targets_mean": 5244.5, "valid_targets_min": 3387 }, { "epoch": 6.0, "grad_norm": 0.4255488380121361, "learning_rate": 2.4436591699938305e-06, "loss": 0.2468, "loss_nan_ranks": 0, "loss_rank_avg": 0.10396578907966614, "step": 3540, "valid_targets_mean": 8307.2, "valid_targets_min": 3542 }, { "epoch": 6.008474576271187, "grad_norm": 0.4079638692535048, "learning_rate": 2.403331513204612e-06, "loss": 0.2447, "loss_nan_ranks": 0, "loss_rank_avg": 0.132585346698761, "step": 3545, "valid_targets_mean": 8225.9, "valid_targets_min": 3132 }, { "epoch": 6.016949152542373, "grad_norm": 0.42095335043120474, "learning_rate": 2.363318113037283e-06, "loss": 0.2426, "loss_nan_ranks": 0, "loss_rank_avg": 0.19237245619297028, "step": 3550, "valid_targets_mean": 8534.2, "valid_targets_min": 2336 }, { "epoch": 6.02542372881356, "grad_norm": 0.4247831459112695, "learning_rate": 2.323619684085976e-06, "loss": 0.2412, "loss_nan_ranks": 0, "loss_rank_avg": 0.10242437571287155, "step": 3555, "valid_targets_mean": 8372.6, "valid_targets_min": 3019 }, { "epoch": 6.033898305084746, "grad_norm": 0.5101711223801056, "learning_rate": 2.2842369353197858e-06, "loss": 0.2399, "loss_nan_ranks": 0, "loss_rank_avg": 0.10061325132846832, "step": 3560, "valid_targets_mean": 6458.5, "valid_targets_min": 3200 }, { "epoch": 6.0423728813559325, "grad_norm": 0.46951651616591455, "learning_rate": 2.2451705700701185e-06, "loss": 0.2441, "loss_nan_ranks": 0, "loss_rank_avg": 0.09043577313423157, "step": 3565, "valid_targets_mean": 6405.8, "valid_targets_min": 1973 }, { "epoch": 6.0508474576271185, "grad_norm": 0.43838570005499733, "learning_rate": 2.2064212860181258e-06, "loss": 0.2347, "loss_nan_ranks": 0, "loss_rank_avg": 0.1115138828754425, "step": 3570, "valid_targets_mean": 6562.5, "valid_targets_min": 2966 }, { "epoch": 6.059322033898305, "grad_norm": 0.4105990788568166, "learning_rate": 2.1679897751822532e-06, "loss": 0.245, "loss_nan_ranks": 0, "loss_rank_avg": 0.14000532031059265, "step": 3575, "valid_targets_mean": 8664.9, "valid_targets_min": 3036 }, { "epoch": 6.067796610169491, "grad_norm": 0.4000234466993258, "learning_rate": 2.1298767239058684e-06, "loss": 0.2781, "loss_nan_ranks": 0, "loss_rank_avg": 0.17599308490753174, "step": 3580, "valid_targets_mean": 10298.4, "valid_targets_min": 3167 }, { "epoch": 6.076271186440678, "grad_norm": 0.4630894417075392, "learning_rate": 2.0920828128450197e-06, "loss": 0.2412, "loss_nan_ranks": 0, "loss_rank_avg": 0.16314397752285004, "step": 3585, "valid_targets_mean": 8534.8, "valid_targets_min": 4293 }, { "epoch": 6.084745762711864, "grad_norm": 0.4227879675646018, "learning_rate": 2.054608716956259e-06, "loss": 0.2497, "loss_nan_ranks": 0, "loss_rank_avg": 0.1060272678732872, "step": 3590, "valid_targets_mean": 7418.1, "valid_targets_min": 1916 }, { "epoch": 6.093220338983051, "grad_norm": 0.4463726939777628, "learning_rate": 2.0174551054846158e-06, "loss": 0.2406, "loss_nan_ranks": 0, "loss_rank_avg": 0.11649863421916962, "step": 3595, "valid_targets_mean": 6681.9, "valid_targets_min": 2538 }, { "epoch": 6.101694915254237, "grad_norm": 0.44505007275052016, "learning_rate": 1.9806226419516195e-06, "loss": 0.2847, "loss_nan_ranks": 0, "loss_rank_avg": 0.10530796647071838, "step": 3600, "valid_targets_mean": 7766.4, "valid_targets_min": 5614 }, { "epoch": 6.110169491525424, "grad_norm": 0.38470113587130134, "learning_rate": 1.94411198414346e-06, "loss": 0.2665, "loss_nan_ranks": 0, "loss_rank_avg": 0.14323177933692932, "step": 3605, "valid_targets_mean": 10445.9, "valid_targets_min": 2694 }, { "epoch": 6.11864406779661, "grad_norm": 0.5125177576701928, "learning_rate": 1.9079237840992416e-06, "loss": 0.2332, "loss_nan_ranks": 0, "loss_rank_avg": 0.09224593639373779, "step": 3610, "valid_targets_mean": 6256.4, "valid_targets_min": 2591 }, { "epoch": 6.127118644067797, "grad_norm": 0.40141614645721524, "learning_rate": 1.8720586880993452e-06, "loss": 0.2753, "loss_nan_ranks": 0, "loss_rank_avg": 0.13916637003421783, "step": 3615, "valid_targets_mean": 8134.5, "valid_targets_min": 1875 }, { "epoch": 6.135593220338983, "grad_norm": 0.4648377214616805, "learning_rate": 1.8365173366538647e-06, "loss": 0.2984, "loss_nan_ranks": 0, "loss_rank_avg": 0.1737988442182541, "step": 3620, "valid_targets_mean": 8593.6, "valid_targets_min": 2950 }, { "epoch": 6.1440677966101696, "grad_norm": 0.3970149435933971, "learning_rate": 1.8013003644911987e-06, "loss": 0.2869, "loss_nan_ranks": 0, "loss_rank_avg": 0.1591392606496811, "step": 3625, "valid_targets_mean": 7797.2, "valid_targets_min": 2927 }, { "epoch": 6.1525423728813555, "grad_norm": 0.4329881802584791, "learning_rate": 1.7664084005466796e-06, "loss": 0.2586, "loss_nan_ranks": 0, "loss_rank_avg": 0.1466069221496582, "step": 3630, "valid_targets_mean": 7398.9, "valid_targets_min": 2493 }, { "epoch": 6.161016949152542, "grad_norm": 0.40044188924352225, "learning_rate": 1.7318420679513725e-06, "loss": 0.2675, "loss_nan_ranks": 0, "loss_rank_avg": 0.09767980873584747, "step": 3635, "valid_targets_mean": 7647.6, "valid_targets_min": 5285 }, { "epoch": 6.169491525423728, "grad_norm": 0.4666515135940152, "learning_rate": 1.6976019840209334e-06, "loss": 0.2487, "loss_nan_ranks": 0, "loss_rank_avg": 0.13460057973861694, "step": 3640, "valid_targets_mean": 6764.6, "valid_targets_min": 3017 }, { "epoch": 6.177966101694915, "grad_norm": 0.4310188952800369, "learning_rate": 1.6636887602445839e-06, "loss": 0.2494, "loss_nan_ranks": 0, "loss_rank_avg": 0.14499178528785706, "step": 3645, "valid_targets_mean": 8610.5, "valid_targets_min": 4089 }, { "epoch": 6.186440677966102, "grad_norm": 0.47475101684614096, "learning_rate": 1.6301030022741837e-06, "loss": 0.265, "loss_nan_ranks": 0, "loss_rank_avg": 0.12736810743808746, "step": 3650, "valid_targets_mean": 6779.5, "valid_targets_min": 2699 }, { "epoch": 6.194915254237288, "grad_norm": 0.5568318024157459, "learning_rate": 1.596845309913444e-06, "loss": 0.2766, "loss_nan_ranks": 0, "loss_rank_avg": 0.13458159565925598, "step": 3655, "valid_targets_mean": 6805.9, "valid_targets_min": 1820 }, { "epoch": 6.203389830508475, "grad_norm": 0.4321942421836466, "learning_rate": 1.5639162771071736e-06, "loss": 0.2582, "loss_nan_ranks": 0, "loss_rank_avg": 0.17277520895004272, "step": 3660, "valid_targets_mean": 8875.1, "valid_targets_min": 3888 }, { "epoch": 6.211864406779661, "grad_norm": 0.4459991928762019, "learning_rate": 1.5313164919307033e-06, "loss": 0.2631, "loss_nan_ranks": 0, "loss_rank_avg": 0.11502149701118469, "step": 3665, "valid_targets_mean": 7180.1, "valid_targets_min": 4359 }, { "epoch": 6.220338983050848, "grad_norm": 0.42250806309461797, "learning_rate": 1.499046536579374e-06, "loss": 0.282, "loss_nan_ranks": 0, "loss_rank_avg": 0.17123055458068848, "step": 3670, "valid_targets_mean": 8993.6, "valid_targets_min": 4613 }, { "epoch": 6.228813559322034, "grad_norm": 0.4108820724486728, "learning_rate": 1.4671069873581312e-06, "loss": 0.2852, "loss_nan_ranks": 0, "loss_rank_avg": 0.15709635615348816, "step": 3675, "valid_targets_mean": 9469.9, "valid_targets_min": 5070 }, { "epoch": 6.237288135593221, "grad_norm": 0.4437412702980212, "learning_rate": 1.4354984146712503e-06, "loss": 0.2632, "loss_nan_ranks": 0, "loss_rank_avg": 0.11063840240240097, "step": 3680, "valid_targets_mean": 6998.9, "valid_targets_min": 2213 }, { "epoch": 6.245762711864407, "grad_norm": 0.4733988446311304, "learning_rate": 1.4042213830121344e-06, "loss": 0.2515, "loss_nan_ranks": 0, "loss_rank_avg": 0.14029532670974731, "step": 3685, "valid_targets_mean": 6649.2, "valid_targets_min": 3248 }, { "epoch": 6.254237288135593, "grad_norm": 0.38655289252851993, "learning_rate": 1.3732764509532316e-06, "loss": 0.2575, "loss_nan_ranks": 0, "loss_rank_avg": 0.13541369140148163, "step": 3690, "valid_targets_mean": 9996.2, "valid_targets_min": 5577 }, { "epoch": 6.262711864406779, "grad_norm": 0.4419355294886104, "learning_rate": 1.3426641711360788e-06, "loss": 0.2543, "loss_nan_ranks": 0, "loss_rank_avg": 0.12257914245128632, "step": 3695, "valid_targets_mean": 7234.6, "valid_targets_min": 3465 }, { "epoch": 6.271186440677966, "grad_norm": 0.4944609384643766, "learning_rate": 1.3123850902614143e-06, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.09550976008176804, "step": 3700, "valid_targets_mean": 5357.8, "valid_targets_min": 2337 }, { "epoch": 6.279661016949152, "grad_norm": 0.458073682292656, "learning_rate": 1.2824397490794115e-06, "loss": 0.2791, "loss_nan_ranks": 0, "loss_rank_avg": 0.12735655903816223, "step": 3705, "valid_targets_mean": 8300.4, "valid_targets_min": 2948 }, { "epoch": 6.288135593220339, "grad_norm": 0.44512304664485036, "learning_rate": 1.2528286823800495e-06, "loss": 0.2496, "loss_nan_ranks": 0, "loss_rank_avg": 0.12010197341442108, "step": 3710, "valid_targets_mean": 6729.8, "valid_targets_min": 2551 }, { "epoch": 6.296610169491525, "grad_norm": 0.4241959010800955, "learning_rate": 1.223552418983518e-06, "loss": 0.2651, "loss_nan_ranks": 0, "loss_rank_avg": 0.1606883406639099, "step": 3715, "valid_targets_mean": 8563.4, "valid_targets_min": 2422 }, { "epoch": 6.305084745762712, "grad_norm": 0.4458826979380267, "learning_rate": 1.1946114817308207e-06, "loss": 0.2453, "loss_nan_ranks": 0, "loss_rank_avg": 0.126150980591774, "step": 3720, "valid_targets_mean": 6960.0, "valid_targets_min": 2437 }, { "epoch": 6.313559322033898, "grad_norm": 0.39768023598211966, "learning_rate": 1.166006387474401e-06, "loss": 0.2429, "loss_nan_ranks": 0, "loss_rank_avg": 0.1836184561252594, "step": 3725, "valid_targets_mean": 10689.0, "valid_targets_min": 3353 }, { "epoch": 6.322033898305085, "grad_norm": 0.4787935493604884, "learning_rate": 1.1377376470689328e-06, "loss": 0.271, "loss_nan_ranks": 0, "loss_rank_avg": 0.12405265867710114, "step": 3730, "valid_targets_mean": 6661.1, "valid_targets_min": 3367 }, { "epoch": 6.330508474576272, "grad_norm": 0.513993676048688, "learning_rate": 1.1098057653621775e-06, "loss": 0.2535, "loss_nan_ranks": 0, "loss_rank_avg": 0.16209466755390167, "step": 3735, "valid_targets_mean": 7460.2, "valid_targets_min": 3795 }, { "epoch": 6.338983050847458, "grad_norm": 0.45485260063869304, "learning_rate": 1.0822112411860042e-06, "loss": 0.2653, "loss_nan_ranks": 0, "loss_rank_avg": 0.0905480831861496, "step": 3740, "valid_targets_mean": 5860.2, "valid_targets_min": 2406 }, { "epoch": 6.3474576271186445, "grad_norm": 0.47528112960496416, "learning_rate": 1.0549545673474304e-06, "loss": 0.2461, "loss_nan_ranks": 0, "loss_rank_avg": 0.0847092866897583, "step": 3745, "valid_targets_mean": 6441.5, "valid_targets_min": 3400 }, { "epoch": 6.3559322033898304, "grad_norm": 0.417189000217903, "learning_rate": 1.0280362306198732e-06, "loss": 0.2609, "loss_nan_ranks": 0, "loss_rank_avg": 0.1653599739074707, "step": 3750, "valid_targets_mean": 9874.0, "valid_targets_min": 3847 }, { "epoch": 6.364406779661017, "grad_norm": 0.44496662963253514, "learning_rate": 1.0014567117344121e-06, "loss": 0.2689, "loss_nan_ranks": 0, "loss_rank_avg": 0.14929382503032684, "step": 3755, "valid_targets_mean": 6836.2, "valid_targets_min": 2605 }, { "epoch": 6.372881355932203, "grad_norm": 0.4711935019321799, "learning_rate": 9.752164853712355e-07, "loss": 0.2432, "loss_nan_ranks": 0, "loss_rank_avg": 0.11264555901288986, "step": 3760, "valid_targets_mean": 7332.9, "valid_targets_min": 3422 }, { "epoch": 6.38135593220339, "grad_norm": 0.503630625795691, "learning_rate": 9.493160201511409e-07, "loss": 0.2658, "loss_nan_ranks": 0, "loss_rank_avg": 0.11310052871704102, "step": 3765, "valid_targets_mean": 7008.2, "valid_targets_min": 1707 }, { "epoch": 6.389830508474576, "grad_norm": 0.5778340405809688, "learning_rate": 9.2375577862718e-07, "loss": 0.2638, "loss_nan_ranks": 0, "loss_rank_avg": 0.09299856424331665, "step": 3770, "valid_targets_mean": 6915.5, "valid_targets_min": 2350 }, { "epoch": 6.398305084745763, "grad_norm": 0.42295528500037055, "learning_rate": 8.985362172763933e-07, "loss": 0.2444, "loss_nan_ranks": 0, "loss_rank_avg": 0.09429045021533966, "step": 3775, "valid_targets_mean": 6875.8, "valid_targets_min": 2364 }, { "epoch": 6.406779661016949, "grad_norm": 0.39896345678565265, "learning_rate": 8.736577864916617e-07, "loss": 0.2497, "loss_nan_ranks": 0, "loss_rank_avg": 0.11996320635080338, "step": 3780, "valid_targets_mean": 7433.8, "valid_targets_min": 2417 }, { "epoch": 6.415254237288136, "grad_norm": 0.42165435770722925, "learning_rate": 8.491209305736525e-07, "loss": 0.2535, "loss_nan_ranks": 0, "loss_rank_avg": 0.13380880653858185, "step": 3785, "valid_targets_mean": 7627.2, "valid_targets_min": 2303 }, { "epoch": 6.423728813559322, "grad_norm": 0.4505139819346616, "learning_rate": 8.249260877228993e-07, "loss": 0.2862, "loss_nan_ranks": 0, "loss_rank_avg": 0.14228764176368713, "step": 3790, "valid_targets_mean": 8098.2, "valid_targets_min": 3002 }, { "epoch": 6.432203389830509, "grad_norm": 0.4321271164525556, "learning_rate": 8.010736900319615e-07, "loss": 0.2721, "loss_nan_ranks": 0, "loss_rank_avg": 0.09055182337760925, "step": 3795, "valid_targets_mean": 6403.5, "valid_targets_min": 2779 }, { "epoch": 6.440677966101695, "grad_norm": 0.4445613645730953, "learning_rate": 7.775641634777198e-07, "loss": 0.2607, "loss_nan_ranks": 0, "loss_rank_avg": 0.11796161532402039, "step": 3800, "valid_targets_mean": 7846.5, "valid_targets_min": 3128 }, { "epoch": 6.4491525423728815, "grad_norm": 0.4983181318128694, "learning_rate": 7.543979279137592e-07, "loss": 0.2583, "loss_nan_ranks": 0, "loss_rank_avg": 0.11737058311700821, "step": 3805, "valid_targets_mean": 6364.1, "valid_targets_min": 2068 }, { "epoch": 6.4576271186440675, "grad_norm": 0.4637887645159089, "learning_rate": 7.315753970628825e-07, "loss": 0.2487, "loss_nan_ranks": 0, "loss_rank_avg": 0.09322785586118698, "step": 3810, "valid_targets_mean": 6619.9, "valid_targets_min": 2636 }, { "epoch": 6.466101694915254, "grad_norm": 0.40047532995209967, "learning_rate": 7.090969785097046e-07, "loss": 0.2647, "loss_nan_ranks": 0, "loss_rank_avg": 0.13654407858848572, "step": 3815, "valid_targets_mean": 9421.6, "valid_targets_min": 5966 }, { "epoch": 6.47457627118644, "grad_norm": 0.4390708368570101, "learning_rate": 6.869630736933963e-07, "loss": 0.242, "loss_nan_ranks": 0, "loss_rank_avg": 0.07607319951057434, "step": 3820, "valid_targets_mean": 6052.5, "valid_targets_min": 3828 }, { "epoch": 6.483050847457627, "grad_norm": 0.42364553715790104, "learning_rate": 6.651740779004878e-07, "loss": 0.2651, "loss_nan_ranks": 0, "loss_rank_avg": 0.1431792676448822, "step": 3825, "valid_targets_mean": 8558.6, "valid_targets_min": 2566 }, { "epoch": 6.491525423728813, "grad_norm": 0.47872145294990065, "learning_rate": 6.437303802578365e-07, "loss": 0.2624, "loss_nan_ranks": 0, "loss_rank_avg": 0.09658294916152954, "step": 3830, "valid_targets_mean": 5816.0, "valid_targets_min": 2772 }, { "epoch": 6.5, "grad_norm": 0.42695972686370715, "learning_rate": 6.226323637256592e-07, "loss": 0.2558, "loss_nan_ranks": 0, "loss_rank_avg": 0.09363295882940292, "step": 3835, "valid_targets_mean": 6977.9, "valid_targets_min": 2840 }, { "epoch": 6.508474576271187, "grad_norm": 0.448749456041159, "learning_rate": 6.018804050906957e-07, "loss": 0.259, "loss_nan_ranks": 0, "loss_rank_avg": 0.1705683469772339, "step": 3840, "valid_targets_mean": 9966.0, "valid_targets_min": 3703 }, { "epoch": 6.516949152542373, "grad_norm": 0.44110593342725196, "learning_rate": 5.814748749594845e-07, "loss": 0.2921, "loss_nan_ranks": 0, "loss_rank_avg": 0.15280672907829285, "step": 3845, "valid_targets_mean": 7834.5, "valid_targets_min": 2385 }, { "epoch": 6.52542372881356, "grad_norm": 0.41011102728994003, "learning_rate": 5.614161377517491e-07, "loss": 0.2395, "loss_nan_ranks": 0, "loss_rank_avg": 0.10929296910762787, "step": 3850, "valid_targets_mean": 7395.1, "valid_targets_min": 2328 }, { "epoch": 6.533898305084746, "grad_norm": 0.37684976767116324, "learning_rate": 5.417045516938712e-07, "loss": 0.2607, "loss_nan_ranks": 0, "loss_rank_avg": 0.15998807549476624, "step": 3855, "valid_targets_mean": 11794.1, "valid_targets_min": 3559 }, { "epoch": 6.5423728813559325, "grad_norm": 0.4502091870017217, "learning_rate": 5.223404688125189e-07, "loss": 0.2652, "loss_nan_ranks": 0, "loss_rank_avg": 0.08542191982269287, "step": 3860, "valid_targets_mean": 5364.5, "valid_targets_min": 1501 }, { "epoch": 6.5508474576271185, "grad_norm": 0.4518810494268951, "learning_rate": 5.033242349283307e-07, "loss": 0.2461, "loss_nan_ranks": 0, "loss_rank_avg": 0.13581258058547974, "step": 3865, "valid_targets_mean": 7274.4, "valid_targets_min": 2654 }, { "epoch": 6.559322033898305, "grad_norm": 0.467029591171528, "learning_rate": 4.846561896497682e-07, "loss": 0.2871, "loss_nan_ranks": 0, "loss_rank_avg": 0.10872132331132889, "step": 3870, "valid_targets_mean": 7022.8, "valid_targets_min": 4600 }, { "epoch": 6.567796610169491, "grad_norm": 0.4409609140769841, "learning_rate": 4.6633666636703325e-07, "loss": 0.256, "loss_nan_ranks": 0, "loss_rank_avg": 0.11535359919071198, "step": 3875, "valid_targets_mean": 7674.4, "valid_targets_min": 4116 }, { "epoch": 6.576271186440678, "grad_norm": 0.42972659095916, "learning_rate": 4.4836599224611586e-07, "loss": 0.2518, "loss_nan_ranks": 0, "loss_rank_avg": 0.09469720721244812, "step": 3880, "valid_targets_mean": 7193.9, "valid_targets_min": 712 }, { "epoch": 6.584745762711864, "grad_norm": 0.45334276617935493, "learning_rate": 4.3074448822295165e-07, "loss": 0.266, "loss_nan_ranks": 0, "loss_rank_avg": 0.23430021107196808, "step": 3885, "valid_targets_mean": 11505.8, "valid_targets_min": 2009 }, { "epoch": 6.593220338983051, "grad_norm": 0.43929363356639645, "learning_rate": 4.1347246899770435e-07, "loss": 0.252, "loss_nan_ranks": 0, "loss_rank_avg": 0.16690164804458618, "step": 3890, "valid_targets_mean": 7407.8, "valid_targets_min": 3494 }, { "epoch": 6.601694915254237, "grad_norm": 0.4147188602054449, "learning_rate": 3.965502430291235e-07, "loss": 0.2583, "loss_nan_ranks": 0, "loss_rank_avg": 0.16083547472953796, "step": 3895, "valid_targets_mean": 11111.1, "valid_targets_min": 5126 }, { "epoch": 6.610169491525424, "grad_norm": 0.455809497113382, "learning_rate": 3.7997811252905135e-07, "loss": 0.2462, "loss_nan_ranks": 0, "loss_rank_avg": 0.10246642678976059, "step": 3900, "valid_targets_mean": 6430.8, "valid_targets_min": 2509 }, { "epoch": 6.61864406779661, "grad_norm": 0.48481248655451537, "learning_rate": 3.6375637345701376e-07, "loss": 0.2921, "loss_nan_ranks": 0, "loss_rank_avg": 0.12926767766475677, "step": 3905, "valid_targets_mean": 8199.2, "valid_targets_min": 3433 }, { "epoch": 6.627118644067797, "grad_norm": 0.42600486230878915, "learning_rate": 3.4788531551495307e-07, "loss": 0.2337, "loss_nan_ranks": 0, "loss_rank_avg": 0.1657295525074005, "step": 3910, "valid_targets_mean": 9773.5, "valid_targets_min": 3644 }, { "epoch": 6.635593220338983, "grad_norm": 0.44131521564665016, "learning_rate": 3.323652221420326e-07, "loss": 0.2662, "loss_nan_ranks": 0, "loss_rank_avg": 0.11407070606946945, "step": 3915, "valid_targets_mean": 7225.0, "valid_targets_min": 3796 }, { "epoch": 6.6440677966101696, "grad_norm": 0.4377236209372105, "learning_rate": 3.1719637050958706e-07, "loss": 0.2443, "loss_nan_ranks": 0, "loss_rank_avg": 0.16772839426994324, "step": 3920, "valid_targets_mean": 7740.8, "valid_targets_min": 2711 }, { "epoch": 6.652542372881356, "grad_norm": 0.48773453863500077, "learning_rate": 3.023790315161734e-07, "loss": 0.234, "loss_nan_ranks": 0, "loss_rank_avg": 0.08592482656240463, "step": 3925, "valid_targets_mean": 5208.9, "valid_targets_min": 2740 }, { "epoch": 6.661016949152542, "grad_norm": 0.4720937825623047, "learning_rate": 2.8791346978273015e-07, "loss": 0.2457, "loss_nan_ranks": 0, "loss_rank_avg": 0.14076513051986694, "step": 3930, "valid_targets_mean": 7652.5, "valid_targets_min": 2939 }, { "epoch": 6.669491525423728, "grad_norm": 0.3859609875387887, "learning_rate": 2.7379994364784556e-07, "loss": 0.2748, "loss_nan_ranks": 0, "loss_rank_avg": 0.149990051984787, "step": 3935, "valid_targets_mean": 10438.9, "valid_targets_min": 6415 }, { "epoch": 6.677966101694915, "grad_norm": 0.5550308272010621, "learning_rate": 2.60038705163157e-07, "loss": 0.2458, "loss_nan_ranks": 0, "loss_rank_avg": 0.08144932985305786, "step": 3940, "valid_targets_mean": 5604.2, "valid_targets_min": 3387 }, { "epoch": 6.686440677966102, "grad_norm": 0.3979338951489735, "learning_rate": 2.4663000008883664e-07, "loss": 0.2958, "loss_nan_ranks": 0, "loss_rank_avg": 0.16274738311767578, "step": 3945, "valid_targets_mean": 9629.6, "valid_targets_min": 3399 }, { "epoch": 6.694915254237288, "grad_norm": 0.46083448051365644, "learning_rate": 2.335740678892129e-07, "loss": 0.2563, "loss_nan_ranks": 0, "loss_rank_avg": 0.14789345860481262, "step": 3950, "valid_targets_mean": 7863.1, "valid_targets_min": 2423 }, { "epoch": 6.703389830508475, "grad_norm": 0.41684119058343516, "learning_rate": 2.20871141728487e-07, "loss": 0.2757, "loss_nan_ranks": 0, "loss_rank_avg": 0.2013491988182068, "step": 3955, "valid_targets_mean": 10909.6, "valid_targets_min": 3286 }, { "epoch": 6.711864406779661, "grad_norm": 0.40804130143632766, "learning_rate": 2.0852144846656764e-07, "loss": 0.254, "loss_nan_ranks": 0, "loss_rank_avg": 0.11485549807548523, "step": 3960, "valid_targets_mean": 7442.1, "valid_targets_min": 1795 }, { "epoch": 6.720338983050848, "grad_norm": 0.41669778757995984, "learning_rate": 1.9652520865502734e-07, "loss": 0.2667, "loss_nan_ranks": 0, "loss_rank_avg": 0.11961879581212997, "step": 3965, "valid_targets_mean": 6853.5, "valid_targets_min": 2648 }, { "epoch": 6.728813559322034, "grad_norm": 0.4152131127329952, "learning_rate": 1.848826365331613e-07, "loss": 0.2728, "loss_nan_ranks": 0, "loss_rank_avg": 0.09015417098999023, "step": 3970, "valid_targets_mean": 6583.1, "valid_targets_min": 3468 }, { "epoch": 6.737288135593221, "grad_norm": 0.40715982611325285, "learning_rate": 1.7359394002415265e-07, "loss": 0.2537, "loss_nan_ranks": 0, "loss_rank_avg": 0.0808727890253067, "step": 3975, "valid_targets_mean": 7092.9, "valid_targets_min": 2970 }, { "epoch": 6.745762711864407, "grad_norm": 0.5044552290709712, "learning_rate": 1.626593207313709e-07, "loss": 0.2494, "loss_nan_ranks": 0, "loss_rank_avg": 0.08215104788541794, "step": 3980, "valid_targets_mean": 5966.9, "valid_targets_min": 2607 }, { "epoch": 6.754237288135593, "grad_norm": 0.43110120943383057, "learning_rate": 1.520789739347617e-07, "loss": 0.2726, "loss_nan_ranks": 0, "loss_rank_avg": 0.14837504923343658, "step": 3985, "valid_targets_mean": 8823.1, "valid_targets_min": 4021 }, { "epoch": 6.762711864406779, "grad_norm": 0.4055433819445956, "learning_rate": 1.4185308858737367e-07, "loss": 0.2864, "loss_nan_ranks": 0, "loss_rank_avg": 0.1624079942703247, "step": 3990, "valid_targets_mean": 7929.6, "valid_targets_min": 2855 }, { "epoch": 6.771186440677966, "grad_norm": 0.477581742178108, "learning_rate": 1.3198184731196162e-07, "loss": 0.2545, "loss_nan_ranks": 0, "loss_rank_avg": 0.10930319130420685, "step": 3995, "valid_targets_mean": 7842.5, "valid_targets_min": 3884 }, { "epoch": 6.779661016949152, "grad_norm": 0.46632621619817743, "learning_rate": 1.2246542639774871e-07, "loss": 0.2893, "loss_nan_ranks": 0, "loss_rank_avg": 0.08825379610061646, "step": 4000, "valid_targets_mean": 5714.2, "valid_targets_min": 2503 }, { "epoch": 6.788135593220339, "grad_norm": 0.40822795025329855, "learning_rate": 1.1330399579725814e-07, "loss": 0.2502, "loss_nan_ranks": 0, "loss_rank_avg": 0.12100020796060562, "step": 4005, "valid_targets_mean": 7386.6, "valid_targets_min": 2520 }, { "epoch": 6.796610169491525, "grad_norm": 0.4869071996289484, "learning_rate": 1.0449771912329543e-07, "loss": 0.2679, "loss_nan_ranks": 0, "loss_rank_avg": 0.13639283180236816, "step": 4010, "valid_targets_mean": 6874.1, "valid_targets_min": 3308 }, { "epoch": 6.805084745762712, "grad_norm": 0.4514466969309618, "learning_rate": 9.604675364601079e-08, "loss": 0.2802, "loss_nan_ranks": 0, "loss_rank_avg": 0.16514557600021362, "step": 4015, "valid_targets_mean": 8557.4, "valid_targets_min": 2551 }, { "epoch": 6.813559322033898, "grad_norm": 0.45927796348806976, "learning_rate": 8.795125029010587e-08, "loss": 0.2344, "loss_nan_ranks": 0, "loss_rank_avg": 0.14747881889343262, "step": 4020, "valid_targets_mean": 7801.5, "valid_targets_min": 1934 }, { "epoch": 6.822033898305085, "grad_norm": 0.4736824137520606, "learning_rate": 8.021135363212252e-08, "loss": 0.2668, "loss_nan_ranks": 0, "loss_rank_avg": 0.1297898292541504, "step": 4025, "valid_targets_mean": 7571.8, "valid_targets_min": 3105 }, { "epoch": 6.830508474576272, "grad_norm": 0.44820578616508494, "learning_rate": 7.282720189787374e-08, "loss": 0.2582, "loss_nan_ranks": 0, "loss_rank_avg": 0.11103338748216629, "step": 4030, "valid_targets_mean": 7009.0, "valid_targets_min": 2167 }, { "epoch": 6.838983050847458, "grad_norm": 0.41724902537057335, "learning_rate": 6.579892695996571e-08, "loss": 0.2534, "loss_nan_ranks": 0, "loss_rank_avg": 0.11125913262367249, "step": 4035, "valid_targets_mean": 7157.2, "valid_targets_min": 4536 }, { "epoch": 6.847457627118644, "grad_norm": 0.43675935476999767, "learning_rate": 5.912665433545517e-08, "loss": 0.2585, "loss_nan_ranks": 0, "loss_rank_avg": 0.13949739933013916, "step": 4040, "valid_targets_mean": 7369.8, "valid_targets_min": 2319 }, { "epoch": 6.8559322033898304, "grad_norm": 0.3967356930940284, "learning_rate": 5.281050318358683e-08, "loss": 0.2403, "loss_nan_ranks": 0, "loss_rank_avg": 0.11958187818527222, "step": 4045, "valid_targets_mean": 9524.0, "valid_targets_min": 3222 }, { "epoch": 6.864406779661017, "grad_norm": 0.3764643187198624, "learning_rate": 4.685058630369055e-08, "loss": 0.2759, "loss_nan_ranks": 0, "loss_rank_avg": 0.14520995318889618, "step": 4050, "valid_targets_mean": 10037.6, "valid_targets_min": 3726 }, { "epoch": 6.872881355932203, "grad_norm": 0.4472913726578498, "learning_rate": 4.124701013314969e-08, "loss": 0.2816, "loss_nan_ranks": 0, "loss_rank_avg": 0.13814541697502136, "step": 4055, "valid_targets_mean": 8044.9, "valid_targets_min": 1559 }, { "epoch": 6.88135593220339, "grad_norm": 0.4304758387859473, "learning_rate": 3.599987474550259e-08, "loss": 0.2661, "loss_nan_ranks": 0, "loss_rank_avg": 0.17096751928329468, "step": 4060, "valid_targets_mean": 8318.6, "valid_targets_min": 2625 }, { "epoch": 6.889830508474576, "grad_norm": 0.4255133064645767, "learning_rate": 3.110927384865958e-08, "loss": 0.2771, "loss_nan_ranks": 0, "loss_rank_avg": 0.18236063420772552, "step": 4065, "valid_targets_mean": 10562.4, "valid_targets_min": 4446 }, { "epoch": 6.898305084745763, "grad_norm": 0.42579147928580874, "learning_rate": 2.6575294783230954e-08, "loss": 0.232, "loss_nan_ranks": 0, "loss_rank_avg": 0.0787440836429596, "step": 4070, "valid_targets_mean": 5780.5, "valid_targets_min": 2433 }, { "epoch": 6.906779661016949, "grad_norm": 0.41394744030559266, "learning_rate": 2.239801852095935e-08, "loss": 0.2446, "loss_nan_ranks": 0, "loss_rank_avg": 0.160111665725708, "step": 4075, "valid_targets_mean": 10663.0, "valid_targets_min": 4448 }, { "epoch": 6.915254237288136, "grad_norm": 0.4398804522507922, "learning_rate": 1.8577519663278697e-08, "loss": 0.2397, "loss_nan_ranks": 0, "loss_rank_avg": 0.11937999725341797, "step": 4080, "valid_targets_mean": 8688.0, "valid_targets_min": 4993 }, { "epoch": 6.923728813559322, "grad_norm": 0.4242647115439553, "learning_rate": 1.5113866439986357e-08, "loss": 0.2832, "loss_nan_ranks": 0, "loss_rank_avg": 0.16489309072494507, "step": 4085, "valid_targets_mean": 8224.9, "valid_targets_min": 2579 }, { "epoch": 6.932203389830509, "grad_norm": 0.4463993067738115, "learning_rate": 1.2007120708015241e-08, "loss": 0.2719, "loss_nan_ranks": 0, "loss_rank_avg": 0.13091351091861725, "step": 4090, "valid_targets_mean": 6447.1, "valid_targets_min": 2442 }, { "epoch": 6.940677966101695, "grad_norm": 0.3869465593180131, "learning_rate": 9.257337950332456e-09, "loss": 0.2656, "loss_nan_ranks": 0, "loss_rank_avg": 0.12474340200424194, "step": 4095, "valid_targets_mean": 8366.1, "valid_targets_min": 3401 }, { "epoch": 6.9491525423728815, "grad_norm": 0.4310417118559466, "learning_rate": 6.864567274955658e-09, "loss": 0.2695, "loss_nan_ranks": 0, "loss_rank_avg": 0.1725938618183136, "step": 4100, "valid_targets_mean": 8291.4, "valid_targets_min": 2433 }, { "epoch": 6.9576271186440675, "grad_norm": 0.495997210458029, "learning_rate": 4.828851414062641e-09, "loss": 0.2767, "loss_nan_ranks": 0, "loss_rank_avg": 0.15047688782215118, "step": 4105, "valid_targets_mean": 9112.9, "valid_targets_min": 4448 }, { "epoch": 6.966101694915254, "grad_norm": 0.40916895754360966, "learning_rate": 3.150226723243055e-09, "loss": 0.2685, "loss_nan_ranks": 0, "loss_rank_avg": 0.12793532013893127, "step": 4110, "valid_targets_mean": 8339.1, "valid_targets_min": 2695 }, { "epoch": 6.97457627118644, "grad_norm": 0.4136374005938968, "learning_rate": 1.8287231808322702e-09, "loss": 0.2591, "loss_nan_ranks": 0, "loss_rank_avg": 0.14656734466552734, "step": 4115, "valid_targets_mean": 10133.8, "valid_targets_min": 6907 }, { "epoch": 6.983050847457627, "grad_norm": 0.44077122285507164, "learning_rate": 8.643643873962326e-10, "loss": 0.2447, "loss_nan_ranks": 0, "loss_rank_avg": 0.10336880385875702, "step": 4120, "valid_targets_mean": 7540.5, "valid_targets_min": 4074 }, { "epoch": 6.991525423728813, "grad_norm": 1.279550969019676, "learning_rate": 2.5716756528959553e-10, "loss": 0.2545, "loss_nan_ranks": 0, "loss_rank_avg": 0.16964712738990784, "step": 4125, "valid_targets_mean": 9376.9, "valid_targets_min": 3622 }, { "epoch": 7.0, "grad_norm": 0.42781761566450044, "learning_rate": 7.143558364841597e-12, "loss": 0.2477, "loss_nan_ranks": 0, "loss_rank_avg": 0.07686486095190048, "step": 4130, "valid_targets_mean": 6255.1, "valid_targets_min": 3251 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.07686486095190048, "step": 4130, "total_flos": 2.65446196155043e+18, "train_loss": 0.30306281665335555, "train_runtime": 64515.1665, "train_samples_per_second": 1.024, "train_steps_per_second": 0.064, "valid_targets_mean": 6255.1, "valid_targets_min": 3251 } ], "logging_steps": 5, "max_steps": 4130, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 1500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 2.65446196155043e+18, "train_batch_size": 1, "trial_name": null, "trial_params": null }