diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,9133 @@ +{ + "best_global_step": null, + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 7.0, + "eval_steps": 500, + "global_step": 4130, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.00847457627118644, + "grad_norm": 12.236435102750375, + "learning_rate": 3.8740920096852305e-07, + "loss": 0.8295, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2684570252895355, + "step": 5, + "valid_targets_mean": 4368.4, + "valid_targets_min": 2939 + }, + { + "epoch": 0.01694915254237288, + "grad_norm": 10.058309821274516, + "learning_rate": 8.716707021791768e-07, + "loss": 0.8055, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5616639852523804, + "step": 10, + "valid_targets_mean": 9545.8, + "valid_targets_min": 4547 + }, + { + "epoch": 0.025423728813559324, + "grad_norm": 8.52945178256474, + "learning_rate": 1.3559322033898307e-06, + "loss": 0.7631, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.4021530747413635, + "step": 15, + "valid_targets_mean": 9586.9, + "valid_targets_min": 5112 + }, + { + "epoch": 0.03389830508474576, + "grad_norm": 5.980922520646845, + "learning_rate": 1.8401937046004845e-06, + "loss": 0.7736, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.41938316822052, + "step": 20, + "valid_targets_mean": 8228.5, + "valid_targets_min": 3550 + }, + { + "epoch": 0.0423728813559322, + "grad_norm": 3.7984612636995125, + "learning_rate": 2.324455205811138e-06, + "loss": 0.7283, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.4073244035243988, + "step": 25, + "valid_targets_mean": 10135.8, + "valid_targets_min": 4168 + }, + { + "epoch": 0.05084745762711865, + "grad_norm": 2.94113455953092, + "learning_rate": 2.808716707021792e-06, + "loss": 0.7287, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3122481405735016, + "step": 30, + "valid_targets_mean": 8561.0, + "valid_targets_min": 3843 + }, + { + "epoch": 0.059322033898305086, + "grad_norm": 2.719124371329246, + "learning_rate": 3.2929782082324455e-06, + "loss": 0.7333, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.31176847219467163, + "step": 35, + "valid_targets_mean": 5976.4, + "valid_targets_min": 3033 + }, + { + "epoch": 0.06779661016949153, + "grad_norm": 1.8367152849661372, + "learning_rate": 3.7772397094430994e-06, + "loss": 0.6223, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3117915391921997, + "step": 40, + "valid_targets_mean": 6918.5, + "valid_targets_min": 3257 + }, + { + "epoch": 0.07627118644067797, + "grad_norm": 1.202874459401654, + "learning_rate": 4.261501210653753e-06, + "loss": 0.6556, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.36333340406417847, + "step": 45, + "valid_targets_mean": 9124.4, + "valid_targets_min": 2913 + }, + { + "epoch": 0.0847457627118644, + "grad_norm": 1.0786502836699934, + "learning_rate": 4.745762711864408e-06, + "loss": 0.5957, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.32077574729919434, + "step": 50, + "valid_targets_mean": 9160.0, + "valid_targets_min": 4550 + }, + { + "epoch": 0.09322033898305085, + "grad_norm": 0.9850973794351479, + "learning_rate": 5.230024213075061e-06, + "loss": 0.5574, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28348320722579956, + "step": 55, + "valid_targets_mean": 7648.8, + "valid_targets_min": 2230 + }, + { + "epoch": 0.1016949152542373, + "grad_norm": 0.9506271905194752, + "learning_rate": 5.7142857142857145e-06, + "loss": 0.5513, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.35213959217071533, + "step": 60, + "valid_targets_mean": 9959.1, + "valid_targets_min": 6620 + }, + { + "epoch": 0.11016949152542373, + "grad_norm": 0.7568590634359315, + "learning_rate": 6.198547215496369e-06, + "loss": 0.5441, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.32353514432907104, + "step": 65, + "valid_targets_mean": 8611.0, + "valid_targets_min": 3485 + }, + { + "epoch": 0.11864406779661017, + "grad_norm": 0.8003434826466195, + "learning_rate": 6.682808716707022e-06, + "loss": 0.5294, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2963908612728119, + "step": 70, + "valid_targets_mean": 8577.6, + "valid_targets_min": 4103 + }, + { + "epoch": 0.1271186440677966, + "grad_norm": 0.6819382378620414, + "learning_rate": 7.1670702179176766e-06, + "loss": 0.5266, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.29446882009506226, + "step": 75, + "valid_targets_mean": 9525.9, + "valid_targets_min": 2096 + }, + { + "epoch": 0.13559322033898305, + "grad_norm": 0.5426614937193089, + "learning_rate": 7.65133171912833e-06, + "loss": 0.4912, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1997358202934265, + "step": 80, + "valid_targets_mean": 6563.4, + "valid_targets_min": 2943 + }, + { + "epoch": 0.1440677966101695, + "grad_norm": 0.5948300852884347, + "learning_rate": 8.135593220338983e-06, + "loss": 0.5251, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.4521056115627289, + "step": 85, + "valid_targets_mean": 12116.9, + "valid_targets_min": 3622 + }, + { + "epoch": 0.15254237288135594, + "grad_norm": 0.49709515079932287, + "learning_rate": 8.619854721549637e-06, + "loss": 0.5206, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.284382164478302, + "step": 90, + "valid_targets_mean": 8606.2, + "valid_targets_min": 3501 + }, + { + "epoch": 0.16101694915254236, + "grad_norm": 0.4713133451299385, + "learning_rate": 9.10411622276029e-06, + "loss": 0.474, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15513190627098083, + "step": 95, + "valid_targets_mean": 6271.8, + "valid_targets_min": 3023 + }, + { + "epoch": 0.1694915254237288, + "grad_norm": 0.4457304349817586, + "learning_rate": 9.588377723970946e-06, + "loss": 0.4661, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2053360641002655, + "step": 100, + "valid_targets_mean": 7486.0, + "valid_targets_min": 3465 + }, + { + "epoch": 0.17796610169491525, + "grad_norm": 0.44154277874061937, + "learning_rate": 1.0072639225181599e-05, + "loss": 0.4511, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20671820640563965, + "step": 105, + "valid_targets_mean": 6911.2, + "valid_targets_min": 2853 + }, + { + "epoch": 0.1864406779661017, + "grad_norm": 0.48622015880781266, + "learning_rate": 1.0556900726392252e-05, + "loss": 0.4333, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.292965292930603, + "step": 110, + "valid_targets_mean": 8936.8, + "valid_targets_min": 1718 + }, + { + "epoch": 0.19491525423728814, + "grad_norm": 0.4945674916588067, + "learning_rate": 1.1041162227602906e-05, + "loss": 0.46, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15357142686843872, + "step": 115, + "valid_targets_mean": 6594.0, + "valid_targets_min": 1819 + }, + { + "epoch": 0.2033898305084746, + "grad_norm": 0.5260662505419903, + "learning_rate": 1.1525423728813561e-05, + "loss": 0.4256, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2100408673286438, + "step": 120, + "valid_targets_mean": 6844.6, + "valid_targets_min": 2819 + }, + { + "epoch": 0.211864406779661, + "grad_norm": 0.4859160469605518, + "learning_rate": 1.2009685230024215e-05, + "loss": 0.4549, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.29052165150642395, + "step": 125, + "valid_targets_mean": 9443.6, + "valid_targets_min": 2351 + }, + { + "epoch": 0.22033898305084745, + "grad_norm": 0.4887408500988149, + "learning_rate": 1.2493946731234868e-05, + "loss": 0.4533, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.32517391443252563, + "step": 130, + "valid_targets_mean": 9598.9, + "valid_targets_min": 3221 + }, + { + "epoch": 0.2288135593220339, + "grad_norm": 0.44709723187595857, + "learning_rate": 1.2978208232445521e-05, + "loss": 0.4038, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22177180647850037, + "step": 135, + "valid_targets_mean": 7938.1, + "valid_targets_min": 1772 + }, + { + "epoch": 0.23728813559322035, + "grad_norm": 0.47189922671995305, + "learning_rate": 1.3462469733656177e-05, + "loss": 0.4447, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19433565437793732, + "step": 140, + "valid_targets_mean": 7033.0, + "valid_targets_min": 3731 + }, + { + "epoch": 0.2457627118644068, + "grad_norm": 0.7896370250308062, + "learning_rate": 1.3946731234866828e-05, + "loss": 0.4819, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25007662177085876, + "step": 145, + "valid_targets_mean": 7750.5, + "valid_targets_min": 3290 + }, + { + "epoch": 0.2542372881355932, + "grad_norm": 1.167473809507481, + "learning_rate": 1.4430992736077482e-05, + "loss": 0.3776, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19537419080734253, + "step": 150, + "valid_targets_mean": 7780.4, + "valid_targets_min": 2228 + }, + { + "epoch": 0.2627118644067797, + "grad_norm": 0.4604199039648987, + "learning_rate": 1.4915254237288137e-05, + "loss": 0.4206, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20237131416797638, + "step": 155, + "valid_targets_mean": 6237.5, + "valid_targets_min": 2797 + }, + { + "epoch": 0.2711864406779661, + "grad_norm": 1.2851421474093927, + "learning_rate": 1.5399515738498792e-05, + "loss": 0.3927, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1901024878025055, + "step": 160, + "valid_targets_mean": 7075.9, + "valid_targets_min": 3662 + }, + { + "epoch": 0.2796610169491525, + "grad_norm": 0.4580396609863836, + "learning_rate": 1.5883777239709442e-05, + "loss": 0.3924, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.146134614944458, + "step": 165, + "valid_targets_mean": 7100.8, + "valid_targets_min": 3506 + }, + { + "epoch": 0.288135593220339, + "grad_norm": 0.4849064596017498, + "learning_rate": 1.63680387409201e-05, + "loss": 0.4289, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18006592988967896, + "step": 170, + "valid_targets_mean": 8865.8, + "valid_targets_min": 3261 + }, + { + "epoch": 0.2966101694915254, + "grad_norm": 0.4697056355654206, + "learning_rate": 1.6852300242130752e-05, + "loss": 0.3988, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23008233308792114, + "step": 175, + "valid_targets_mean": 8906.1, + "valid_targets_min": 3874 + }, + { + "epoch": 0.3050847457627119, + "grad_norm": 0.4186025820722969, + "learning_rate": 1.7336561743341406e-05, + "loss": 0.4076, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21983414888381958, + "step": 180, + "valid_targets_mean": 9217.2, + "valid_targets_min": 4157 + }, + { + "epoch": 0.3135593220338983, + "grad_norm": 0.4880177558476617, + "learning_rate": 1.782082324455206e-05, + "loss": 0.408, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20033296942710876, + "step": 185, + "valid_targets_mean": 8644.5, + "valid_targets_min": 5639 + }, + { + "epoch": 0.3220338983050847, + "grad_norm": 0.506835537780777, + "learning_rate": 1.8305084745762713e-05, + "loss": 0.4345, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15411603450775146, + "step": 190, + "valid_targets_mean": 5940.5, + "valid_targets_min": 2975 + }, + { + "epoch": 0.3305084745762712, + "grad_norm": 0.5175806823084516, + "learning_rate": 1.8789346246973366e-05, + "loss": 0.3823, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22352342307567596, + "step": 195, + "valid_targets_mean": 6518.9, + "valid_targets_min": 1922 + }, + { + "epoch": 0.3389830508474576, + "grad_norm": 0.39209882371312016, + "learning_rate": 1.927360774818402e-05, + "loss": 0.4033, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23113977909088135, + "step": 200, + "valid_targets_mean": 11211.2, + "valid_targets_min": 5692 + }, + { + "epoch": 0.3474576271186441, + "grad_norm": 0.5642312831981638, + "learning_rate": 1.9757869249394673e-05, + "loss": 0.4274, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.29515933990478516, + "step": 205, + "valid_targets_mean": 12401.2, + "valid_targets_min": 5602 + }, + { + "epoch": 0.3559322033898305, + "grad_norm": 0.4694784872364969, + "learning_rate": 2.0242130750605327e-05, + "loss": 0.3671, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22254446148872375, + "step": 210, + "valid_targets_mean": 9149.9, + "valid_targets_min": 3145 + }, + { + "epoch": 0.3644067796610169, + "grad_norm": 0.4729181140659464, + "learning_rate": 2.072639225181598e-05, + "loss": 0.3811, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1420256644487381, + "step": 215, + "valid_targets_mean": 6157.2, + "valid_targets_min": 2493 + }, + { + "epoch": 0.3728813559322034, + "grad_norm": 0.48751693402766566, + "learning_rate": 2.1210653753026637e-05, + "loss": 0.3637, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.30695676803588867, + "step": 220, + "valid_targets_mean": 10364.8, + "valid_targets_min": 4940 + }, + { + "epoch": 0.3813559322033898, + "grad_norm": 0.4492368775328314, + "learning_rate": 2.169491525423729e-05, + "loss": 0.392, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1817527413368225, + "step": 225, + "valid_targets_mean": 8587.1, + "valid_targets_min": 6431 + }, + { + "epoch": 0.3898305084745763, + "grad_norm": 0.5264407991637193, + "learning_rate": 2.2179176755447944e-05, + "loss": 0.3598, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.144405335187912, + "step": 230, + "valid_targets_mean": 6391.9, + "valid_targets_min": 2800 + }, + { + "epoch": 0.3983050847457627, + "grad_norm": 0.44859050212635043, + "learning_rate": 2.2663438256658597e-05, + "loss": 0.4306, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12371104955673218, + "step": 235, + "valid_targets_mean": 6035.9, + "valid_targets_min": 2422 + }, + { + "epoch": 0.4067796610169492, + "grad_norm": 0.4487952241314178, + "learning_rate": 2.3147699757869254e-05, + "loss": 0.3496, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15325893461704254, + "step": 240, + "valid_targets_mean": 7694.0, + "valid_targets_min": 2322 + }, + { + "epoch": 0.4152542372881356, + "grad_norm": 0.5180958481856792, + "learning_rate": 2.3631961259079904e-05, + "loss": 0.3907, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20144130289554596, + "step": 245, + "valid_targets_mean": 6840.8, + "valid_targets_min": 2925 + }, + { + "epoch": 0.423728813559322, + "grad_norm": 0.4491176387970824, + "learning_rate": 2.4116222760290558e-05, + "loss": 0.3935, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20885750651359558, + "step": 250, + "valid_targets_mean": 8512.1, + "valid_targets_min": 2493 + }, + { + "epoch": 0.4322033898305085, + "grad_norm": 0.4628691361446054, + "learning_rate": 2.460048426150121e-05, + "loss": 0.3732, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18055710196495056, + "step": 255, + "valid_targets_mean": 7962.2, + "valid_targets_min": 3404 + }, + { + "epoch": 0.4406779661016949, + "grad_norm": 0.4696155991888429, + "learning_rate": 2.5084745762711865e-05, + "loss": 0.3845, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2186737358570099, + "step": 260, + "valid_targets_mean": 8228.9, + "valid_targets_min": 4428 + }, + { + "epoch": 0.4491525423728814, + "grad_norm": 0.4797313441924088, + "learning_rate": 2.556900726392252e-05, + "loss": 0.3806, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18754912912845612, + "step": 265, + "valid_targets_mean": 8026.2, + "valid_targets_min": 2632 + }, + { + "epoch": 0.4576271186440678, + "grad_norm": 0.500792419812694, + "learning_rate": 2.6053268765133175e-05, + "loss": 0.3691, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14188027381896973, + "step": 270, + "valid_targets_mean": 6896.5, + "valid_targets_min": 2844 + }, + { + "epoch": 0.4661016949152542, + "grad_norm": 0.5194573027568329, + "learning_rate": 2.653753026634383e-05, + "loss": 0.4269, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25647997856140137, + "step": 275, + "valid_targets_mean": 10153.5, + "valid_targets_min": 2859 + }, + { + "epoch": 0.4745762711864407, + "grad_norm": 0.4835165912338022, + "learning_rate": 2.702179176755448e-05, + "loss": 0.4008, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2677648067474365, + "step": 280, + "valid_targets_mean": 10436.8, + "valid_targets_min": 2643 + }, + { + "epoch": 0.4830508474576271, + "grad_norm": 0.4697980137297522, + "learning_rate": 2.7506053268765135e-05, + "loss": 0.3844, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23836316168308258, + "step": 285, + "valid_targets_mean": 9596.2, + "valid_targets_min": 4758 + }, + { + "epoch": 0.4915254237288136, + "grad_norm": 0.7658555007951203, + "learning_rate": 2.799031476997579e-05, + "loss": 0.389, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1868828684091568, + "step": 290, + "valid_targets_mean": 7418.0, + "valid_targets_min": 2145 + }, + { + "epoch": 0.5, + "grad_norm": 0.47702422177750037, + "learning_rate": 2.8474576271186442e-05, + "loss": 0.3657, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20087997615337372, + "step": 295, + "valid_targets_mean": 7950.9, + "valid_targets_min": 1969 + }, + { + "epoch": 0.5084745762711864, + "grad_norm": 0.46273864653365726, + "learning_rate": 2.8958837772397096e-05, + "loss": 0.3648, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1638944149017334, + "step": 300, + "valid_targets_mean": 7513.8, + "valid_targets_min": 1750 + }, + { + "epoch": 0.5169491525423728, + "grad_norm": 0.47460686381697653, + "learning_rate": 2.9443099273607753e-05, + "loss": 0.3583, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22977076470851898, + "step": 305, + "valid_targets_mean": 10273.2, + "valid_targets_min": 6552 + }, + { + "epoch": 0.5254237288135594, + "grad_norm": 0.5179070401819209, + "learning_rate": 2.9927360774818406e-05, + "loss": 0.3636, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1554882526397705, + "step": 310, + "valid_targets_mean": 6126.1, + "valid_targets_min": 2357 + }, + { + "epoch": 0.5338983050847458, + "grad_norm": 0.4667464306864076, + "learning_rate": 3.041162227602906e-05, + "loss": 0.3599, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14054939150810242, + "step": 315, + "valid_targets_mean": 7663.6, + "valid_targets_min": 5239 + }, + { + "epoch": 0.5423728813559322, + "grad_norm": 0.4781556906105198, + "learning_rate": 3.089588377723971e-05, + "loss": 0.3804, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19416019320487976, + "step": 320, + "valid_targets_mean": 7567.8, + "valid_targets_min": 1645 + }, + { + "epoch": 0.5508474576271186, + "grad_norm": 0.511629903592572, + "learning_rate": 3.138014527845036e-05, + "loss": 0.357, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12012749165296555, + "step": 325, + "valid_targets_mean": 5964.8, + "valid_targets_min": 4470 + }, + { + "epoch": 0.559322033898305, + "grad_norm": 0.4480119776210039, + "learning_rate": 3.186440677966102e-05, + "loss": 0.3552, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.162928506731987, + "step": 330, + "valid_targets_mean": 7623.0, + "valid_targets_min": 2591 + }, + { + "epoch": 0.5677966101694916, + "grad_norm": 0.4937825533870499, + "learning_rate": 3.234866828087168e-05, + "loss": 0.3694, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19250673055648804, + "step": 335, + "valid_targets_mean": 8913.8, + "valid_targets_min": 2840 + }, + { + "epoch": 0.576271186440678, + "grad_norm": 0.4878075980066041, + "learning_rate": 3.283292978208233e-05, + "loss": 0.3802, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16013866662979126, + "step": 340, + "valid_targets_mean": 6744.0, + "valid_targets_min": 1682 + }, + { + "epoch": 0.5847457627118644, + "grad_norm": 0.45319045459430685, + "learning_rate": 3.3317191283292984e-05, + "loss": 0.3863, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14388547837734222, + "step": 345, + "valid_targets_mean": 7284.5, + "valid_targets_min": 1990 + }, + { + "epoch": 0.5932203389830508, + "grad_norm": 0.47236199339171486, + "learning_rate": 3.3801452784503634e-05, + "loss": 0.3804, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.231609508395195, + "step": 350, + "valid_targets_mean": 9248.5, + "valid_targets_min": 2566 + }, + { + "epoch": 0.6016949152542372, + "grad_norm": 0.5119661968795367, + "learning_rate": 3.4285714285714284e-05, + "loss": 0.3726, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21987944841384888, + "step": 355, + "valid_targets_mean": 8192.4, + "valid_targets_min": 2871 + }, + { + "epoch": 0.6101694915254238, + "grad_norm": 0.42304412282644255, + "learning_rate": 3.476997578692494e-05, + "loss": 0.3661, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13173159956932068, + "step": 360, + "valid_targets_mean": 8175.8, + "valid_targets_min": 5029 + }, + { + "epoch": 0.6186440677966102, + "grad_norm": 0.47803298114996845, + "learning_rate": 3.52542372881356e-05, + "loss": 0.3882, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14908023178577423, + "step": 365, + "valid_targets_mean": 6414.9, + "valid_targets_min": 3910 + }, + { + "epoch": 0.6271186440677966, + "grad_norm": 0.4881529791768924, + "learning_rate": 3.573849878934625e-05, + "loss": 0.3723, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16491301357746124, + "step": 370, + "valid_targets_mean": 7414.9, + "valid_targets_min": 2965 + }, + { + "epoch": 0.635593220338983, + "grad_norm": 0.5108906486160846, + "learning_rate": 3.6222760290556904e-05, + "loss": 0.3844, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22124037146568298, + "step": 375, + "valid_targets_mean": 7832.9, + "valid_targets_min": 2970 + }, + { + "epoch": 0.6440677966101694, + "grad_norm": 0.5139550621670309, + "learning_rate": 3.670702179176756e-05, + "loss": 0.3794, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24905268847942352, + "step": 380, + "valid_targets_mean": 8240.8, + "valid_targets_min": 5678 + }, + { + "epoch": 0.652542372881356, + "grad_norm": 0.4939392728062636, + "learning_rate": 3.719128329297821e-05, + "loss": 0.398, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1989961713552475, + "step": 385, + "valid_targets_mean": 9710.9, + "valid_targets_min": 4394 + }, + { + "epoch": 0.6610169491525424, + "grad_norm": 0.47183364711246323, + "learning_rate": 3.767554479418886e-05, + "loss": 0.3727, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17190328240394592, + "step": 390, + "valid_targets_mean": 7330.9, + "valid_targets_min": 2921 + }, + { + "epoch": 0.6694915254237288, + "grad_norm": 0.4406788345603544, + "learning_rate": 3.815980629539952e-05, + "loss": 0.3487, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15205857157707214, + "step": 395, + "valid_targets_mean": 6784.4, + "valid_targets_min": 2346 + }, + { + "epoch": 0.6779661016949152, + "grad_norm": 0.4456952077678055, + "learning_rate": 3.8644067796610175e-05, + "loss": 0.3699, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1788387894630432, + "step": 400, + "valid_targets_mean": 7900.6, + "valid_targets_min": 3235 + }, + { + "epoch": 0.6864406779661016, + "grad_norm": 0.5523324054394816, + "learning_rate": 3.9128329297820825e-05, + "loss": 0.3574, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13928887248039246, + "step": 405, + "valid_targets_mean": 5171.9, + "valid_targets_min": 3136 + }, + { + "epoch": 0.6949152542372882, + "grad_norm": 0.5002722226670426, + "learning_rate": 3.961259079903148e-05, + "loss": 0.385, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1312628537416458, + "step": 410, + "valid_targets_mean": 6787.4, + "valid_targets_min": 3693 + }, + { + "epoch": 0.7033898305084746, + "grad_norm": 0.42843480849686666, + "learning_rate": 3.9999992856441635e-05, + "loss": 0.3493, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1744052767753601, + "step": 415, + "valid_targets_mean": 7211.9, + "valid_targets_min": 2393 + }, + { + "epoch": 0.711864406779661, + "grad_norm": 0.4679043644147995, + "learning_rate": 3.999974283243472e-05, + "loss": 0.3639, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1082448959350586, + "step": 420, + "valid_targets_mean": 6552.6, + "valid_targets_min": 2437 + }, + { + "epoch": 0.7203389830508474, + "grad_norm": 0.47331069467877396, + "learning_rate": 3.9999135635612606e-05, + "loss": 0.4011, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23097260296344757, + "step": 425, + "valid_targets_mean": 8409.1, + "valid_targets_min": 3741 + }, + { + "epoch": 0.7288135593220338, + "grad_norm": 0.5135319796540361, + "learning_rate": 3.999817127681917e-05, + "loss": 0.3778, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.33611786365509033, + "step": 430, + "valid_targets_mean": 11845.2, + "valid_targets_min": 1936 + }, + { + "epoch": 0.7372881355932204, + "grad_norm": 0.5557676245987662, + "learning_rate": 3.9996849773276764e-05, + "loss": 0.3458, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12023050338029861, + "step": 435, + "valid_targets_mean": 4693.2, + "valid_targets_min": 3425 + }, + { + "epoch": 0.7457627118644068, + "grad_norm": 0.5410110705579056, + "learning_rate": 3.9995171148585944e-05, + "loss": 0.3175, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16153821349143982, + "step": 440, + "valid_targets_mean": 6421.5, + "valid_targets_min": 3319 + }, + { + "epoch": 0.7542372881355932, + "grad_norm": 0.4951775086532844, + "learning_rate": 3.999313543272505e-05, + "loss": 0.3564, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1502537578344345, + "step": 445, + "valid_targets_mean": 7038.1, + "valid_targets_min": 3514 + }, + { + "epoch": 0.7627118644067796, + "grad_norm": 0.47906530418320226, + "learning_rate": 3.999074266204967e-05, + "loss": 0.3263, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16620051860809326, + "step": 450, + "valid_targets_mean": 8577.1, + "valid_targets_min": 3324 + }, + { + "epoch": 0.7711864406779662, + "grad_norm": 0.5177860251716547, + "learning_rate": 3.998799287929199e-05, + "loss": 0.3375, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20412178337574005, + "step": 455, + "valid_targets_mean": 7626.9, + "valid_targets_min": 1240 + }, + { + "epoch": 0.7796610169491526, + "grad_norm": 0.46635973969392164, + "learning_rate": 3.998488613356002e-05, + "loss": 0.3464, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1993708461523056, + "step": 460, + "valid_targets_mean": 9630.6, + "valid_targets_min": 4060 + }, + { + "epoch": 0.788135593220339, + "grad_norm": 0.48835104343419244, + "learning_rate": 3.998142248033673e-05, + "loss": 0.3796, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20394505560398102, + "step": 465, + "valid_targets_mean": 7548.1, + "valid_targets_min": 3516 + }, + { + "epoch": 0.7966101694915254, + "grad_norm": 0.4557086785487366, + "learning_rate": 3.997760198147904e-05, + "loss": 0.3486, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15721432864665985, + "step": 470, + "valid_targets_mean": 6833.1, + "valid_targets_min": 2772 + }, + { + "epoch": 0.8050847457627118, + "grad_norm": 0.4515063413898264, + "learning_rate": 3.9973424705216774e-05, + "loss": 0.3784, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1749514490365982, + "step": 475, + "valid_targets_mean": 7408.5, + "valid_targets_min": 1943 + }, + { + "epoch": 0.8135593220338984, + "grad_norm": 0.4428676672373464, + "learning_rate": 3.996889072615134e-05, + "loss": 0.3258, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21249344944953918, + "step": 480, + "valid_targets_mean": 9819.9, + "valid_targets_min": 3010 + }, + { + "epoch": 0.8220338983050848, + "grad_norm": 0.49524032365604226, + "learning_rate": 3.99640001252545e-05, + "loss": 0.375, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1323350965976715, + "step": 485, + "valid_targets_mean": 5834.0, + "valid_targets_min": 3776 + }, + { + "epoch": 0.8305084745762712, + "grad_norm": 0.47661852289977547, + "learning_rate": 3.9958752989866856e-05, + "loss": 0.3669, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2077844887971878, + "step": 490, + "valid_targets_mean": 7829.8, + "valid_targets_min": 3541 + }, + { + "epoch": 0.8389830508474576, + "grad_norm": 0.5368833318390628, + "learning_rate": 3.995314941369631e-05, + "loss": 0.3385, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1979312300682068, + "step": 495, + "valid_targets_mean": 7753.1, + "valid_targets_min": 3245 + }, + { + "epoch": 0.847457627118644, + "grad_norm": 0.43413683875323356, + "learning_rate": 3.994718949681642e-05, + "loss": 0.3241, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08601364493370056, + "step": 500, + "valid_targets_mean": 4876.6, + "valid_targets_min": 1373 + }, + { + "epoch": 0.8559322033898306, + "grad_norm": 0.45697287254458874, + "learning_rate": 3.994087334566455e-05, + "loss": 0.3471, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1718927025794983, + "step": 505, + "valid_targets_mean": 7721.6, + "valid_targets_min": 4226 + }, + { + "epoch": 0.864406779661017, + "grad_norm": 0.47862116333913, + "learning_rate": 3.9934201073040035e-05, + "loss": 0.3587, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1376647651195526, + "step": 510, + "valid_targets_mean": 7147.1, + "valid_targets_min": 4853 + }, + { + "epoch": 0.8728813559322034, + "grad_norm": 0.4429781490950345, + "learning_rate": 3.992717279810213e-05, + "loss": 0.3546, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17605769634246826, + "step": 515, + "valid_targets_mean": 7849.5, + "valid_targets_min": 4396 + }, + { + "epoch": 0.8813559322033898, + "grad_norm": 0.45127457745702443, + "learning_rate": 3.991978864636788e-05, + "loss": 0.3421, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1218881830573082, + "step": 520, + "valid_targets_mean": 6575.2, + "valid_targets_min": 2730 + }, + { + "epoch": 0.8898305084745762, + "grad_norm": 0.4345536633734186, + "learning_rate": 3.9912048749709896e-05, + "loss": 0.3497, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1432826966047287, + "step": 525, + "valid_targets_mean": 8336.4, + "valid_targets_min": 3085 + }, + { + "epoch": 0.8983050847457628, + "grad_norm": 0.4843526513333187, + "learning_rate": 3.990395324635399e-05, + "loss": 0.3294, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18618427217006683, + "step": 530, + "valid_targets_mean": 8355.0, + "valid_targets_min": 4107 + }, + { + "epoch": 0.9067796610169492, + "grad_norm": 0.44356795524997744, + "learning_rate": 3.989550228087671e-05, + "loss": 0.3497, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1626293659210205, + "step": 535, + "valid_targets_mean": 7243.9, + "valid_targets_min": 2909 + }, + { + "epoch": 0.9152542372881356, + "grad_norm": 0.41561791071560467, + "learning_rate": 3.988669600420275e-05, + "loss": 0.3201, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1661594808101654, + "step": 540, + "valid_targets_mean": 9455.1, + "valid_targets_min": 4298 + }, + { + "epoch": 0.923728813559322, + "grad_norm": 0.4358520648605049, + "learning_rate": 3.9877534573602254e-05, + "loss": 0.3617, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27095770835876465, + "step": 545, + "valid_targets_mean": 8973.9, + "valid_targets_min": 2827 + }, + { + "epoch": 0.9322033898305084, + "grad_norm": 0.4813894750533826, + "learning_rate": 3.9868018152688044e-05, + "loss": 0.3558, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17274773120880127, + "step": 550, + "valid_targets_mean": 7341.4, + "valid_targets_min": 1721 + }, + { + "epoch": 0.940677966101695, + "grad_norm": 0.46263973848113316, + "learning_rate": 3.985814691141263e-05, + "loss": 0.3598, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2267192006111145, + "step": 555, + "valid_targets_mean": 9122.1, + "valid_targets_min": 3336 + }, + { + "epoch": 0.9491525423728814, + "grad_norm": 0.46520816240799234, + "learning_rate": 3.984792102606524e-05, + "loss": 0.3821, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11244647204875946, + "step": 560, + "valid_targets_mean": 6185.9, + "valid_targets_min": 2997 + }, + { + "epoch": 0.9576271186440678, + "grad_norm": 0.5072756278635104, + "learning_rate": 3.9837340679268634e-05, + "loss": 0.315, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11192071437835693, + "step": 565, + "valid_targets_mean": 6087.0, + "valid_targets_min": 3094 + }, + { + "epoch": 0.9661016949152542, + "grad_norm": 0.4165557159597932, + "learning_rate": 3.982640605997585e-05, + "loss": 0.329, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14271879196166992, + "step": 570, + "valid_targets_mean": 7421.4, + "valid_targets_min": 3182 + }, + { + "epoch": 0.9745762711864406, + "grad_norm": 0.4465966835957301, + "learning_rate": 3.981511736346684e-05, + "loss": 0.3512, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1899096965789795, + "step": 575, + "valid_targets_mean": 8330.2, + "valid_targets_min": 3990 + }, + { + "epoch": 0.9830508474576272, + "grad_norm": 0.47188153745533346, + "learning_rate": 3.980347479134498e-05, + "loss": 0.3326, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16237373650074005, + "step": 580, + "valid_targets_mean": 7614.1, + "valid_targets_min": 3425 + }, + { + "epoch": 0.9915254237288136, + "grad_norm": 0.45659300690082466, + "learning_rate": 3.9791478551533435e-05, + "loss": 0.3241, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1724914014339447, + "step": 585, + "valid_targets_mean": 7735.9, + "valid_targets_min": 3159 + }, + { + "epoch": 1.0, + "grad_norm": 0.4731948101985973, + "learning_rate": 3.977912885827151e-05, + "loss": 0.342, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1396312415599823, + "step": 590, + "valid_targets_mean": 6537.0, + "valid_targets_min": 2991 + }, + { + "epoch": 1.0084745762711864, + "grad_norm": 0.4627342217897108, + "learning_rate": 3.976642593211079e-05, + "loss": 0.3613, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24919381737709045, + "step": 595, + "valid_targets_mean": 10379.8, + "valid_targets_min": 3903 + }, + { + "epoch": 1.0169491525423728, + "grad_norm": 0.4536741195006425, + "learning_rate": 3.9753369999911166e-05, + "loss": 0.3309, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15797701478004456, + "step": 600, + "valid_targets_mean": 7904.0, + "valid_targets_min": 3709 + }, + { + "epoch": 1.0254237288135593, + "grad_norm": 0.4589851155496452, + "learning_rate": 3.973996129483684e-05, + "loss": 0.3171, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10587269067764282, + "step": 605, + "valid_targets_mean": 7432.1, + "valid_targets_min": 2532 + }, + { + "epoch": 1.0338983050847457, + "grad_norm": 0.47318377384255594, + "learning_rate": 3.972620005635216e-05, + "loss": 0.2935, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1729205846786499, + "step": 610, + "valid_targets_mean": 7595.9, + "valid_targets_min": 2825 + }, + { + "epoch": 1.042372881355932, + "grad_norm": 0.4469128531341844, + "learning_rate": 3.971208653021727e-05, + "loss": 0.3171, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20472905039787292, + "step": 615, + "valid_targets_mean": 8200.1, + "valid_targets_min": 2509 + }, + { + "epoch": 1.0508474576271187, + "grad_norm": 0.4833955669012435, + "learning_rate": 3.969762096848383e-05, + "loss": 0.3673, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15367567539215088, + "step": 620, + "valid_targets_mean": 7303.2, + "valid_targets_min": 712 + }, + { + "epoch": 1.0593220338983051, + "grad_norm": 0.4180140372553057, + "learning_rate": 3.968280362949042e-05, + "loss": 0.329, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20632800459861755, + "step": 625, + "valid_targets_mean": 9386.4, + "valid_targets_min": 4698 + }, + { + "epoch": 1.0677966101694916, + "grad_norm": 0.40174569986041325, + "learning_rate": 3.9667634777857975e-05, + "loss": 0.3588, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14220260083675385, + "step": 630, + "valid_targets_mean": 8459.8, + "valid_targets_min": 3319 + }, + { + "epoch": 1.076271186440678, + "grad_norm": 0.44484170138321344, + "learning_rate": 3.965211468448505e-05, + "loss": 0.3388, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14559875428676605, + "step": 635, + "valid_targets_mean": 7179.8, + "valid_targets_min": 3830 + }, + { + "epoch": 1.0847457627118644, + "grad_norm": 0.4395541639351123, + "learning_rate": 3.963624362654299e-05, + "loss": 0.3324, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13254770636558533, + "step": 640, + "valid_targets_mean": 7157.9, + "valid_targets_min": 1936 + }, + { + "epoch": 1.0932203389830508, + "grad_norm": 0.4654264001987176, + "learning_rate": 3.962002188747096e-05, + "loss": 0.3234, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28930819034576416, + "step": 645, + "valid_targets_mean": 10538.6, + "valid_targets_min": 2967 + }, + { + "epoch": 1.1016949152542372, + "grad_norm": 0.40719297523344944, + "learning_rate": 3.9603449756970877e-05, + "loss": 0.3219, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09647984802722931, + "step": 650, + "valid_targets_mean": 6410.5, + "valid_targets_min": 2114 + }, + { + "epoch": 1.1101694915254237, + "grad_norm": 0.6812110649265294, + "learning_rate": 3.95865275310023e-05, + "loss": 0.3275, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09337997436523438, + "step": 655, + "valid_targets_mean": 4987.0, + "valid_targets_min": 2152 + }, + { + "epoch": 1.11864406779661, + "grad_norm": 0.4778768969090781, + "learning_rate": 3.9569255511777054e-05, + "loss": 0.3253, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1386423110961914, + "step": 660, + "valid_targets_mean": 6117.6, + "valid_targets_min": 2957 + }, + { + "epoch": 1.1271186440677967, + "grad_norm": 0.4193417013796084, + "learning_rate": 3.955163400775389e-05, + "loss": 0.361, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12261968106031418, + "step": 665, + "valid_targets_mean": 6347.0, + "valid_targets_min": 3535 + }, + { + "epoch": 1.1355932203389831, + "grad_norm": 0.5013613951602334, + "learning_rate": 3.953366333363297e-05, + "loss": 0.3222, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12408879399299622, + "step": 670, + "valid_targets_mean": 6869.2, + "valid_targets_min": 1409 + }, + { + "epoch": 1.1440677966101696, + "grad_norm": 0.4160706590681276, + "learning_rate": 3.9515343810350236e-05, + "loss": 0.3091, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2585446834564209, + "step": 675, + "valid_targets_mean": 11118.4, + "valid_targets_min": 2837 + }, + { + "epoch": 1.152542372881356, + "grad_norm": 0.48357167974115245, + "learning_rate": 3.949667576507168e-05, + "loss": 0.3338, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2446514070034027, + "step": 680, + "valid_targets_mean": 7852.5, + "valid_targets_min": 2865 + }, + { + "epoch": 1.1610169491525424, + "grad_norm": 0.5207580063819728, + "learning_rate": 3.9477659531187484e-05, + "loss": 0.3305, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2768232822418213, + "step": 685, + "valid_targets_mean": 9521.2, + "valid_targets_min": 1901 + }, + { + "epoch": 1.1694915254237288, + "grad_norm": 0.4352619530283247, + "learning_rate": 3.9458295448306134e-05, + "loss": 0.3273, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.169637992978096, + "step": 690, + "valid_targets_mean": 8180.2, + "valid_targets_min": 3197 + }, + { + "epoch": 1.1779661016949152, + "grad_norm": 0.6375401638430952, + "learning_rate": 3.943858386224825e-05, + "loss": 0.3542, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20666490495204926, + "step": 695, + "valid_targets_mean": 7918.8, + "valid_targets_min": 2972 + }, + { + "epoch": 1.1864406779661016, + "grad_norm": 0.5237074435643403, + "learning_rate": 3.941852512504052e-05, + "loss": 0.3069, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16815276443958282, + "step": 700, + "valid_targets_mean": 8423.9, + "valid_targets_min": 3467 + }, + { + "epoch": 1.194915254237288, + "grad_norm": 0.46230638915825684, + "learning_rate": 3.939811959490931e-05, + "loss": 0.3183, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22283053398132324, + "step": 705, + "valid_targets_mean": 11047.0, + "valid_targets_min": 4423 + }, + { + "epoch": 1.2033898305084745, + "grad_norm": 0.4545188486641544, + "learning_rate": 3.937736763627435e-05, + "loss": 0.3157, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19005794823169708, + "step": 710, + "valid_targets_mean": 8591.1, + "valid_targets_min": 3981 + }, + { + "epoch": 1.211864406779661, + "grad_norm": 0.4552644672198827, + "learning_rate": 3.935626961974217e-05, + "loss": 0.3603, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14236797392368317, + "step": 715, + "valid_targets_mean": 6977.0, + "valid_targets_min": 3031 + }, + { + "epoch": 1.2203389830508475, + "grad_norm": 0.46886754247998963, + "learning_rate": 3.933482592209951e-05, + "loss": 0.3314, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26897650957107544, + "step": 720, + "valid_targets_mean": 9310.5, + "valid_targets_min": 3393 + }, + { + "epoch": 1.228813559322034, + "grad_norm": 0.48772266789453395, + "learning_rate": 3.931303692630661e-05, + "loss": 0.3101, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16506057977676392, + "step": 725, + "valid_targets_mean": 7079.0, + "valid_targets_min": 2432 + }, + { + "epoch": 1.2372881355932204, + "grad_norm": 0.42871408585096393, + "learning_rate": 3.92909030214903e-05, + "loss": 0.3268, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11513777822256088, + "step": 730, + "valid_targets_mean": 6985.9, + "valid_targets_min": 3986 + }, + { + "epoch": 1.2457627118644068, + "grad_norm": 0.44587055811958604, + "learning_rate": 3.9268424602937124e-05, + "loss": 0.3199, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17389066517353058, + "step": 735, + "valid_targets_mean": 8847.4, + "valid_targets_min": 2642 + }, + { + "epoch": 1.2542372881355932, + "grad_norm": 0.47861212973477374, + "learning_rate": 3.9245602072086246e-05, + "loss": 0.3732, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10631030052900314, + "step": 740, + "valid_targets_mean": 5761.5, + "valid_targets_min": 4648 + }, + { + "epoch": 1.2627118644067796, + "grad_norm": 0.49947791123701396, + "learning_rate": 3.9222435836522286e-05, + "loss": 0.3373, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1645757257938385, + "step": 745, + "valid_targets_mean": 9582.9, + "valid_targets_min": 1652 + }, + { + "epoch": 1.271186440677966, + "grad_norm": 0.42913688486951385, + "learning_rate": 3.919892630996804e-05, + "loss": 0.3352, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14238014817237854, + "step": 750, + "valid_targets_mean": 6065.2, + "valid_targets_min": 2457 + }, + { + "epoch": 1.2796610169491525, + "grad_norm": 0.4255980165569159, + "learning_rate": 3.9175073912277107e-05, + "loss": 0.305, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11966271698474884, + "step": 755, + "valid_targets_mean": 6778.5, + "valid_targets_min": 3511 + }, + { + "epoch": 1.288135593220339, + "grad_norm": 0.4383294865094197, + "learning_rate": 3.915087906942635e-05, + "loss": 0.3196, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18853090703487396, + "step": 760, + "valid_targets_mean": 7773.5, + "valid_targets_min": 2965 + }, + { + "epoch": 1.2966101694915255, + "grad_norm": 0.42624494152006837, + "learning_rate": 3.912634221350834e-05, + "loss": 0.3482, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20799216628074646, + "step": 765, + "valid_targets_mean": 10677.5, + "valid_targets_min": 2482 + }, + { + "epoch": 1.305084745762712, + "grad_norm": 0.4740167806151876, + "learning_rate": 3.910146378272361e-05, + "loss": 0.316, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1015789806842804, + "step": 770, + "valid_targets_mean": 5372.8, + "valid_targets_min": 2801 + }, + { + "epoch": 1.3135593220338984, + "grad_norm": 0.5006756358318566, + "learning_rate": 3.9076244221372824e-05, + "loss": 0.321, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1526796519756317, + "step": 775, + "valid_targets_mean": 6574.1, + "valid_targets_min": 2460 + }, + { + "epoch": 1.3220338983050848, + "grad_norm": 0.4267845459550884, + "learning_rate": 3.905068397984886e-05, + "loss": 0.3168, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16761890053749084, + "step": 780, + "valid_targets_mean": 8788.9, + "valid_targets_min": 4154 + }, + { + "epoch": 1.3305084745762712, + "grad_norm": 0.41392713104247275, + "learning_rate": 3.9024783514628765e-05, + "loss": 0.3568, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17586758732795715, + "step": 785, + "valid_targets_mean": 10475.6, + "valid_targets_min": 3622 + }, + { + "epoch": 1.3389830508474576, + "grad_norm": 0.5337105064121502, + "learning_rate": 3.899854328826559e-05, + "loss": 0.3425, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0900270864367485, + "step": 790, + "valid_targets_mean": 4031.1, + "valid_targets_min": 1420 + }, + { + "epoch": 1.347457627118644, + "grad_norm": 0.4488578510290259, + "learning_rate": 3.897196376938013e-05, + "loss": 0.318, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17309337854385376, + "step": 795, + "valid_targets_mean": 6397.8, + "valid_targets_min": 2425 + }, + { + "epoch": 1.3559322033898304, + "grad_norm": 0.39620489867483555, + "learning_rate": 3.8945045432652575e-05, + "loss": 0.3404, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08745632320642471, + "step": 800, + "valid_targets_mean": 6055.2, + "valid_targets_min": 3550 + }, + { + "epoch": 1.3644067796610169, + "grad_norm": 0.42992870791787763, + "learning_rate": 3.8917788758814e-05, + "loss": 0.3174, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13015861809253693, + "step": 805, + "valid_targets_mean": 7460.4, + "valid_targets_min": 3055 + }, + { + "epoch": 1.3728813559322033, + "grad_norm": 0.40354106059339273, + "learning_rate": 3.889019423463783e-05, + "loss": 0.3149, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09485109150409698, + "step": 810, + "valid_targets_mean": 6865.6, + "valid_targets_min": 2911 + }, + { + "epoch": 1.3813559322033897, + "grad_norm": 0.4686368291789137, + "learning_rate": 3.8862262352931075e-05, + "loss": 0.3294, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1537308543920517, + "step": 815, + "valid_targets_mean": 6440.1, + "valid_targets_min": 2110 + }, + { + "epoch": 1.3898305084745763, + "grad_norm": 0.4408642589858194, + "learning_rate": 3.88339936125256e-05, + "loss": 0.3157, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17375317215919495, + "step": 820, + "valid_targets_mean": 8280.6, + "valid_targets_min": 2743 + }, + { + "epoch": 1.3983050847457628, + "grad_norm": 0.46062681778063724, + "learning_rate": 3.8805388518269184e-05, + "loss": 0.2962, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17423167824745178, + "step": 825, + "valid_targets_mean": 8636.1, + "valid_targets_min": 4169 + }, + { + "epoch": 1.4067796610169492, + "grad_norm": 0.4486860590784266, + "learning_rate": 3.877644758101648e-05, + "loss": 0.3156, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17933771014213562, + "step": 830, + "valid_targets_mean": 8570.9, + "valid_targets_min": 1893 + }, + { + "epoch": 1.4152542372881356, + "grad_norm": 0.4719151934288519, + "learning_rate": 3.8747171317619955e-05, + "loss": 0.3143, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09397554397583008, + "step": 835, + "valid_targets_mean": 5133.0, + "valid_targets_min": 2254 + }, + { + "epoch": 1.423728813559322, + "grad_norm": 0.4667473106135975, + "learning_rate": 3.871756025092059e-05, + "loss": 0.3479, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1407933086156845, + "step": 840, + "valid_targets_mean": 6628.8, + "valid_targets_min": 2795 + }, + { + "epoch": 1.4322033898305084, + "grad_norm": 0.4412306378722383, + "learning_rate": 3.868761490973859e-05, + "loss": 0.307, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1313735395669937, + "step": 845, + "valid_targets_mean": 6751.1, + "valid_targets_min": 3064 + }, + { + "epoch": 1.4406779661016949, + "grad_norm": 0.43177538465939785, + "learning_rate": 3.8657335828863924e-05, + "loss": 0.3316, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1634959578514099, + "step": 850, + "valid_targets_mean": 7480.4, + "valid_targets_min": 3151 + }, + { + "epoch": 1.4491525423728815, + "grad_norm": 0.43807884753609994, + "learning_rate": 3.8626723549046774e-05, + "loss": 0.3268, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12339450418949127, + "step": 855, + "valid_targets_mean": 6659.2, + "valid_targets_min": 2840 + }, + { + "epoch": 1.457627118644068, + "grad_norm": 0.4727987965750298, + "learning_rate": 3.859577861698787e-05, + "loss": 0.2922, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15785086154937744, + "step": 860, + "valid_targets_mean": 7509.2, + "valid_targets_min": 3028 + }, + { + "epoch": 1.4661016949152543, + "grad_norm": 0.4384303554477187, + "learning_rate": 3.856450158532875e-05, + "loss": 0.323, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1519169807434082, + "step": 865, + "valid_targets_mean": 7232.5, + "valid_targets_min": 3849 + }, + { + "epoch": 1.4745762711864407, + "grad_norm": 0.49727270409272106, + "learning_rate": 3.853289301264187e-05, + "loss": 0.3358, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1139516681432724, + "step": 870, + "valid_targets_mean": 6231.1, + "valid_targets_min": 1612 + }, + { + "epoch": 1.4830508474576272, + "grad_norm": 0.4426633905595123, + "learning_rate": 3.850095346342064e-05, + "loss": 0.3273, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16769997775554657, + "step": 875, + "valid_targets_mean": 7338.5, + "valid_targets_min": 3859 + }, + { + "epoch": 1.4915254237288136, + "grad_norm": 0.4593726038548315, + "learning_rate": 3.84686835080693e-05, + "loss": 0.3099, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11144979298114777, + "step": 880, + "valid_targets_mean": 6119.1, + "valid_targets_min": 3785 + }, + { + "epoch": 1.5, + "grad_norm": 0.49604203241194217, + "learning_rate": 3.843608372289283e-05, + "loss": 0.3271, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15156549215316772, + "step": 885, + "valid_targets_mean": 7399.4, + "valid_targets_min": 3299 + }, + { + "epoch": 1.5084745762711864, + "grad_norm": 0.545080093883971, + "learning_rate": 3.8403154690086564e-05, + "loss": 0.3361, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12989340722560883, + "step": 890, + "valid_targets_mean": 7236.0, + "valid_targets_min": 3225 + }, + { + "epoch": 1.5169491525423728, + "grad_norm": 0.45075511600659357, + "learning_rate": 3.836989699772582e-05, + "loss": 0.3229, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1870659589767456, + "step": 895, + "valid_targets_mean": 7038.4, + "valid_targets_min": 2187 + }, + { + "epoch": 1.5254237288135593, + "grad_norm": 0.47217639934643396, + "learning_rate": 3.8336311239755424e-05, + "loss": 0.3622, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15166038274765015, + "step": 900, + "valid_targets_mean": 7118.4, + "valid_targets_min": 2202 + }, + { + "epoch": 1.5338983050847457, + "grad_norm": 0.41709638199225046, + "learning_rate": 3.830239801597907e-05, + "loss": 0.3125, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14974796772003174, + "step": 905, + "valid_targets_mean": 7620.0, + "valid_targets_min": 2350 + }, + { + "epoch": 1.542372881355932, + "grad_norm": 0.41637607079903677, + "learning_rate": 3.826815793204863e-05, + "loss": 0.3013, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1806432008743286, + "step": 910, + "valid_targets_mean": 9408.8, + "valid_targets_min": 4175 + }, + { + "epoch": 1.5508474576271185, + "grad_norm": 0.5361115971794117, + "learning_rate": 3.823359159945332e-05, + "loss": 0.3193, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1987413465976715, + "step": 915, + "valid_targets_mean": 8330.9, + "valid_targets_min": 3259 + }, + { + "epoch": 1.559322033898305, + "grad_norm": 0.44132736535406036, + "learning_rate": 3.8198699635508805e-05, + "loss": 0.2982, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18994596600532532, + "step": 920, + "valid_targets_mean": 9074.9, + "valid_targets_min": 3436 + }, + { + "epoch": 1.5677966101694916, + "grad_norm": 0.3816717467254405, + "learning_rate": 3.816348266334614e-05, + "loss": 0.319, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12687310576438904, + "step": 925, + "valid_targets_mean": 8785.6, + "valid_targets_min": 4974 + }, + { + "epoch": 1.576271186440678, + "grad_norm": 0.4412025073597514, + "learning_rate": 3.812794131190066e-05, + "loss": 0.3306, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13384410738945007, + "step": 930, + "valid_targets_mean": 7849.2, + "valid_targets_min": 3985 + }, + { + "epoch": 1.5847457627118644, + "grad_norm": 0.396693457802134, + "learning_rate": 3.8092076215900765e-05, + "loss": 0.303, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20873287320137024, + "step": 935, + "valid_targets_mean": 11243.4, + "valid_targets_min": 5339 + }, + { + "epoch": 1.5932203389830508, + "grad_norm": 0.4285610045500551, + "learning_rate": 3.805588801585654e-05, + "loss": 0.3188, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08912678807973862, + "step": 940, + "valid_targets_mean": 4676.0, + "valid_targets_min": 2847 + }, + { + "epoch": 1.6016949152542372, + "grad_norm": 0.41295836604849834, + "learning_rate": 3.801937735804838e-05, + "loss": 0.3439, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17002055048942566, + "step": 945, + "valid_targets_mean": 8253.2, + "valid_targets_min": 2292 + }, + { + "epoch": 1.6101694915254239, + "grad_norm": 0.4110467780511449, + "learning_rate": 3.798254489451539e-05, + "loss": 0.3218, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26079848408699036, + "step": 950, + "valid_targets_mean": 11661.2, + "valid_targets_min": 2093 + }, + { + "epoch": 1.6186440677966103, + "grad_norm": 0.5284185078380007, + "learning_rate": 3.794539128304374e-05, + "loss": 0.3327, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21993231773376465, + "step": 955, + "valid_targets_mean": 10140.0, + "valid_targets_min": 4917 + }, + { + "epoch": 1.6271186440677967, + "grad_norm": 0.43465978137133837, + "learning_rate": 3.790791718715498e-05, + "loss": 0.3362, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16745583713054657, + "step": 960, + "valid_targets_mean": 7656.5, + "valid_targets_min": 2997 + }, + { + "epoch": 1.6355932203389831, + "grad_norm": 0.46353679599089426, + "learning_rate": 3.7870123276094134e-05, + "loss": 0.3063, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14307042956352234, + "step": 965, + "valid_targets_mean": 6720.0, + "valid_targets_min": 2036 + }, + { + "epoch": 1.6440677966101696, + "grad_norm": 0.42508115955425385, + "learning_rate": 3.783201022481775e-05, + "loss": 0.307, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16600486636161804, + "step": 970, + "valid_targets_mean": 7660.0, + "valid_targets_min": 4016 + }, + { + "epoch": 1.652542372881356, + "grad_norm": 0.47460145753384014, + "learning_rate": 3.7793578713981876e-05, + "loss": 0.2713, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17931526899337769, + "step": 975, + "valid_targets_mean": 7207.9, + "valid_targets_min": 2066 + }, + { + "epoch": 1.6610169491525424, + "grad_norm": 0.4565761001462879, + "learning_rate": 3.775482942992989e-05, + "loss": 0.296, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10052239894866943, + "step": 980, + "valid_targets_mean": 5350.4, + "valid_targets_min": 3691 + }, + { + "epoch": 1.6694915254237288, + "grad_norm": 0.404024020976862, + "learning_rate": 3.771576306468022e-05, + "loss": 0.331, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13798417150974274, + "step": 985, + "valid_targets_mean": 8586.6, + "valid_targets_min": 2541 + }, + { + "epoch": 1.6779661016949152, + "grad_norm": 0.46889190610408676, + "learning_rate": 3.7676380315914025e-05, + "loss": 0.3316, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09154243022203445, + "step": 990, + "valid_targets_mean": 5740.6, + "valid_targets_min": 1962 + }, + { + "epoch": 1.6864406779661016, + "grad_norm": 0.4064487350790923, + "learning_rate": 3.7636681886962724e-05, + "loss": 0.3665, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15788796544075012, + "step": 995, + "valid_targets_mean": 7709.4, + "valid_targets_min": 2560 + }, + { + "epoch": 1.694915254237288, + "grad_norm": 0.7897794567174825, + "learning_rate": 3.759666848679539e-05, + "loss": 0.304, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15532286465168, + "step": 1000, + "valid_targets_mean": 9089.0, + "valid_targets_min": 5046 + }, + { + "epoch": 1.7033898305084745, + "grad_norm": 0.6035847206124464, + "learning_rate": 3.755634083000617e-05, + "loss": 0.3292, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1320587694644928, + "step": 1005, + "valid_targets_mean": 6896.9, + "valid_targets_min": 2965 + }, + { + "epoch": 1.711864406779661, + "grad_norm": 0.41483149367263833, + "learning_rate": 3.751569963680146e-05, + "loss": 0.2949, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20763173699378967, + "step": 1010, + "valid_targets_mean": 9600.8, + "valid_targets_min": 5071 + }, + { + "epoch": 1.7203389830508473, + "grad_norm": 0.45501656641530847, + "learning_rate": 3.747474563298705e-05, + "loss": 0.3288, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13265684247016907, + "step": 1015, + "valid_targets_mean": 6442.4, + "valid_targets_min": 1875 + }, + { + "epoch": 1.7288135593220337, + "grad_norm": 0.5257033113939008, + "learning_rate": 3.743347954995519e-05, + "loss": 0.3268, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13818372786045074, + "step": 1020, + "valid_targets_mean": 6209.2, + "valid_targets_min": 3843 + }, + { + "epoch": 1.7372881355932204, + "grad_norm": 0.4383597245709914, + "learning_rate": 3.7391902124671516e-05, + "loss": 0.3244, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19095399975776672, + "step": 1025, + "valid_targets_mean": 8865.8, + "valid_targets_min": 3685 + }, + { + "epoch": 1.7457627118644068, + "grad_norm": 0.39724550405667364, + "learning_rate": 3.7350014099661874e-05, + "loss": 0.3066, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20521703362464905, + "step": 1030, + "valid_targets_mean": 9690.9, + "valid_targets_min": 3548 + }, + { + "epoch": 1.7542372881355932, + "grad_norm": 0.39927522299758583, + "learning_rate": 3.730781622299907e-05, + "loss": 0.3211, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17346695065498352, + "step": 1035, + "valid_targets_mean": 8075.1, + "valid_targets_min": 3805 + }, + { + "epoch": 1.7627118644067796, + "grad_norm": 0.4350255084725687, + "learning_rate": 3.7265309248289516e-05, + "loss": 0.3455, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16887761652469635, + "step": 1040, + "valid_targets_mean": 7783.6, + "valid_targets_min": 3913 + }, + { + "epoch": 1.7711864406779663, + "grad_norm": 0.421663580685689, + "learning_rate": 3.7222493934659765e-05, + "loss": 0.3466, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1530277132987976, + "step": 1045, + "valid_targets_mean": 9355.5, + "valid_targets_min": 4980 + }, + { + "epoch": 1.7796610169491527, + "grad_norm": 0.4369588066271297, + "learning_rate": 3.717937104674296e-05, + "loss": 0.2978, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13133104145526886, + "step": 1050, + "valid_targets_mean": 7752.2, + "valid_targets_min": 4407 + }, + { + "epoch": 1.788135593220339, + "grad_norm": 0.4368294132363595, + "learning_rate": 3.713594135466515e-05, + "loss": 0.3225, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17027533054351807, + "step": 1055, + "valid_targets_mean": 8704.5, + "valid_targets_min": 2855 + }, + { + "epoch": 1.7966101694915255, + "grad_norm": 0.43449669149693804, + "learning_rate": 3.7092205634031595e-05, + "loss": 0.3478, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08701007068157196, + "step": 1060, + "valid_targets_mean": 4998.2, + "valid_targets_min": 2374 + }, + { + "epoch": 1.805084745762712, + "grad_norm": 0.39372753859603943, + "learning_rate": 3.704816466591286e-05, + "loss": 0.3163, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12855243682861328, + "step": 1065, + "valid_targets_mean": 7622.5, + "valid_targets_min": 4093 + }, + { + "epoch": 1.8135593220338984, + "grad_norm": 0.3964647607911203, + "learning_rate": 3.700381923683087e-05, + "loss": 0.3364, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1131635457277298, + "step": 1070, + "valid_targets_mean": 7209.1, + "valid_targets_min": 2797 + }, + { + "epoch": 1.8220338983050848, + "grad_norm": 0.4159371295645834, + "learning_rate": 3.695917013874491e-05, + "loss": 0.2832, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13864587247371674, + "step": 1075, + "valid_targets_mean": 7083.8, + "valid_targets_min": 3551 + }, + { + "epoch": 1.8305084745762712, + "grad_norm": 0.41132981890721415, + "learning_rate": 3.691421816903744e-05, + "loss": 0.3373, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20368866622447968, + "step": 1080, + "valid_targets_mean": 8503.0, + "valid_targets_min": 1795 + }, + { + "epoch": 1.8389830508474576, + "grad_norm": 0.43908713798714083, + "learning_rate": 3.686896413049985e-05, + "loss": 0.2886, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12140090763568878, + "step": 1085, + "valid_targets_mean": 6773.4, + "valid_targets_min": 3364 + }, + { + "epoch": 1.847457627118644, + "grad_norm": 0.4338791941921327, + "learning_rate": 3.6823408831318154e-05, + "loss": 0.3105, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16254982352256775, + "step": 1090, + "valid_targets_mean": 7966.9, + "valid_targets_min": 2532 + }, + { + "epoch": 1.8559322033898304, + "grad_norm": 0.41721828273489936, + "learning_rate": 3.677755308505854e-05, + "loss": 0.3423, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1637614667415619, + "step": 1095, + "valid_targets_mean": 7360.9, + "valid_targets_min": 3864 + }, + { + "epoch": 1.8644067796610169, + "grad_norm": 0.4152523100279547, + "learning_rate": 3.673139771065282e-05, + "loss": 0.3229, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11550319194793701, + "step": 1100, + "valid_targets_mean": 6838.5, + "valid_targets_min": 3869 + }, + { + "epoch": 1.8728813559322033, + "grad_norm": 0.37899639866690693, + "learning_rate": 3.6684943532383866e-05, + "loss": 0.3448, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18879902362823486, + "step": 1105, + "valid_targets_mean": 10441.6, + "valid_targets_min": 3589 + }, + { + "epoch": 1.8813559322033897, + "grad_norm": 0.40369311396663893, + "learning_rate": 3.663819137987081e-05, + "loss": 0.3342, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16418354213237762, + "step": 1110, + "valid_targets_mean": 9130.6, + "valid_targets_min": 6228 + }, + { + "epoch": 1.8898305084745761, + "grad_norm": 0.4216701104223837, + "learning_rate": 3.65911420880543e-05, + "loss": 0.3106, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2091543972492218, + "step": 1115, + "valid_targets_mean": 8209.8, + "valid_targets_min": 3449 + }, + { + "epoch": 1.8983050847457628, + "grad_norm": 0.39934323363745766, + "learning_rate": 3.654379649718153e-05, + "loss": 0.3059, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16052965819835663, + "step": 1120, + "valid_targets_mean": 8141.9, + "valid_targets_min": 2341 + }, + { + "epoch": 1.9067796610169492, + "grad_norm": 0.425180656486338, + "learning_rate": 3.649615545279127e-05, + "loss": 0.3443, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23255954682826996, + "step": 1125, + "valid_targets_mean": 8977.1, + "valid_targets_min": 1589 + }, + { + "epoch": 1.9152542372881356, + "grad_norm": 0.4134843945605497, + "learning_rate": 3.644821980569876e-05, + "loss": 0.3293, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18696650862693787, + "step": 1130, + "valid_targets_mean": 9344.6, + "valid_targets_min": 2897 + }, + { + "epoch": 1.923728813559322, + "grad_norm": 0.4247315776579201, + "learning_rate": 3.639999041198051e-05, + "loss": 0.3106, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15916836261749268, + "step": 1135, + "valid_targets_mean": 7757.0, + "valid_targets_min": 2240 + }, + { + "epoch": 1.9322033898305084, + "grad_norm": 0.4285608095339475, + "learning_rate": 3.635146813295902e-05, + "loss": 0.3347, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12798747420310974, + "step": 1140, + "valid_targets_mean": 7018.9, + "valid_targets_min": 3392 + }, + { + "epoch": 1.940677966101695, + "grad_norm": 0.4320951231170634, + "learning_rate": 3.6302653835187366e-05, + "loss": 0.3154, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2193724513053894, + "step": 1145, + "valid_targets_mean": 8454.5, + "valid_targets_min": 4385 + }, + { + "epoch": 1.9491525423728815, + "grad_norm": 0.3679163355593773, + "learning_rate": 3.625354839043377e-05, + "loss": 0.2863, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2157258540391922, + "step": 1150, + "valid_targets_mean": 12249.4, + "valid_targets_min": 4241 + }, + { + "epoch": 1.957627118644068, + "grad_norm": 0.4102455825218708, + "learning_rate": 3.620415267566601e-05, + "loss": 0.3306, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12105512619018555, + "step": 1155, + "valid_targets_mean": 7516.5, + "valid_targets_min": 3222 + }, + { + "epoch": 1.9661016949152543, + "grad_norm": 0.4175220017891001, + "learning_rate": 3.615446757303575e-05, + "loss": 0.3221, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17339207231998444, + "step": 1160, + "valid_targets_mean": 8759.4, + "valid_targets_min": 2960 + }, + { + "epoch": 1.9745762711864407, + "grad_norm": 0.44844776216498816, + "learning_rate": 3.610449396986281e-05, + "loss": 0.3084, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09378059208393097, + "step": 1165, + "valid_targets_mean": 5834.0, + "valid_targets_min": 2096 + }, + { + "epoch": 1.9830508474576272, + "grad_norm": 0.44812744257447257, + "learning_rate": 3.6054232758619274e-05, + "loss": 0.3161, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1947910189628601, + "step": 1170, + "valid_targets_mean": 7453.2, + "valid_targets_min": 2451 + }, + { + "epoch": 1.9915254237288136, + "grad_norm": 0.4242232674193107, + "learning_rate": 3.600368483691361e-05, + "loss": 0.3279, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13258054852485657, + "step": 1175, + "valid_targets_mean": 7682.2, + "valid_targets_min": 2492 + }, + { + "epoch": 2.0, + "grad_norm": 0.45289022894013076, + "learning_rate": 3.59528511074746e-05, + "loss": 0.299, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12481173872947693, + "step": 1180, + "valid_targets_mean": 5148.2, + "valid_targets_min": 1999 + }, + { + "epoch": 2.0084745762711864, + "grad_norm": 0.47796518296033785, + "learning_rate": 3.5901732478135235e-05, + "loss": 0.3136, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15180028975009918, + "step": 1185, + "valid_targets_mean": 6321.6, + "valid_targets_min": 2236 + }, + { + "epoch": 2.016949152542373, + "grad_norm": 0.438352359074808, + "learning_rate": 3.5850329861816475e-05, + "loss": 0.2817, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12889432907104492, + "step": 1190, + "valid_targets_mean": 6916.6, + "valid_targets_min": 2771 + }, + { + "epoch": 2.0254237288135593, + "grad_norm": 0.4126031654763985, + "learning_rate": 3.5798644176511e-05, + "loss": 0.2969, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09737379848957062, + "step": 1195, + "valid_targets_mean": 6256.8, + "valid_targets_min": 3050 + }, + { + "epoch": 2.0338983050847457, + "grad_norm": 0.408111961548012, + "learning_rate": 3.574667634526676e-05, + "loss": 0.3122, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14440008997917175, + "step": 1200, + "valid_targets_mean": 7384.1, + "valid_targets_min": 2779 + }, + { + "epoch": 2.042372881355932, + "grad_norm": 0.455628995610143, + "learning_rate": 3.5694427296170514e-05, + "loss": 0.3048, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16236944496631622, + "step": 1205, + "valid_targets_mean": 8072.6, + "valid_targets_min": 4463 + }, + { + "epoch": 2.0508474576271185, + "grad_norm": 0.43337894990516485, + "learning_rate": 3.564189796233125e-05, + "loss": 0.3144, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22974911332130432, + "step": 1210, + "valid_targets_mean": 9636.9, + "valid_targets_min": 3097 + }, + { + "epoch": 2.059322033898305, + "grad_norm": 0.40732481179936597, + "learning_rate": 3.5589089281863547e-05, + "loss": 0.2969, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1029449924826622, + "step": 1215, + "valid_targets_mean": 7567.2, + "valid_targets_min": 2751 + }, + { + "epoch": 2.0677966101694913, + "grad_norm": 0.4252300433877439, + "learning_rate": 3.553600219787079e-05, + "loss": 0.2906, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19273892045021057, + "step": 1220, + "valid_targets_mean": 8599.9, + "valid_targets_min": 3639 + }, + { + "epoch": 2.0762711864406778, + "grad_norm": 0.4546211585832868, + "learning_rate": 3.5482637658428315e-05, + "loss": 0.2949, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23350149393081665, + "step": 1225, + "valid_targets_mean": 9294.4, + "valid_targets_min": 1933 + }, + { + "epoch": 2.084745762711864, + "grad_norm": 0.4145817713099008, + "learning_rate": 3.542899661656653e-05, + "loss": 0.3212, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1794952154159546, + "step": 1230, + "valid_targets_mean": 9705.6, + "valid_targets_min": 4885 + }, + { + "epoch": 2.093220338983051, + "grad_norm": 0.5271058668855069, + "learning_rate": 3.5375080030253826e-05, + "loss": 0.3432, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12348256260156631, + "step": 1235, + "valid_targets_mean": 6719.0, + "valid_targets_min": 3708 + }, + { + "epoch": 2.1016949152542375, + "grad_norm": 0.4232353398881956, + "learning_rate": 3.532088886237956e-05, + "loss": 0.3022, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10980045795440674, + "step": 1240, + "valid_targets_mean": 6338.2, + "valid_targets_min": 3309 + }, + { + "epoch": 2.110169491525424, + "grad_norm": 0.45183791890941466, + "learning_rate": 3.5266424080736765e-05, + "loss": 0.3079, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15499433875083923, + "step": 1245, + "valid_targets_mean": 7531.9, + "valid_targets_min": 3690 + }, + { + "epoch": 2.1186440677966103, + "grad_norm": 0.43508072611158927, + "learning_rate": 3.521168665800491e-05, + "loss": 0.3222, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2509422302246094, + "step": 1250, + "valid_targets_mean": 13284.1, + "valid_targets_min": 5966 + }, + { + "epoch": 2.1271186440677967, + "grad_norm": 0.42735089982934016, + "learning_rate": 3.515667757173254e-05, + "loss": 0.2953, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13675671815872192, + "step": 1255, + "valid_targets_mean": 7142.9, + "valid_targets_min": 2413 + }, + { + "epoch": 2.135593220338983, + "grad_norm": 0.40760862132146264, + "learning_rate": 3.5101397804319794e-05, + "loss": 0.2859, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17705723643302917, + "step": 1260, + "valid_targets_mean": 8875.0, + "valid_targets_min": 3101 + }, + { + "epoch": 2.1440677966101696, + "grad_norm": 0.4900166239838904, + "learning_rate": 3.5045848343000876e-05, + "loss": 0.2858, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1725788712501526, + "step": 1265, + "valid_targets_mean": 7732.4, + "valid_targets_min": 2984 + }, + { + "epoch": 2.152542372881356, + "grad_norm": 0.428816419240488, + "learning_rate": 3.4990030179826414e-05, + "loss": 0.3253, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20709286630153656, + "step": 1270, + "valid_targets_mean": 10128.1, + "valid_targets_min": 4459 + }, + { + "epoch": 2.1610169491525424, + "grad_norm": 0.40014932477968135, + "learning_rate": 3.493394431164576e-05, + "loss": 0.2927, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15721966326236725, + "step": 1275, + "valid_targets_mean": 8368.9, + "valid_targets_min": 4914 + }, + { + "epoch": 2.169491525423729, + "grad_norm": 0.460349336503394, + "learning_rate": 3.4877591740089144e-05, + "loss": 0.3034, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12180677056312561, + "step": 1280, + "valid_targets_mean": 6484.2, + "valid_targets_min": 2984 + }, + { + "epoch": 2.1779661016949152, + "grad_norm": 0.4167414151848438, + "learning_rate": 3.482097347154986e-05, + "loss": 0.2945, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15773698687553406, + "step": 1285, + "valid_targets_mean": 8676.9, + "valid_targets_min": 2724 + }, + { + "epoch": 2.1864406779661016, + "grad_norm": 0.4119767997336977, + "learning_rate": 3.476409051716621e-05, + "loss": 0.3075, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19150680303573608, + "step": 1290, + "valid_targets_mean": 9972.0, + "valid_targets_min": 4367 + }, + { + "epoch": 2.194915254237288, + "grad_norm": 0.46842012389861176, + "learning_rate": 3.470694389280352e-05, + "loss": 0.2894, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13265065848827362, + "step": 1295, + "valid_targets_mean": 6506.4, + "valid_targets_min": 2591 + }, + { + "epoch": 2.2033898305084745, + "grad_norm": 0.5070785490329287, + "learning_rate": 3.464953461903593e-05, + "loss": 0.2815, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16730618476867676, + "step": 1300, + "valid_targets_mean": 7640.6, + "valid_targets_min": 2556 + }, + { + "epoch": 2.211864406779661, + "grad_norm": 0.44925860012957636, + "learning_rate": 3.459186372112824e-05, + "loss": 0.3067, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12842459976673126, + "step": 1305, + "valid_targets_mean": 6798.6, + "valid_targets_min": 3979 + }, + { + "epoch": 2.2203389830508473, + "grad_norm": 0.41138242525433244, + "learning_rate": 3.453393222901753e-05, + "loss": 0.3239, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09415019303560257, + "step": 1310, + "valid_targets_mean": 7214.1, + "valid_targets_min": 2008 + }, + { + "epoch": 2.2288135593220337, + "grad_norm": 0.41131324862852436, + "learning_rate": 3.44757411772948e-05, + "loss": 0.3134, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.173304945230484, + "step": 1315, + "valid_targets_mean": 8934.2, + "valid_targets_min": 3731 + }, + { + "epoch": 2.23728813559322, + "grad_norm": 0.47453310588934633, + "learning_rate": 3.441729160518652e-05, + "loss": 0.326, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20205450057983398, + "step": 1320, + "valid_targets_mean": 8631.2, + "valid_targets_min": 3796 + }, + { + "epoch": 2.2457627118644066, + "grad_norm": 0.43201686834502273, + "learning_rate": 3.435858455653601e-05, + "loss": 0.3064, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13337936997413635, + "step": 1325, + "valid_targets_mean": 7937.0, + "valid_targets_min": 2699 + }, + { + "epoch": 2.2542372881355934, + "grad_norm": 0.458779232154746, + "learning_rate": 3.429962107978485e-05, + "loss": 0.3096, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1039549931883812, + "step": 1330, + "valid_targets_mean": 5822.1, + "valid_targets_min": 2106 + }, + { + "epoch": 2.26271186440678, + "grad_norm": 0.40314998050323314, + "learning_rate": 3.424040222795412e-05, + "loss": 0.3012, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10799141228199005, + "step": 1335, + "valid_targets_mean": 6850.5, + "valid_targets_min": 3619 + }, + { + "epoch": 2.2711864406779663, + "grad_norm": 0.4249827679361363, + "learning_rate": 3.418092905862563e-05, + "loss": 0.2919, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1282862275838852, + "step": 1340, + "valid_targets_mean": 7501.6, + "valid_targets_min": 4154 + }, + { + "epoch": 2.2796610169491527, + "grad_norm": 0.45225084379688923, + "learning_rate": 3.412120263392301e-05, + "loss": 0.2935, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15831294655799866, + "step": 1345, + "valid_targets_mean": 8395.9, + "valid_targets_min": 5077 + }, + { + "epoch": 2.288135593220339, + "grad_norm": 0.4323979115648768, + "learning_rate": 3.406122402049272e-05, + "loss": 0.3187, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1440098136663437, + "step": 1350, + "valid_targets_mean": 8358.2, + "valid_targets_min": 3033 + }, + { + "epoch": 2.2966101694915255, + "grad_norm": 0.44798843437203717, + "learning_rate": 3.400099428948505e-05, + "loss": 0.2964, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24259638786315918, + "step": 1355, + "valid_targets_mean": 9828.9, + "valid_targets_min": 3934 + }, + { + "epoch": 2.305084745762712, + "grad_norm": 0.4118065309385498, + "learning_rate": 3.394051451653496e-05, + "loss": 0.2987, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12573987245559692, + "step": 1360, + "valid_targets_mean": 7931.0, + "valid_targets_min": 5094 + }, + { + "epoch": 2.3135593220338984, + "grad_norm": 0.43851923519918656, + "learning_rate": 3.3879785781742875e-05, + "loss": 0.3164, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18017522990703583, + "step": 1365, + "valid_targets_mean": 8832.6, + "valid_targets_min": 3053 + }, + { + "epoch": 2.3220338983050848, + "grad_norm": 0.49539123931874524, + "learning_rate": 3.381880916965541e-05, + "loss": 0.2939, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10733641684055328, + "step": 1370, + "valid_targets_mean": 5227.6, + "valid_targets_min": 2791 + }, + { + "epoch": 2.330508474576271, + "grad_norm": 0.512139157052037, + "learning_rate": 3.3757585769245964e-05, + "loss": 0.312, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.151132732629776, + "step": 1375, + "valid_targets_mean": 7262.0, + "valid_targets_min": 3945 + }, + { + "epoch": 2.3389830508474576, + "grad_norm": 0.4416566028201391, + "learning_rate": 3.3696116673895314e-05, + "loss": 0.3211, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2037435919046402, + "step": 1380, + "valid_targets_mean": 9578.2, + "valid_targets_min": 3736 + }, + { + "epoch": 2.347457627118644, + "grad_norm": 0.45082149557407764, + "learning_rate": 3.363440298137207e-05, + "loss": 0.3071, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12679685652256012, + "step": 1385, + "valid_targets_mean": 6039.9, + "valid_targets_min": 2300 + }, + { + "epoch": 2.3559322033898304, + "grad_norm": 0.4421724624356205, + "learning_rate": 3.357244579381306e-05, + "loss": 0.2908, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14652232825756073, + "step": 1390, + "valid_targets_mean": 7244.0, + "valid_targets_min": 1903 + }, + { + "epoch": 2.364406779661017, + "grad_norm": 0.4495061538438427, + "learning_rate": 3.351024621770369e-05, + "loss": 0.2983, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0919191762804985, + "step": 1395, + "valid_targets_mean": 5043.9, + "valid_targets_min": 2452 + }, + { + "epoch": 2.3728813559322033, + "grad_norm": 0.45212052889171317, + "learning_rate": 3.34478053638581e-05, + "loss": 0.2859, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14459501206874847, + "step": 1400, + "valid_targets_mean": 7165.5, + "valid_targets_min": 1936 + }, + { + "epoch": 2.3813559322033897, + "grad_norm": 0.45753710310314344, + "learning_rate": 3.3385124347399415e-05, + "loss": 0.2757, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11004475504159927, + "step": 1405, + "valid_targets_mean": 7322.9, + "valid_targets_min": 2350 + }, + { + "epoch": 2.389830508474576, + "grad_norm": 0.4527197832006006, + "learning_rate": 3.33222042877398e-05, + "loss": 0.301, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17083138227462769, + "step": 1410, + "valid_targets_mean": 7809.4, + "valid_targets_min": 2393 + }, + { + "epoch": 2.3983050847457625, + "grad_norm": 0.3772050754545617, + "learning_rate": 3.325904630856042e-05, + "loss": 0.2956, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18102893233299255, + "step": 1415, + "valid_targets_mean": 10666.2, + "valid_targets_min": 3513 + }, + { + "epoch": 2.406779661016949, + "grad_norm": 0.4563452741739858, + "learning_rate": 3.319565153779146e-05, + "loss": 0.3467, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26052290201187134, + "step": 1420, + "valid_targets_mean": 10017.8, + "valid_targets_min": 5124 + }, + { + "epoch": 2.415254237288136, + "grad_norm": 0.46401872953783496, + "learning_rate": 3.31320211075919e-05, + "loss": 0.3201, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1795731782913208, + "step": 1425, + "valid_targets_mean": 7820.4, + "valid_targets_min": 2278 + }, + { + "epoch": 2.423728813559322, + "grad_norm": 0.4298768255585762, + "learning_rate": 3.306815615432936e-05, + "loss": 0.3383, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1531204879283905, + "step": 1430, + "valid_targets_mean": 8088.8, + "valid_targets_min": 2989 + }, + { + "epoch": 2.4322033898305087, + "grad_norm": 0.42943975120474337, + "learning_rate": 3.300405781855975e-05, + "loss": 0.2942, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19165225327014923, + "step": 1435, + "valid_targets_mean": 9201.4, + "valid_targets_min": 6019 + }, + { + "epoch": 2.440677966101695, + "grad_norm": 0.3977047765538059, + "learning_rate": 3.2939727245006956e-05, + "loss": 0.2999, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15969790518283844, + "step": 1440, + "valid_targets_mean": 8977.9, + "valid_targets_min": 2996 + }, + { + "epoch": 2.4491525423728815, + "grad_norm": 0.43392603484157843, + "learning_rate": 3.2875165582542347e-05, + "loss": 0.3049, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09724732488393784, + "step": 1445, + "valid_targets_mean": 6136.5, + "valid_targets_min": 3622 + }, + { + "epoch": 2.457627118644068, + "grad_norm": 0.39026794378770674, + "learning_rate": 3.281037398416427e-05, + "loss": 0.2698, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12890513241291046, + "step": 1450, + "valid_targets_mean": 6924.1, + "valid_targets_min": 2394 + }, + { + "epoch": 2.4661016949152543, + "grad_norm": 0.4242919077715597, + "learning_rate": 3.2745353606977506e-05, + "loss": 0.3159, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1096186563372612, + "step": 1455, + "valid_targets_mean": 7928.4, + "valid_targets_min": 3062 + }, + { + "epoch": 2.4745762711864407, + "grad_norm": 0.4289426904620235, + "learning_rate": 3.268010561217253e-05, + "loss": 0.308, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13930077850818634, + "step": 1460, + "valid_targets_mean": 8676.9, + "valid_targets_min": 4315 + }, + { + "epoch": 2.483050847457627, + "grad_norm": 0.4051021933769338, + "learning_rate": 3.261463116500483e-05, + "loss": 0.2942, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10786758363246918, + "step": 1465, + "valid_targets_mean": 6350.8, + "valid_targets_min": 2847 + }, + { + "epoch": 2.4915254237288136, + "grad_norm": 0.4019638092945469, + "learning_rate": 3.254893143477408e-05, + "loss": 0.2916, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20479941368103027, + "step": 1470, + "valid_targets_mean": 10263.6, + "valid_targets_min": 2865 + }, + { + "epoch": 2.5, + "grad_norm": 0.4299334544244074, + "learning_rate": 3.248300759480323e-05, + "loss": 0.3183, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2492760419845581, + "step": 1475, + "valid_targets_mean": 10219.6, + "valid_targets_min": 5175 + }, + { + "epoch": 2.5084745762711864, + "grad_norm": 0.4023371948985823, + "learning_rate": 3.241686082241761e-05, + "loss": 0.2857, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1464785933494568, + "step": 1480, + "valid_targets_mean": 8838.9, + "valid_targets_min": 2493 + }, + { + "epoch": 2.516949152542373, + "grad_norm": 0.41294672992405235, + "learning_rate": 3.235049229892384e-05, + "loss": 0.2655, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12958091497421265, + "step": 1485, + "valid_targets_mean": 7342.2, + "valid_targets_min": 4829 + }, + { + "epoch": 2.5254237288135593, + "grad_norm": 0.3831925532498252, + "learning_rate": 3.2283903209588795e-05, + "loss": 0.3178, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1335603892803192, + "step": 1490, + "valid_targets_mean": 7712.6, + "valid_targets_min": 2385 + }, + { + "epoch": 2.5338983050847457, + "grad_norm": 0.4157070224630618, + "learning_rate": 3.221709474361838e-05, + "loss": 0.3008, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12635986506938934, + "step": 1495, + "valid_targets_mean": 6957.0, + "valid_targets_min": 2932 + }, + { + "epoch": 2.542372881355932, + "grad_norm": 0.4224344033837063, + "learning_rate": 3.215006809413633e-05, + "loss": 0.3194, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1392759382724762, + "step": 1500, + "valid_targets_mean": 6384.5, + "valid_targets_min": 2434 + }, + { + "epoch": 2.5508474576271185, + "grad_norm": 0.43012730740401234, + "learning_rate": 3.20828244581629e-05, + "loss": 0.2878, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1791025698184967, + "step": 1505, + "valid_targets_mean": 7117.2, + "valid_targets_min": 1495 + }, + { + "epoch": 2.559322033898305, + "grad_norm": 0.4845914897087292, + "learning_rate": 3.2015365036593466e-05, + "loss": 0.3306, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1442946195602417, + "step": 1510, + "valid_targets_mean": 9361.6, + "valid_targets_min": 4450 + }, + { + "epoch": 2.5677966101694913, + "grad_norm": 0.4020720093483181, + "learning_rate": 3.194769103417709e-05, + "loss": 0.2901, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2034224271774292, + "step": 1515, + "valid_targets_mean": 8227.0, + "valid_targets_min": 2913 + }, + { + "epoch": 2.576271186440678, + "grad_norm": 0.47515037487881684, + "learning_rate": 3.1879803659495015e-05, + "loss": 0.2974, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09358513355255127, + "step": 1520, + "valid_targets_mean": 5848.9, + "valid_targets_min": 2633 + }, + { + "epoch": 2.584745762711864, + "grad_norm": 0.4525136249871132, + "learning_rate": 3.181170412493906e-05, + "loss": 0.2957, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14096501469612122, + "step": 1525, + "valid_targets_mean": 5804.8, + "valid_targets_min": 2873 + }, + { + "epoch": 2.593220338983051, + "grad_norm": 0.44499842842422144, + "learning_rate": 3.1743393646689996e-05, + "loss": 0.2689, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13607238233089447, + "step": 1530, + "valid_targets_mean": 7015.5, + "valid_targets_min": 3650 + }, + { + "epoch": 2.601694915254237, + "grad_norm": 0.39010435281227923, + "learning_rate": 3.1674873444695804e-05, + "loss": 0.2838, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15358000993728638, + "step": 1535, + "valid_targets_mean": 8212.6, + "valid_targets_min": 4561 + }, + { + "epoch": 2.610169491525424, + "grad_norm": 0.38705505466621165, + "learning_rate": 3.1606144742649875e-05, + "loss": 0.2974, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18068253993988037, + "step": 1540, + "valid_targets_mean": 9366.8, + "valid_targets_min": 3442 + }, + { + "epoch": 2.6186440677966103, + "grad_norm": 0.4645250007783615, + "learning_rate": 3.15372087679692e-05, + "loss": 0.2697, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16335920989513397, + "step": 1545, + "valid_targets_mean": 7294.8, + "valid_targets_min": 2880 + }, + { + "epoch": 2.6271186440677967, + "grad_norm": 0.5969381310791982, + "learning_rate": 3.1468066751772415e-05, + "loss": 0.2987, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20474021136760712, + "step": 1550, + "valid_targets_mean": 9866.2, + "valid_targets_min": 3896 + }, + { + "epoch": 2.635593220338983, + "grad_norm": 0.39986488663805625, + "learning_rate": 3.1398719928857834e-05, + "loss": 0.2852, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16469399631023407, + "step": 1555, + "valid_targets_mean": 9266.1, + "valid_targets_min": 2559 + }, + { + "epoch": 2.6440677966101696, + "grad_norm": 0.42603497362335596, + "learning_rate": 3.132916953768137e-05, + "loss": 0.2842, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15886007249355316, + "step": 1560, + "valid_targets_mean": 7792.9, + "valid_targets_min": 2695 + }, + { + "epoch": 2.652542372881356, + "grad_norm": 0.4477773300510562, + "learning_rate": 3.1259416820334446e-05, + "loss": 0.2917, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1468237042427063, + "step": 1565, + "valid_targets_mean": 6308.1, + "valid_targets_min": 2530 + }, + { + "epoch": 2.6610169491525424, + "grad_norm": 0.413038718975138, + "learning_rate": 3.118946302252181e-05, + "loss": 0.2752, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11161170154809952, + "step": 1570, + "valid_targets_mean": 5875.2, + "valid_targets_min": 3706 + }, + { + "epoch": 2.669491525423729, + "grad_norm": 0.40102607092450826, + "learning_rate": 3.1119309393539256e-05, + "loss": 0.2763, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1047399640083313, + "step": 1575, + "valid_targets_mean": 6100.2, + "valid_targets_min": 2617 + }, + { + "epoch": 2.6779661016949152, + "grad_norm": 0.4487526831600451, + "learning_rate": 3.104895718625136e-05, + "loss": 0.2875, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19679084420204163, + "step": 1580, + "valid_targets_mean": 9194.9, + "valid_targets_min": 3588 + }, + { + "epoch": 2.6864406779661016, + "grad_norm": 0.4319081942251288, + "learning_rate": 3.097840765706908e-05, + "loss": 0.3087, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16104386746883392, + "step": 1585, + "valid_targets_mean": 7758.5, + "valid_targets_min": 2699 + }, + { + "epoch": 2.694915254237288, + "grad_norm": 0.4362156095926864, + "learning_rate": 3.0907662065927297e-05, + "loss": 0.2998, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17210246622562408, + "step": 1590, + "valid_targets_mean": 7771.1, + "valid_targets_min": 4059 + }, + { + "epoch": 2.7033898305084745, + "grad_norm": 0.3805861970091732, + "learning_rate": 3.083672167626237e-05, + "loss": 0.3063, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1351141780614853, + "step": 1595, + "valid_targets_mean": 8147.1, + "valid_targets_min": 3440 + }, + { + "epoch": 2.711864406779661, + "grad_norm": 0.41117431133265786, + "learning_rate": 3.0765587754989516e-05, + "loss": 0.2884, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2080633044242859, + "step": 1600, + "valid_targets_mean": 10313.1, + "valid_targets_min": 4746 + }, + { + "epoch": 2.7203389830508473, + "grad_norm": 0.4193393539029648, + "learning_rate": 3.069426157248022e-05, + "loss": 0.2883, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1242239847779274, + "step": 1605, + "valid_targets_mean": 7685.4, + "valid_targets_min": 2538 + }, + { + "epoch": 2.7288135593220337, + "grad_norm": 0.40390165294921654, + "learning_rate": 3.062274440253953e-05, + "loss": 0.3238, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1672280728816986, + "step": 1610, + "valid_targets_mean": 8736.0, + "valid_targets_min": 2510 + }, + { + "epoch": 2.7372881355932206, + "grad_norm": 0.4597361076436166, + "learning_rate": 3.0551037522383325e-05, + "loss": 0.3077, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13972532749176025, + "step": 1615, + "valid_targets_mean": 6083.9, + "valid_targets_min": 2965 + }, + { + "epoch": 2.7457627118644066, + "grad_norm": 0.3801055818275529, + "learning_rate": 3.0479142212615457e-05, + "loss": 0.3031, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14896857738494873, + "step": 1620, + "valid_targets_mean": 8904.1, + "valid_targets_min": 2302 + }, + { + "epoch": 2.7542372881355934, + "grad_norm": 0.37492323834267705, + "learning_rate": 3.0407059757204968e-05, + "loss": 0.3108, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11933213472366333, + "step": 1625, + "valid_targets_mean": 7426.5, + "valid_targets_min": 2795 + }, + { + "epoch": 2.7627118644067794, + "grad_norm": 0.39976463787165845, + "learning_rate": 3.033479144346308e-05, + "loss": 0.3374, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16365092992782593, + "step": 1630, + "valid_targets_mean": 8906.2, + "valid_targets_min": 4011 + }, + { + "epoch": 2.7711864406779663, + "grad_norm": 0.3997723207190587, + "learning_rate": 3.0262338562020246e-05, + "loss": 0.3026, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11927295476198196, + "step": 1635, + "valid_targets_mean": 6491.0, + "valid_targets_min": 2532 + }, + { + "epoch": 2.7796610169491527, + "grad_norm": 0.36564215466073935, + "learning_rate": 3.018970240680308e-05, + "loss": 0.3071, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19709117710590363, + "step": 1640, + "valid_targets_mean": 11646.2, + "valid_targets_min": 4338 + }, + { + "epoch": 2.788135593220339, + "grad_norm": 0.40505026371761105, + "learning_rate": 3.011688427501126e-05, + "loss": 0.3058, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19479559361934662, + "step": 1645, + "valid_targets_mean": 10186.4, + "valid_targets_min": 4347 + }, + { + "epoch": 2.7966101694915255, + "grad_norm": 0.39795771334611546, + "learning_rate": 3.0043885467094382e-05, + "loss": 0.3121, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09027592837810516, + "step": 1650, + "valid_targets_mean": 5524.0, + "valid_targets_min": 2597 + }, + { + "epoch": 2.805084745762712, + "grad_norm": 0.4041662599563723, + "learning_rate": 2.9970707286728676e-05, + "loss": 0.2997, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1600339710712433, + "step": 1655, + "valid_targets_mean": 7957.8, + "valid_targets_min": 3054 + }, + { + "epoch": 2.8135593220338984, + "grad_norm": 0.437401544209369, + "learning_rate": 2.9897351040793786e-05, + "loss": 0.2776, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11536328494548798, + "step": 1660, + "valid_targets_mean": 5436.1, + "valid_targets_min": 2823 + }, + { + "epoch": 2.8220338983050848, + "grad_norm": 0.37522109968246403, + "learning_rate": 2.9823818039349407e-05, + "loss": 0.2783, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15367770195007324, + "step": 1665, + "valid_targets_mean": 8713.4, + "valid_targets_min": 2676 + }, + { + "epoch": 2.830508474576271, + "grad_norm": 0.3849792093810754, + "learning_rate": 2.9750109595611884e-05, + "loss": 0.2882, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14932164549827576, + "step": 1670, + "valid_targets_mean": 8313.9, + "valid_targets_min": 2584 + }, + { + "epoch": 2.8389830508474576, + "grad_norm": 0.4863619459847622, + "learning_rate": 2.967622702593074e-05, + "loss": 0.2853, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1424635946750641, + "step": 1675, + "valid_targets_mean": 6796.4, + "valid_targets_min": 2567 + }, + { + "epoch": 2.847457627118644, + "grad_norm": 0.396918930200827, + "learning_rate": 2.9602171649765235e-05, + "loss": 0.3067, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14382398128509521, + "step": 1680, + "valid_targets_mean": 9150.9, + "valid_targets_min": 4866 + }, + { + "epoch": 2.8559322033898304, + "grad_norm": 0.4963487698731554, + "learning_rate": 2.9527944789660732e-05, + "loss": 0.2893, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13725848495960236, + "step": 1685, + "valid_targets_mean": 8448.1, + "valid_targets_min": 3413 + }, + { + "epoch": 2.864406779661017, + "grad_norm": 0.4856540030020508, + "learning_rate": 2.9453547771225088e-05, + "loss": 0.2873, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13087928295135498, + "step": 1690, + "valid_targets_mean": 6625.8, + "valid_targets_min": 2060 + }, + { + "epoch": 2.8728813559322033, + "grad_norm": 0.4718602599329464, + "learning_rate": 2.9378981923105026e-05, + "loss": 0.2803, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12425769120454788, + "step": 1695, + "valid_targets_mean": 6502.9, + "valid_targets_min": 3374 + }, + { + "epoch": 2.8813559322033897, + "grad_norm": 0.429811308643893, + "learning_rate": 2.930424857696236e-05, + "loss": 0.3189, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11679084599018097, + "step": 1700, + "valid_targets_mean": 6725.0, + "valid_targets_min": 3680 + }, + { + "epoch": 2.889830508474576, + "grad_norm": 0.6106285244411059, + "learning_rate": 2.922934906745024e-05, + "loss": 0.3187, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17136754095554352, + "step": 1705, + "valid_targets_mean": 8815.4, + "valid_targets_min": 3296 + }, + { + "epoch": 2.898305084745763, + "grad_norm": 0.40881667558157, + "learning_rate": 2.9154284732189285e-05, + "loss": 0.3147, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.103614941239357, + "step": 1710, + "valid_targets_mean": 7344.6, + "valid_targets_min": 3896 + }, + { + "epoch": 2.906779661016949, + "grad_norm": 0.40167051142083, + "learning_rate": 2.907905691174374e-05, + "loss": 0.2885, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15157365798950195, + "step": 1715, + "valid_targets_mean": 7305.6, + "valid_targets_min": 2406 + }, + { + "epoch": 2.915254237288136, + "grad_norm": 0.44454100171373195, + "learning_rate": 2.90036669495975e-05, + "loss": 0.3193, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2535397410392761, + "step": 1720, + "valid_targets_mean": 10899.9, + "valid_targets_min": 4113 + }, + { + "epoch": 2.923728813559322, + "grad_norm": 0.40742031882359336, + "learning_rate": 2.8928116192130127e-05, + "loss": 0.3201, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15399280190467834, + "step": 1725, + "valid_targets_mean": 8970.1, + "valid_targets_min": 4604 + }, + { + "epoch": 2.9322033898305087, + "grad_norm": 0.3808270536515648, + "learning_rate": 2.8852405988592802e-05, + "loss": 0.2801, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.125367671251297, + "step": 1730, + "valid_targets_mean": 6888.9, + "valid_targets_min": 3687 + }, + { + "epoch": 2.940677966101695, + "grad_norm": 0.38551744389083203, + "learning_rate": 2.8776537691084247e-05, + "loss": 0.2971, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2000572681427002, + "step": 1735, + "valid_targets_mean": 9901.8, + "valid_targets_min": 5423 + }, + { + "epoch": 2.9491525423728815, + "grad_norm": 0.3958071016569807, + "learning_rate": 2.8700512654526543e-05, + "loss": 0.303, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1151888519525528, + "step": 1740, + "valid_targets_mean": 6846.0, + "valid_targets_min": 3356 + }, + { + "epoch": 2.957627118644068, + "grad_norm": 0.4049169362567717, + "learning_rate": 2.8624332236640975e-05, + "loss": 0.2857, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15298178791999817, + "step": 1745, + "valid_targets_mean": 8275.1, + "valid_targets_min": 3234 + }, + { + "epoch": 2.9661016949152543, + "grad_norm": 0.40926795857010767, + "learning_rate": 2.854799779792375e-05, + "loss": 0.2807, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.122572161257267, + "step": 1750, + "valid_targets_mean": 6125.0, + "valid_targets_min": 1440 + }, + { + "epoch": 2.9745762711864407, + "grad_norm": 0.4120145141696389, + "learning_rate": 2.8471510701621708e-05, + "loss": 0.2838, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14707563817501068, + "step": 1755, + "valid_targets_mean": 8006.0, + "valid_targets_min": 2888 + }, + { + "epoch": 2.983050847457627, + "grad_norm": 0.4336376958519921, + "learning_rate": 2.8394872313707998e-05, + "loss": 0.3134, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2632421851158142, + "step": 1760, + "valid_targets_mean": 9177.8, + "valid_targets_min": 2312 + }, + { + "epoch": 2.9915254237288136, + "grad_norm": 0.44528199555148923, + "learning_rate": 2.8318084002857654e-05, + "loss": 0.3, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14627692103385925, + "step": 1765, + "valid_targets_mean": 6893.6, + "valid_targets_min": 4435 + }, + { + "epoch": 3.0, + "grad_norm": 0.4240883829673781, + "learning_rate": 2.824114714042317e-05, + "loss": 0.2799, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1557423323392868, + "step": 1770, + "valid_targets_mean": 6871.1, + "valid_targets_min": 2648 + }, + { + "epoch": 3.0084745762711864, + "grad_norm": 0.3897900675954003, + "learning_rate": 2.8164063100409992e-05, + "loss": 0.306, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17762136459350586, + "step": 1775, + "valid_targets_mean": 11193.6, + "valid_targets_min": 5241 + }, + { + "epoch": 3.016949152542373, + "grad_norm": 0.47647182837107177, + "learning_rate": 2.8086833259452006e-05, + "loss": 0.2565, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1492662876844406, + "step": 1780, + "valid_targets_mean": 7162.5, + "valid_targets_min": 2970 + }, + { + "epoch": 3.0254237288135593, + "grad_norm": 0.48623120655281904, + "learning_rate": 2.8009458996786934e-05, + "loss": 0.2875, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12112700194120407, + "step": 1785, + "valid_targets_mean": 7915.6, + "valid_targets_min": 4167 + }, + { + "epoch": 3.0338983050847457, + "grad_norm": 0.48482652840024115, + "learning_rate": 2.7931941694231705e-05, + "loss": 0.3197, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19166266918182373, + "step": 1790, + "valid_targets_mean": 9350.4, + "valid_targets_min": 3952 + }, + { + "epoch": 3.042372881355932, + "grad_norm": 0.43430659240936026, + "learning_rate": 2.7854282736157777e-05, + "loss": 0.2766, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10274215042591095, + "step": 1795, + "valid_targets_mean": 6751.6, + "valid_targets_min": 3033 + }, + { + "epoch": 3.0508474576271185, + "grad_norm": 0.42824230463335977, + "learning_rate": 2.777648350946642e-05, + "loss": 0.3051, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14262977242469788, + "step": 1800, + "valid_targets_mean": 7915.8, + "valid_targets_min": 4544 + }, + { + "epoch": 3.059322033898305, + "grad_norm": 0.39171848978515866, + "learning_rate": 2.7698545403563934e-05, + "loss": 0.2846, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17258086800575256, + "step": 1805, + "valid_targets_mean": 10852.6, + "valid_targets_min": 4410 + }, + { + "epoch": 3.0677966101694913, + "grad_norm": 0.42586366102628226, + "learning_rate": 2.7620469810336854e-05, + "loss": 0.2595, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10813435912132263, + "step": 1810, + "valid_targets_mean": 7451.9, + "valid_targets_min": 3605 + }, + { + "epoch": 3.0762711864406778, + "grad_norm": 0.5024156841387737, + "learning_rate": 2.754225812412708e-05, + "loss": 0.286, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2416592836380005, + "step": 1815, + "valid_targets_mean": 10524.9, + "valid_targets_min": 3310 + }, + { + "epoch": 3.084745762711864, + "grad_norm": 0.4048547245262977, + "learning_rate": 2.7463911741706982e-05, + "loss": 0.3173, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.207644984126091, + "step": 1820, + "valid_targets_mean": 12621.1, + "valid_targets_min": 5029 + }, + { + "epoch": 3.093220338983051, + "grad_norm": 0.4307490078277596, + "learning_rate": 2.738543206225445e-05, + "loss": 0.3163, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1587986946105957, + "step": 1825, + "valid_targets_mean": 7724.6, + "valid_targets_min": 3033 + }, + { + "epoch": 3.1016949152542375, + "grad_norm": 0.3979456347157598, + "learning_rate": 2.7306820487327906e-05, + "loss": 0.2543, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09165980666875839, + "step": 1830, + "valid_targets_mean": 6352.9, + "valid_targets_min": 3636 + }, + { + "epoch": 3.110169491525424, + "grad_norm": 0.41012860288675734, + "learning_rate": 2.7228078420841277e-05, + "loss": 0.2854, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15160031616687775, + "step": 1835, + "valid_targets_mean": 8778.5, + "valid_targets_min": 4517 + }, + { + "epoch": 3.1186440677966103, + "grad_norm": 0.3676896512476812, + "learning_rate": 2.714920726903892e-05, + "loss": 0.2595, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12810014188289642, + "step": 1840, + "valid_targets_mean": 9615.2, + "valid_targets_min": 2341 + }, + { + "epoch": 3.1271186440677967, + "grad_norm": 0.4376407960674012, + "learning_rate": 2.7070208440470525e-05, + "loss": 0.2995, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10664518177509308, + "step": 1845, + "valid_targets_mean": 6728.5, + "valid_targets_min": 1635 + }, + { + "epoch": 3.135593220338983, + "grad_norm": 0.4408544143757849, + "learning_rate": 2.699108334596592e-05, + "loss": 0.2933, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13383883237838745, + "step": 1850, + "valid_targets_mean": 6220.6, + "valid_targets_min": 1893 + }, + { + "epoch": 3.1440677966101696, + "grad_norm": 0.4171325307219931, + "learning_rate": 2.6911833398609923e-05, + "loss": 0.2504, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13895325362682343, + "step": 1855, + "valid_targets_mean": 7073.8, + "valid_targets_min": 3127 + }, + { + "epoch": 3.152542372881356, + "grad_norm": 0.38458629105978887, + "learning_rate": 2.683246001371706e-05, + "loss": 0.2848, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15742285549640656, + "step": 1860, + "valid_targets_mean": 8551.6, + "valid_targets_min": 3754 + }, + { + "epoch": 3.1610169491525424, + "grad_norm": 0.43171473858147835, + "learning_rate": 2.6752964608806338e-05, + "loss": 0.2832, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16160979866981506, + "step": 1865, + "valid_targets_mean": 8368.9, + "valid_targets_min": 2778 + }, + { + "epoch": 3.169491525423729, + "grad_norm": 0.4050340176255496, + "learning_rate": 2.6673348603575884e-05, + "loss": 0.2756, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11083655059337616, + "step": 1870, + "valid_targets_mean": 7184.9, + "valid_targets_min": 2213 + }, + { + "epoch": 3.1779661016949152, + "grad_norm": 0.387647020584462, + "learning_rate": 2.6593613419877615e-05, + "loss": 0.2906, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.143922820687294, + "step": 1875, + "valid_targets_mean": 7900.6, + "valid_targets_min": 3621 + }, + { + "epoch": 3.1864406779661016, + "grad_norm": 0.42761047108532324, + "learning_rate": 2.6513760481691842e-05, + "loss": 0.3078, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20920830965042114, + "step": 1880, + "valid_targets_mean": 10595.6, + "valid_targets_min": 4433 + }, + { + "epoch": 3.194915254237288, + "grad_norm": 0.41992267855603493, + "learning_rate": 2.6433791215101848e-05, + "loss": 0.2867, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16483736038208008, + "step": 1885, + "valid_targets_mean": 8851.0, + "valid_targets_min": 2382 + }, + { + "epoch": 3.2033898305084745, + "grad_norm": 0.4957805375483976, + "learning_rate": 2.6353707048268397e-05, + "loss": 0.3328, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19370196759700775, + "step": 1890, + "valid_targets_mean": 6473.1, + "valid_targets_min": 2295 + }, + { + "epoch": 3.211864406779661, + "grad_norm": 0.44788686707718267, + "learning_rate": 2.6273509411404234e-05, + "loss": 0.2979, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1875634789466858, + "step": 1895, + "valid_targets_mean": 8210.6, + "valid_targets_min": 2503 + }, + { + "epoch": 3.2203389830508473, + "grad_norm": 0.4152706213229902, + "learning_rate": 2.6193199736748572e-05, + "loss": 0.2844, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1070324182510376, + "step": 1900, + "valid_targets_mean": 6541.2, + "valid_targets_min": 3099 + }, + { + "epoch": 3.2288135593220337, + "grad_norm": 0.4205334323132011, + "learning_rate": 2.611277945854148e-05, + "loss": 0.3005, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12432655692100525, + "step": 1905, + "valid_targets_mean": 7172.9, + "valid_targets_min": 2347 + }, + { + "epoch": 3.23728813559322, + "grad_norm": 0.42085706446217025, + "learning_rate": 2.603225001299829e-05, + "loss": 0.2999, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1846511960029602, + "step": 1910, + "valid_targets_mean": 9515.6, + "valid_targets_min": 2967 + }, + { + "epoch": 3.2457627118644066, + "grad_norm": 0.45800092129429243, + "learning_rate": 2.595161283828392e-05, + "loss": 0.3104, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10589482635259628, + "step": 1915, + "valid_targets_mean": 5909.1, + "valid_targets_min": 2628 + }, + { + "epoch": 3.2542372881355934, + "grad_norm": 0.4274729974353385, + "learning_rate": 2.5870869374487227e-05, + "loss": 0.2692, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1856462061405182, + "step": 1920, + "valid_targets_mean": 8283.9, + "valid_targets_min": 4400 + }, + { + "epoch": 3.26271186440678, + "grad_norm": 0.45054085287704343, + "learning_rate": 2.579002106359527e-05, + "loss": 0.2954, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16199690103530884, + "step": 1925, + "valid_targets_mean": 6181.9, + "valid_targets_min": 2319 + }, + { + "epoch": 3.2711864406779663, + "grad_norm": 0.40980194755456195, + "learning_rate": 2.5709069349467562e-05, + "loss": 0.3383, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13299697637557983, + "step": 1930, + "valid_targets_mean": 8032.4, + "valid_targets_min": 2865 + }, + { + "epoch": 3.2796610169491527, + "grad_norm": 0.3829926624037664, + "learning_rate": 2.562801567781026e-05, + "loss": 0.2986, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10366646200418472, + "step": 1935, + "valid_targets_mean": 8115.5, + "valid_targets_min": 3637 + }, + { + "epoch": 3.288135593220339, + "grad_norm": 0.42359013428814046, + "learning_rate": 2.554686149615038e-05, + "loss": 0.2566, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12953156232833862, + "step": 1940, + "valid_targets_mean": 8511.0, + "valid_targets_min": 5177 + }, + { + "epoch": 3.2966101694915255, + "grad_norm": 0.39940930819276965, + "learning_rate": 2.5465608253809944e-05, + "loss": 0.2642, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10232742875814438, + "step": 1945, + "valid_targets_mean": 7172.9, + "valid_targets_min": 1999 + }, + { + "epoch": 3.305084745762712, + "grad_norm": 0.43955208594397505, + "learning_rate": 2.5384257401880077e-05, + "loss": 0.2692, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1324247121810913, + "step": 1950, + "valid_targets_mean": 7481.0, + "valid_targets_min": 3559 + }, + { + "epoch": 3.3135593220338984, + "grad_norm": 0.4759603073565482, + "learning_rate": 2.530281039319509e-05, + "loss": 0.2531, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1068073958158493, + "step": 1955, + "valid_targets_mean": 5274.9, + "valid_targets_min": 2989 + }, + { + "epoch": 3.3220338983050848, + "grad_norm": 0.39533664131007507, + "learning_rate": 2.5221268682306565e-05, + "loss": 0.2614, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12157115340232849, + "step": 1960, + "valid_targets_mean": 8086.8, + "valid_targets_min": 3023 + }, + { + "epoch": 3.330508474576271, + "grad_norm": 0.4025452212806949, + "learning_rate": 2.5139633725457345e-05, + "loss": 0.3042, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1479698270559311, + "step": 1965, + "valid_targets_mean": 8655.5, + "valid_targets_min": 3906 + }, + { + "epoch": 3.3389830508474576, + "grad_norm": 0.42521063572004575, + "learning_rate": 2.505790698055554e-05, + "loss": 0.2786, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11045683920383453, + "step": 1970, + "valid_targets_mean": 7279.1, + "valid_targets_min": 5657 + }, + { + "epoch": 3.347457627118644, + "grad_norm": 0.48755661717841947, + "learning_rate": 2.49760899071485e-05, + "loss": 0.2911, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17295318841934204, + "step": 1975, + "valid_targets_mean": 7348.9, + "valid_targets_min": 2427 + }, + { + "epoch": 3.3559322033898304, + "grad_norm": 0.4254688178029983, + "learning_rate": 2.4894183966396735e-05, + "loss": 0.2686, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09378187358379364, + "step": 1980, + "valid_targets_mean": 5475.5, + "valid_targets_min": 2778 + }, + { + "epoch": 3.364406779661017, + "grad_norm": 0.367434521784498, + "learning_rate": 2.4812190621047822e-05, + "loss": 0.294, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10478046536445618, + "step": 1985, + "valid_targets_mean": 8775.1, + "valid_targets_min": 4384 + }, + { + "epoch": 3.3728813559322033, + "grad_norm": 0.4189507633838683, + "learning_rate": 2.4730111335410298e-05, + "loss": 0.304, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17582011222839355, + "step": 1990, + "valid_targets_mean": 7836.2, + "valid_targets_min": 1645 + }, + { + "epoch": 3.3813559322033897, + "grad_norm": 0.400233301929351, + "learning_rate": 2.4647947575327468e-05, + "loss": 0.2775, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09607855975627899, + "step": 1995, + "valid_targets_mean": 5813.9, + "valid_targets_min": 3494 + }, + { + "epoch": 3.389830508474576, + "grad_norm": 0.4336791016592384, + "learning_rate": 2.4565700808151297e-05, + "loss": 0.2513, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10696402192115784, + "step": 2000, + "valid_targets_mean": 6734.2, + "valid_targets_min": 3928 + }, + { + "epoch": 3.3983050847457625, + "grad_norm": 0.41428448011026164, + "learning_rate": 2.4483372502716124e-05, + "loss": 0.2799, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0847843810915947, + "step": 2005, + "valid_targets_mean": 5492.8, + "valid_targets_min": 3844 + }, + { + "epoch": 3.406779661016949, + "grad_norm": 0.40964037100046546, + "learning_rate": 2.44009641293125e-05, + "loss": 0.2883, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14137449860572815, + "step": 2010, + "valid_targets_mean": 7062.4, + "valid_targets_min": 2779 + }, + { + "epoch": 3.415254237288136, + "grad_norm": 0.38682559049197435, + "learning_rate": 2.431847715966087e-05, + "loss": 0.2797, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0912858098745346, + "step": 2015, + "valid_targets_mean": 6138.2, + "valid_targets_min": 2715 + }, + { + "epoch": 3.423728813559322, + "grad_norm": 0.48692004450222665, + "learning_rate": 2.423591306688534e-05, + "loss": 0.2708, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11212123930454254, + "step": 2020, + "valid_targets_mean": 6439.9, + "valid_targets_min": 2940 + }, + { + "epoch": 3.4322033898305087, + "grad_norm": 0.5255657570421769, + "learning_rate": 2.4153273325487346e-05, + "loss": 0.279, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1764291524887085, + "step": 2025, + "valid_targets_mean": 8640.4, + "valid_targets_min": 2608 + }, + { + "epoch": 3.440677966101695, + "grad_norm": 0.4266344445319651, + "learning_rate": 2.407055941131932e-05, + "loss": 0.2662, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18718381226062775, + "step": 2030, + "valid_targets_mean": 7492.9, + "valid_targets_min": 2960 + }, + { + "epoch": 3.4491525423728815, + "grad_norm": 0.4211828179123291, + "learning_rate": 2.3987772801558328e-05, + "loss": 0.2858, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21861864626407623, + "step": 2035, + "valid_targets_mean": 8366.5, + "valid_targets_min": 3066 + }, + { + "epoch": 3.457627118644068, + "grad_norm": 0.4160233489369109, + "learning_rate": 2.3904914974679705e-05, + "loss": 0.2831, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10223515331745148, + "step": 2040, + "valid_targets_mean": 6495.2, + "valid_targets_min": 3637 + }, + { + "epoch": 3.4661016949152543, + "grad_norm": 0.40882160997249284, + "learning_rate": 2.3821987410430646e-05, + "loss": 0.2652, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12576085329055786, + "step": 2045, + "valid_targets_mean": 7358.2, + "valid_targets_min": 2607 + }, + { + "epoch": 3.4745762711864407, + "grad_norm": 0.36672520626623, + "learning_rate": 2.3738991589803783e-05, + "loss": 0.2965, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20486734807491302, + "step": 2050, + "valid_targets_mean": 12180.8, + "valid_targets_min": 7787 + }, + { + "epoch": 3.483050847457627, + "grad_norm": 0.3853682329233998, + "learning_rate": 2.36559289950107e-05, + "loss": 0.2794, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18601134419441223, + "step": 2055, + "valid_targets_mean": 9524.1, + "valid_targets_min": 3073 + }, + { + "epoch": 3.4915254237288136, + "grad_norm": 0.3801472492117076, + "learning_rate": 2.357280110945552e-05, + "loss": 0.2966, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15141558647155762, + "step": 2060, + "valid_targets_mean": 9554.1, + "valid_targets_min": 4884 + }, + { + "epoch": 3.5, + "grad_norm": 0.38281552006385716, + "learning_rate": 2.3489609417708383e-05, + "loss": 0.3091, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07897169888019562, + "step": 2065, + "valid_targets_mean": 6056.4, + "valid_targets_min": 2487 + }, + { + "epoch": 3.5084745762711864, + "grad_norm": 0.4084426268312189, + "learning_rate": 2.340635540547892e-05, + "loss": 0.2594, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09317970275878906, + "step": 2070, + "valid_targets_mean": 6611.2, + "valid_targets_min": 2457 + }, + { + "epoch": 3.516949152542373, + "grad_norm": 0.43668463366477434, + "learning_rate": 2.3323040559589755e-05, + "loss": 0.2841, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1499471664428711, + "step": 2075, + "valid_targets_mean": 7579.8, + "valid_targets_min": 2966 + }, + { + "epoch": 3.5254237288135593, + "grad_norm": 0.3983631104396672, + "learning_rate": 2.3239666367949917e-05, + "loss": 0.2827, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1473519206047058, + "step": 2080, + "valid_targets_mean": 7799.1, + "valid_targets_min": 3621 + }, + { + "epoch": 3.5338983050847457, + "grad_norm": 0.4120452974947437, + "learning_rate": 2.3156234319528295e-05, + "loss": 0.2647, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0906115174293518, + "step": 2085, + "valid_targets_mean": 6207.0, + "valid_targets_min": 2847 + }, + { + "epoch": 3.542372881355932, + "grad_norm": 0.44363425545735335, + "learning_rate": 2.3072745904327015e-05, + "loss": 0.2936, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09172677993774414, + "step": 2090, + "valid_targets_mean": 6414.6, + "valid_targets_min": 5234 + }, + { + "epoch": 3.5508474576271185, + "grad_norm": 0.38869052034458823, + "learning_rate": 2.298920261335488e-05, + "loss": 0.2575, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09527749568223953, + "step": 2095, + "valid_targets_mean": 6330.2, + "valid_targets_min": 2577 + }, + { + "epoch": 3.559322033898305, + "grad_norm": 0.36643178759344713, + "learning_rate": 2.2905605938600685e-05, + "loss": 0.2891, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20668168365955353, + "step": 2100, + "valid_targets_mean": 12464.9, + "valid_targets_min": 6539 + }, + { + "epoch": 3.5677966101694913, + "grad_norm": 0.3959504607284564, + "learning_rate": 2.2821957373006617e-05, + "loss": 0.262, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18114525079727173, + "step": 2105, + "valid_targets_mean": 10751.5, + "valid_targets_min": 6678 + }, + { + "epoch": 3.576271186440678, + "grad_norm": 0.41062663468779714, + "learning_rate": 2.273825841044156e-05, + "loss": 0.2941, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15731394290924072, + "step": 2110, + "valid_targets_mean": 8485.2, + "valid_targets_min": 2609 + }, + { + "epoch": 3.584745762711864, + "grad_norm": 0.374346290872505, + "learning_rate": 2.2654510545674442e-05, + "loss": 0.2772, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1397765576839447, + "step": 2115, + "valid_targets_mean": 8244.4, + "valid_targets_min": 3700 + }, + { + "epoch": 3.593220338983051, + "grad_norm": 0.39875361896903927, + "learning_rate": 2.257071527434753e-05, + "loss": 0.2967, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14811114966869354, + "step": 2120, + "valid_targets_mean": 7846.0, + "valid_targets_min": 3187 + }, + { + "epoch": 3.601694915254237, + "grad_norm": 0.39347828360733145, + "learning_rate": 2.2486874092949708e-05, + "loss": 0.2814, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12575045228004456, + "step": 2125, + "valid_targets_mean": 8018.4, + "valid_targets_min": 3985 + }, + { + "epoch": 3.610169491525424, + "grad_norm": 0.4164173242177716, + "learning_rate": 2.2402988498789767e-05, + "loss": 0.2911, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10205131769180298, + "step": 2130, + "valid_targets_mean": 7143.9, + "valid_targets_min": 2676 + }, + { + "epoch": 3.6186440677966103, + "grad_norm": 0.4125444447963192, + "learning_rate": 2.2319059989969668e-05, + "loss": 0.2925, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16392400860786438, + "step": 2135, + "valid_targets_mean": 7902.1, + "valid_targets_min": 3675 + }, + { + "epoch": 3.6271186440677967, + "grad_norm": 0.40524649599732243, + "learning_rate": 2.2235090065357773e-05, + "loss": 0.2945, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18411213159561157, + "step": 2140, + "valid_targets_mean": 8892.9, + "valid_targets_min": 4234 + }, + { + "epoch": 3.635593220338983, + "grad_norm": 0.4088874114510119, + "learning_rate": 2.215108022456208e-05, + "loss": 0.3024, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14849057793617249, + "step": 2145, + "valid_targets_mean": 8279.2, + "valid_targets_min": 4495 + }, + { + "epoch": 3.6440677966101696, + "grad_norm": 0.4831151083725686, + "learning_rate": 2.2067031967903443e-05, + "loss": 0.2542, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13207237422466278, + "step": 2150, + "valid_targets_mean": 9388.2, + "valid_targets_min": 4290 + }, + { + "epoch": 3.652542372881356, + "grad_norm": 0.3733280663746573, + "learning_rate": 2.1982946796388788e-05, + "loss": 0.3061, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17002075910568237, + "step": 2155, + "valid_targets_mean": 11468.6, + "valid_targets_min": 4610 + }, + { + "epoch": 3.6610169491525424, + "grad_norm": 0.4173341617806821, + "learning_rate": 2.1898826211684297e-05, + "loss": 0.2735, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1557663381099701, + "step": 2160, + "valid_targets_mean": 8174.9, + "valid_targets_min": 3753 + }, + { + "epoch": 3.669491525423729, + "grad_norm": 0.4186670500997302, + "learning_rate": 2.1814671716088593e-05, + "loss": 0.3066, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08113788068294525, + "step": 2165, + "valid_targets_mean": 6345.8, + "valid_targets_min": 2595 + }, + { + "epoch": 3.6779661016949152, + "grad_norm": 0.4101685556228967, + "learning_rate": 2.17304848125059e-05, + "loss": 0.2923, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16531658172607422, + "step": 2170, + "valid_targets_mean": 8883.8, + "valid_targets_min": 4246 + }, + { + "epoch": 3.6864406779661016, + "grad_norm": 0.41763151825852196, + "learning_rate": 2.1646267004419218e-05, + "loss": 0.2746, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1397768259048462, + "step": 2175, + "valid_targets_mean": 7207.2, + "valid_targets_min": 2605 + }, + { + "epoch": 3.694915254237288, + "grad_norm": 0.440242674224947, + "learning_rate": 2.1562019795863463e-05, + "loss": 0.2954, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22693797945976257, + "step": 2180, + "valid_targets_mean": 9268.8, + "valid_targets_min": 4187 + }, + { + "epoch": 3.7033898305084745, + "grad_norm": 0.44197333796797894, + "learning_rate": 2.147774469139863e-05, + "loss": 0.2516, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10422711074352264, + "step": 2185, + "valid_targets_mean": 6519.4, + "valid_targets_min": 3589 + }, + { + "epoch": 3.711864406779661, + "grad_norm": 0.40539121412831586, + "learning_rate": 2.1393443196082867e-05, + "loss": 0.283, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2202359437942505, + "step": 2190, + "valid_targets_mean": 11366.1, + "valid_targets_min": 4141 + }, + { + "epoch": 3.7203389830508473, + "grad_norm": 0.430547381803079, + "learning_rate": 2.1309116815445665e-05, + "loss": 0.2757, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09388360381126404, + "step": 2195, + "valid_targets_mean": 5664.4, + "valid_targets_min": 3034 + }, + { + "epoch": 3.7288135593220337, + "grad_norm": 0.42608356334048153, + "learning_rate": 2.1224767055460922e-05, + "loss": 0.2968, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10148052871227264, + "step": 2200, + "valid_targets_mean": 6436.9, + "valid_targets_min": 3169 + }, + { + "epoch": 3.7372881355932206, + "grad_norm": 0.4210448690634892, + "learning_rate": 2.114039542252008e-05, + "loss": 0.2988, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1500019133090973, + "step": 2205, + "valid_targets_mean": 7466.1, + "valid_targets_min": 3197 + }, + { + "epoch": 3.7457627118644066, + "grad_norm": 0.8119317714900413, + "learning_rate": 2.1056003423405178e-05, + "loss": 0.3019, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22710689902305603, + "step": 2210, + "valid_targets_mean": 8778.1, + "valid_targets_min": 2972 + }, + { + "epoch": 3.7542372881355934, + "grad_norm": 0.4821378308753357, + "learning_rate": 2.0971592565262005e-05, + "loss": 0.2924, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19904181361198425, + "step": 2215, + "valid_targets_mean": 10680.4, + "valid_targets_min": 6006 + }, + { + "epoch": 3.7627118644067794, + "grad_norm": 0.4372433360996204, + "learning_rate": 2.088716435557313e-05, + "loss": 0.2795, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10062790662050247, + "step": 2220, + "valid_targets_mean": 7107.2, + "valid_targets_min": 3544 + }, + { + "epoch": 3.7711864406779663, + "grad_norm": 0.37024338787318023, + "learning_rate": 2.0802720302131016e-05, + "loss": 0.3064, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1332758069038391, + "step": 2225, + "valid_targets_mean": 8794.9, + "valid_targets_min": 1389 + }, + { + "epoch": 3.7796610169491527, + "grad_norm": 0.41076254617672314, + "learning_rate": 2.0718261913011055e-05, + "loss": 0.2873, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15456616878509521, + "step": 2230, + "valid_targets_mean": 7351.8, + "valid_targets_min": 3400 + }, + { + "epoch": 3.788135593220339, + "grad_norm": 0.42262471917169897, + "learning_rate": 2.063379069654468e-05, + "loss": 0.2419, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09343097358942032, + "step": 2235, + "valid_targets_mean": 5882.2, + "valid_targets_min": 1584 + }, + { + "epoch": 3.7966101694915255, + "grad_norm": 0.4069130983703195, + "learning_rate": 2.0549308161292405e-05, + "loss": 0.3008, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1469895988702774, + "step": 2240, + "valid_targets_mean": 7706.8, + "valid_targets_min": 2311 + }, + { + "epoch": 3.805084745762712, + "grad_norm": 0.4321629041786689, + "learning_rate": 2.0464815816016866e-05, + "loss": 0.2685, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11798998713493347, + "step": 2245, + "valid_targets_mean": 6210.6, + "valid_targets_min": 3443 + }, + { + "epoch": 3.8135593220338984, + "grad_norm": 0.3846555018208555, + "learning_rate": 2.0380315169655905e-05, + "loss": 0.3082, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15529337525367737, + "step": 2250, + "valid_targets_mean": 8531.0, + "valid_targets_min": 3768 + }, + { + "epoch": 3.8220338983050848, + "grad_norm": 0.43425368654131496, + "learning_rate": 2.0295807731295628e-05, + "loss": 0.2841, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16532611846923828, + "step": 2255, + "valid_targets_mean": 10186.9, + "valid_targets_min": 5887 + }, + { + "epoch": 3.830508474576271, + "grad_norm": 0.4060353944725796, + "learning_rate": 2.021129501014342e-05, + "loss": 0.2618, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20302706956863403, + "step": 2260, + "valid_targets_mean": 9178.1, + "valid_targets_min": 3145 + }, + { + "epoch": 3.8389830508474576, + "grad_norm": 0.4419753942797279, + "learning_rate": 2.0126778515501e-05, + "loss": 0.2847, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1332482248544693, + "step": 2265, + "valid_targets_mean": 6810.1, + "valid_targets_min": 2611 + }, + { + "epoch": 3.847457627118644, + "grad_norm": 0.3860661265841699, + "learning_rate": 2.0042259756737508e-05, + "loss": 0.3056, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12230737507343292, + "step": 2270, + "valid_targets_mean": 7196.2, + "valid_targets_min": 2703 + }, + { + "epoch": 3.8559322033898304, + "grad_norm": 0.4232795474780064, + "learning_rate": 1.99577402432625e-05, + "loss": 0.2909, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14375734329223633, + "step": 2275, + "valid_targets_mean": 7267.1, + "valid_targets_min": 3181 + }, + { + "epoch": 3.864406779661017, + "grad_norm": 0.4224770166929963, + "learning_rate": 1.9873221484499006e-05, + "loss": 0.2665, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17108933627605438, + "step": 2280, + "valid_targets_mean": 8647.1, + "valid_targets_min": 2676 + }, + { + "epoch": 3.8728813559322033, + "grad_norm": 0.38764218963486163, + "learning_rate": 1.978870498985659e-05, + "loss": 0.2931, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1058858335018158, + "step": 2285, + "valid_targets_mean": 6942.6, + "valid_targets_min": 2277 + }, + { + "epoch": 3.8813559322033897, + "grad_norm": 0.4395517223806546, + "learning_rate": 1.9704192268704372e-05, + "loss": 0.2693, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10128942131996155, + "step": 2290, + "valid_targets_mean": 5997.0, + "valid_targets_min": 1707 + }, + { + "epoch": 3.889830508474576, + "grad_norm": 0.37259316195160275, + "learning_rate": 1.96196848303441e-05, + "loss": 0.2855, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18444445729255676, + "step": 2295, + "valid_targets_mean": 9367.5, + "valid_targets_min": 4451 + }, + { + "epoch": 3.898305084745763, + "grad_norm": 0.44009690363461895, + "learning_rate": 1.953518418398314e-05, + "loss": 0.2737, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14901164174079895, + "step": 2300, + "valid_targets_mean": 6996.6, + "valid_targets_min": 2612 + }, + { + "epoch": 3.906779661016949, + "grad_norm": 0.4064339811743784, + "learning_rate": 1.94506918387076e-05, + "loss": 0.2818, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15096023678779602, + "step": 2305, + "valid_targets_mean": 8826.8, + "valid_targets_min": 3590 + }, + { + "epoch": 3.915254237288136, + "grad_norm": 0.4395725069154411, + "learning_rate": 1.9366209303455322e-05, + "loss": 0.2886, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14768223464488983, + "step": 2310, + "valid_targets_mean": 8623.0, + "valid_targets_min": 5117 + }, + { + "epoch": 3.923728813559322, + "grad_norm": 0.3938918935844931, + "learning_rate": 1.928173808698895e-05, + "loss": 0.2872, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08866434544324875, + "step": 2315, + "valid_targets_mean": 6831.0, + "valid_targets_min": 4091 + }, + { + "epoch": 3.9322033898305087, + "grad_norm": 0.38259904582950616, + "learning_rate": 1.919727969786899e-05, + "loss": 0.283, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14592121541500092, + "step": 2320, + "valid_targets_mean": 8793.0, + "valid_targets_min": 2865 + }, + { + "epoch": 3.940677966101695, + "grad_norm": 0.3874042376620344, + "learning_rate": 1.911283564442687e-05, + "loss": 0.2718, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15052124857902527, + "step": 2325, + "valid_targets_mean": 8260.5, + "valid_targets_min": 2791 + }, + { + "epoch": 3.9491525423728815, + "grad_norm": 0.48083269380960864, + "learning_rate": 1.9028407434737998e-05, + "loss": 0.2774, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15742509067058563, + "step": 2330, + "valid_targets_mean": 6578.2, + "valid_targets_min": 712 + }, + { + "epoch": 3.957627118644068, + "grad_norm": 0.3922858402598884, + "learning_rate": 1.894399657659483e-05, + "loss": 0.2829, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1299702376127243, + "step": 2335, + "valid_targets_mean": 8018.9, + "valid_targets_min": 4466 + }, + { + "epoch": 3.9661016949152543, + "grad_norm": 0.4193645141156418, + "learning_rate": 1.8859604577479927e-05, + "loss": 0.2677, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1529259979724884, + "step": 2340, + "valid_targets_mean": 7416.6, + "valid_targets_min": 2801 + }, + { + "epoch": 3.9745762711864407, + "grad_norm": 0.4485830985098884, + "learning_rate": 1.877523294453908e-05, + "loss": 0.2741, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11698532849550247, + "step": 2345, + "valid_targets_mean": 5913.9, + "valid_targets_min": 2271 + }, + { + "epoch": 3.983050847457627, + "grad_norm": 0.39041637106352106, + "learning_rate": 1.869088318455434e-05, + "loss": 0.2821, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12944526970386505, + "step": 2350, + "valid_targets_mean": 7937.2, + "valid_targets_min": 4038 + }, + { + "epoch": 3.9915254237288136, + "grad_norm": 0.4206277849161821, + "learning_rate": 1.8606556803917136e-05, + "loss": 0.233, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12252271175384521, + "step": 2355, + "valid_targets_mean": 7135.5, + "valid_targets_min": 2557 + }, + { + "epoch": 4.0, + "grad_norm": 0.42395282370877047, + "learning_rate": 1.8522255308601378e-05, + "loss": 0.2707, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14860565960407257, + "step": 2360, + "valid_targets_mean": 6954.8, + "valid_targets_min": 1915 + }, + { + "epoch": 4.008474576271187, + "grad_norm": 0.4394981579743167, + "learning_rate": 1.8437980204136537e-05, + "loss": 0.2836, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1371266394853592, + "step": 2365, + "valid_targets_mean": 6881.1, + "valid_targets_min": 3617 + }, + { + "epoch": 4.016949152542373, + "grad_norm": 0.39865371969450675, + "learning_rate": 1.8353732995580786e-05, + "loss": 0.2458, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1319272816181183, + "step": 2370, + "valid_targets_mean": 7666.8, + "valid_targets_min": 3523 + }, + { + "epoch": 4.02542372881356, + "grad_norm": 0.4335576658492927, + "learning_rate": 1.826951518749411e-05, + "loss": 0.279, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15865981578826904, + "step": 2375, + "valid_targets_mean": 9701.0, + "valid_targets_min": 4588 + }, + { + "epoch": 4.033898305084746, + "grad_norm": 0.37429007480712123, + "learning_rate": 1.8185328283911417e-05, + "loss": 0.2631, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11880265921354294, + "step": 2380, + "valid_targets_mean": 8349.1, + "valid_targets_min": 3445 + }, + { + "epoch": 4.0423728813559325, + "grad_norm": 0.4653775490052777, + "learning_rate": 1.8101173788315707e-05, + "loss": 0.2996, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17142072319984436, + "step": 2385, + "valid_targets_mean": 8055.1, + "valid_targets_min": 2989 + }, + { + "epoch": 4.0508474576271185, + "grad_norm": 0.38759263121062476, + "learning_rate": 1.8017053203611215e-05, + "loss": 0.2565, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13516907393932343, + "step": 2390, + "valid_targets_mean": 8046.6, + "valid_targets_min": 3542 + }, + { + "epoch": 4.059322033898305, + "grad_norm": 0.40174040501426045, + "learning_rate": 1.7932968032096564e-05, + "loss": 0.2761, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07665864378213882, + "step": 2395, + "valid_targets_mean": 5400.4, + "valid_targets_min": 2670 + }, + { + "epoch": 4.067796610169491, + "grad_norm": 0.40431475588899, + "learning_rate": 1.7848919775437924e-05, + "loss": 0.2665, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11547114700078964, + "step": 2400, + "valid_targets_mean": 7075.5, + "valid_targets_min": 2911 + }, + { + "epoch": 4.076271186440678, + "grad_norm": 0.41851164508496586, + "learning_rate": 1.776490993464223e-05, + "loss": 0.2873, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13930678367614746, + "step": 2405, + "valid_targets_mean": 8866.9, + "valid_targets_min": 4799 + }, + { + "epoch": 4.084745762711864, + "grad_norm": 0.42772766629398995, + "learning_rate": 1.768094001003033e-05, + "loss": 0.2575, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12916797399520874, + "step": 2410, + "valid_targets_mean": 7858.2, + "valid_targets_min": 4104 + }, + { + "epoch": 4.093220338983051, + "grad_norm": 0.42053509359988245, + "learning_rate": 1.759701150121024e-05, + "loss": 0.2457, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12978839874267578, + "step": 2415, + "valid_targets_mean": 7875.4, + "valid_targets_min": 2319 + }, + { + "epoch": 4.101694915254237, + "grad_norm": 0.5009497034489835, + "learning_rate": 1.7513125907050302e-05, + "loss": 0.2897, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22473761439323425, + "step": 2420, + "valid_targets_mean": 6372.8, + "valid_targets_min": 2271 + }, + { + "epoch": 4.110169491525424, + "grad_norm": 0.43870007930354155, + "learning_rate": 1.742928472565248e-05, + "loss": 0.27, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09245385229587555, + "step": 2425, + "valid_targets_mean": 5360.8, + "valid_targets_min": 2382 + }, + { + "epoch": 4.11864406779661, + "grad_norm": 0.44775043625125593, + "learning_rate": 1.7345489454325564e-05, + "loss": 0.2703, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0709337666630745, + "step": 2430, + "valid_targets_mean": 5598.9, + "valid_targets_min": 2645 + }, + { + "epoch": 4.127118644067797, + "grad_norm": 0.39217639662993736, + "learning_rate": 1.7261741589558448e-05, + "loss": 0.288, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0978158563375473, + "step": 2435, + "valid_targets_mean": 7005.9, + "valid_targets_min": 3151 + }, + { + "epoch": 4.135593220338983, + "grad_norm": 0.4552504409470467, + "learning_rate": 1.717804262699339e-05, + "loss": 0.2712, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1586516797542572, + "step": 2440, + "valid_targets_mean": 8164.1, + "valid_targets_min": 4684 + }, + { + "epoch": 4.1440677966101696, + "grad_norm": 0.6110641883530884, + "learning_rate": 1.7094394061399318e-05, + "loss": 0.2571, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11182674765586853, + "step": 2445, + "valid_targets_mean": 6517.5, + "valid_targets_min": 3535 + }, + { + "epoch": 4.1525423728813555, + "grad_norm": 0.4189713731531144, + "learning_rate": 1.701079738664512e-05, + "loss": 0.2609, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1106354147195816, + "step": 2450, + "valid_targets_mean": 7306.5, + "valid_targets_min": 2984 + }, + { + "epoch": 4.161016949152542, + "grad_norm": 0.4353514390157063, + "learning_rate": 1.6927254095672992e-05, + "loss": 0.2641, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10617899894714355, + "step": 2455, + "valid_targets_mean": 5812.9, + "valid_targets_min": 2453 + }, + { + "epoch": 4.169491525423728, + "grad_norm": 0.4219809852768852, + "learning_rate": 1.6843765680471715e-05, + "loss": 0.2742, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11135134100914001, + "step": 2460, + "valid_targets_mean": 7021.0, + "valid_targets_min": 3043 + }, + { + "epoch": 4.177966101694915, + "grad_norm": 0.5654406681363515, + "learning_rate": 1.6760333632050086e-05, + "loss": 0.2835, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11446435004472733, + "step": 2465, + "valid_targets_mean": 6612.6, + "valid_targets_min": 3022 + }, + { + "epoch": 4.186440677966102, + "grad_norm": 0.47653784967954316, + "learning_rate": 1.667695944041025e-05, + "loss": 0.2723, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11347555369138718, + "step": 2470, + "valid_targets_mean": 7101.2, + "valid_targets_min": 2948 + }, + { + "epoch": 4.194915254237288, + "grad_norm": 0.4662821933614443, + "learning_rate": 1.6593644594521082e-05, + "loss": 0.2996, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13076099753379822, + "step": 2475, + "valid_targets_mean": 7465.9, + "valid_targets_min": 2341 + }, + { + "epoch": 4.203389830508475, + "grad_norm": 0.4080427666049444, + "learning_rate": 1.6510390582291624e-05, + "loss": 0.2611, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18516531586647034, + "step": 2480, + "valid_targets_mean": 9916.2, + "valid_targets_min": 5024 + }, + { + "epoch": 4.211864406779661, + "grad_norm": 0.42008095154266495, + "learning_rate": 1.6427198890544483e-05, + "loss": 0.2685, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14330461621284485, + "step": 2485, + "valid_targets_mean": 8390.0, + "valid_targets_min": 2523 + }, + { + "epoch": 4.220338983050848, + "grad_norm": 0.41276959099838073, + "learning_rate": 1.634407100498931e-05, + "loss": 0.264, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11455489695072174, + "step": 2490, + "valid_targets_mean": 7962.2, + "valid_targets_min": 4119 + }, + { + "epoch": 4.228813559322034, + "grad_norm": 0.43611233307799147, + "learning_rate": 1.626100841019623e-05, + "loss": 0.2634, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11222334951162338, + "step": 2495, + "valid_targets_mean": 6606.1, + "valid_targets_min": 3702 + }, + { + "epoch": 4.237288135593221, + "grad_norm": 0.5784961476511713, + "learning_rate": 1.6178012589569358e-05, + "loss": 0.2881, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20426484942436218, + "step": 2500, + "valid_targets_mean": 9576.0, + "valid_targets_min": 4395 + }, + { + "epoch": 4.245762711864407, + "grad_norm": 0.41472930754303877, + "learning_rate": 1.60950850253203e-05, + "loss": 0.2774, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18941691517829895, + "step": 2505, + "valid_targets_mean": 9656.6, + "valid_targets_min": 4846 + }, + { + "epoch": 4.254237288135593, + "grad_norm": 0.39746772521027784, + "learning_rate": 1.601222719844168e-05, + "loss": 0.2598, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10123373568058014, + "step": 2510, + "valid_targets_mean": 8234.5, + "valid_targets_min": 4070 + }, + { + "epoch": 4.262711864406779, + "grad_norm": 0.40487688980861414, + "learning_rate": 1.5929440588680688e-05, + "loss": 0.239, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1368967741727829, + "step": 2515, + "valid_targets_mean": 9803.1, + "valid_targets_min": 3305 + }, + { + "epoch": 4.271186440677966, + "grad_norm": 0.38573108303487735, + "learning_rate": 1.5846726674512654e-05, + "loss": 0.2474, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09613785147666931, + "step": 2520, + "valid_targets_mean": 7835.9, + "valid_targets_min": 3348 + }, + { + "epoch": 4.279661016949152, + "grad_norm": 0.43145138808268946, + "learning_rate": 1.576408693311466e-05, + "loss": 0.2675, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18399053812026978, + "step": 2525, + "valid_targets_mean": 9229.1, + "valid_targets_min": 3336 + }, + { + "epoch": 4.288135593220339, + "grad_norm": 0.4562660091012742, + "learning_rate": 1.5681522840339143e-05, + "loss": 0.2722, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1121688187122345, + "step": 2530, + "valid_targets_mean": 6697.4, + "valid_targets_min": 1611 + }, + { + "epoch": 4.296610169491525, + "grad_norm": 0.5087600350546465, + "learning_rate": 1.5599035870687515e-05, + "loss": 0.2855, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12653526663780212, + "step": 2535, + "valid_targets_mean": 6205.5, + "valid_targets_min": 2504 + }, + { + "epoch": 4.305084745762712, + "grad_norm": 0.438881885643239, + "learning_rate": 1.5516627497283882e-05, + "loss": 0.2753, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19421055912971497, + "step": 2540, + "valid_targets_mean": 9667.5, + "valid_targets_min": 2638 + }, + { + "epoch": 4.313559322033898, + "grad_norm": 0.45645782507464455, + "learning_rate": 1.5434299191848713e-05, + "loss": 0.2795, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1491662859916687, + "step": 2545, + "valid_targets_mean": 7809.4, + "valid_targets_min": 2630 + }, + { + "epoch": 4.322033898305085, + "grad_norm": 0.4353487772661872, + "learning_rate": 1.5352052424672535e-05, + "loss": 0.2644, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13219210505485535, + "step": 2550, + "valid_targets_mean": 6678.6, + "valid_targets_min": 1032 + }, + { + "epoch": 4.330508474576272, + "grad_norm": 0.4386593211818938, + "learning_rate": 1.5269888664589712e-05, + "loss": 0.2586, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09329979121685028, + "step": 2555, + "valid_targets_mean": 6891.2, + "valid_targets_min": 3901 + }, + { + "epoch": 4.338983050847458, + "grad_norm": 0.45062923880238476, + "learning_rate": 1.5187809378952182e-05, + "loss": 0.2555, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10724156349897385, + "step": 2560, + "valid_targets_mean": 6354.0, + "valid_targets_min": 1847 + }, + { + "epoch": 4.3474576271186445, + "grad_norm": 0.4720009798967789, + "learning_rate": 1.5105816033603266e-05, + "loss": 0.2433, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09511254727840424, + "step": 2565, + "valid_targets_mean": 6438.9, + "valid_targets_min": 3573 + }, + { + "epoch": 4.3559322033898304, + "grad_norm": 0.47501420296893465, + "learning_rate": 1.5023910092851509e-05, + "loss": 0.2692, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14761820435523987, + "step": 2570, + "valid_targets_mean": 7794.8, + "valid_targets_min": 4409 + }, + { + "epoch": 4.364406779661017, + "grad_norm": 0.46228965195292865, + "learning_rate": 1.4942093019444468e-05, + "loss": 0.2713, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21561656892299652, + "step": 2575, + "valid_targets_mean": 7940.1, + "valid_targets_min": 2271 + }, + { + "epoch": 4.372881355932203, + "grad_norm": 0.4310289841712482, + "learning_rate": 1.4860366274542663e-05, + "loss": 0.2577, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15172511339187622, + "step": 2580, + "valid_targets_mean": 6876.4, + "valid_targets_min": 3609 + }, + { + "epoch": 4.38135593220339, + "grad_norm": 0.3817393899077175, + "learning_rate": 1.4778731317693442e-05, + "loss": 0.2474, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1488693356513977, + "step": 2585, + "valid_targets_mean": 10913.8, + "valid_targets_min": 2336 + }, + { + "epoch": 4.389830508474576, + "grad_norm": 0.4396698768007295, + "learning_rate": 1.4697189606804914e-05, + "loss": 0.2492, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11185161769390106, + "step": 2590, + "valid_targets_mean": 7252.6, + "valid_targets_min": 4278 + }, + { + "epoch": 4.398305084745763, + "grad_norm": 0.4425465024994567, + "learning_rate": 1.4615742598119927e-05, + "loss": 0.2621, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10830656439065933, + "step": 2595, + "valid_targets_mean": 7119.5, + "valid_targets_min": 2530 + }, + { + "epoch": 4.406779661016949, + "grad_norm": 0.4071900412191274, + "learning_rate": 1.4534391746190056e-05, + "loss": 0.2762, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10529286414384842, + "step": 2600, + "valid_targets_mean": 7428.5, + "valid_targets_min": 2578 + }, + { + "epoch": 4.415254237288136, + "grad_norm": 0.40288822455342677, + "learning_rate": 1.4453138503849622e-05, + "loss": 0.3073, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11631416529417038, + "step": 2605, + "valid_targets_mean": 7269.8, + "valid_targets_min": 3017 + }, + { + "epoch": 4.423728813559322, + "grad_norm": 0.42750798117550126, + "learning_rate": 1.4371984322189754e-05, + "loss": 0.2646, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14900711178779602, + "step": 2610, + "valid_targets_mean": 8732.9, + "valid_targets_min": 4282 + }, + { + "epoch": 4.432203389830509, + "grad_norm": 0.44095759717826927, + "learning_rate": 1.4290930650532448e-05, + "loss": 0.2676, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1209695041179657, + "step": 2615, + "valid_targets_mean": 6879.2, + "valid_targets_min": 3422 + }, + { + "epoch": 4.440677966101695, + "grad_norm": 0.424552739901633, + "learning_rate": 1.4209978936404731e-05, + "loss": 0.2878, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1218380331993103, + "step": 2620, + "valid_targets_mean": 6677.4, + "valid_targets_min": 3274 + }, + { + "epoch": 4.4491525423728815, + "grad_norm": 0.39167231606947506, + "learning_rate": 1.4129130625512776e-05, + "loss": 0.2973, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12196886539459229, + "step": 2625, + "valid_targets_mean": 9059.2, + "valid_targets_min": 3095 + }, + { + "epoch": 4.4576271186440675, + "grad_norm": 0.3954677586985334, + "learning_rate": 1.4048387161716086e-05, + "loss": 0.2739, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13891199231147766, + "step": 2630, + "valid_targets_mean": 8787.0, + "valid_targets_min": 4182 + }, + { + "epoch": 4.466101694915254, + "grad_norm": 0.3922770972346297, + "learning_rate": 1.3967749987001717e-05, + "loss": 0.2644, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15331467986106873, + "step": 2635, + "valid_targets_mean": 8593.4, + "valid_targets_min": 2049 + }, + { + "epoch": 4.47457627118644, + "grad_norm": 0.416498484310529, + "learning_rate": 1.3887220541458521e-05, + "loss": 0.2726, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14011646807193756, + "step": 2640, + "valid_targets_mean": 6794.2, + "valid_targets_min": 1697 + }, + { + "epoch": 4.483050847457627, + "grad_norm": 0.3977702816938163, + "learning_rate": 1.380680026325143e-05, + "loss": 0.236, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10949341207742691, + "step": 2645, + "valid_targets_mean": 7184.6, + "valid_targets_min": 1466 + }, + { + "epoch": 4.491525423728813, + "grad_norm": 0.43575966118057613, + "learning_rate": 1.3726490588595776e-05, + "loss": 0.267, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16025930643081665, + "step": 2650, + "valid_targets_mean": 8080.8, + "valid_targets_min": 4200 + }, + { + "epoch": 4.5, + "grad_norm": 0.4929537665321967, + "learning_rate": 1.3646292951731615e-05, + "loss": 0.2622, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12223613262176514, + "step": 2655, + "valid_targets_mean": 7641.6, + "valid_targets_min": 2772 + }, + { + "epoch": 4.508474576271187, + "grad_norm": 0.4542816770985378, + "learning_rate": 1.3566208784898157e-05, + "loss": 0.2684, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10347205400466919, + "step": 2660, + "valid_targets_mean": 7062.9, + "valid_targets_min": 3917 + }, + { + "epoch": 4.516949152542373, + "grad_norm": 0.6154023708778347, + "learning_rate": 1.348623951830816e-05, + "loss": 0.2597, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12198853492736816, + "step": 2665, + "valid_targets_mean": 6628.5, + "valid_targets_min": 2337 + }, + { + "epoch": 4.52542372881356, + "grad_norm": 0.4401656665983104, + "learning_rate": 1.3406386580122389e-05, + "loss": 0.2879, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06955887377262115, + "step": 2670, + "valid_targets_mean": 4901.9, + "valid_targets_min": 2179 + }, + { + "epoch": 4.533898305084746, + "grad_norm": 0.407257406794763, + "learning_rate": 1.332665139642412e-05, + "loss": 0.2733, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21901419758796692, + "step": 2675, + "valid_targets_mean": 10808.1, + "valid_targets_min": 3359 + }, + { + "epoch": 4.5423728813559325, + "grad_norm": 0.4171993331704572, + "learning_rate": 1.3247035391193664e-05, + "loss": 0.268, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08096012473106384, + "step": 2680, + "valid_targets_mean": 6991.5, + "valid_targets_min": 3342 + }, + { + "epoch": 4.5508474576271185, + "grad_norm": 0.4216667198517297, + "learning_rate": 1.3167539986282938e-05, + "loss": 0.2414, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12701958417892456, + "step": 2685, + "valid_targets_mean": 7187.9, + "valid_targets_min": 3835 + }, + { + "epoch": 4.559322033898305, + "grad_norm": 0.4007002554100059, + "learning_rate": 1.3088166601390087e-05, + "loss": 0.2757, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13677562773227692, + "step": 2690, + "valid_targets_mean": 8478.9, + "valid_targets_min": 3949 + }, + { + "epoch": 4.567796610169491, + "grad_norm": 0.44906505243084627, + "learning_rate": 1.3008916654034085e-05, + "loss": 0.3112, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12453994154930115, + "step": 2695, + "valid_targets_mean": 6475.2, + "valid_targets_min": 2863 + }, + { + "epoch": 4.576271186440678, + "grad_norm": 0.4695955316852692, + "learning_rate": 1.2929791559529484e-05, + "loss": 0.2944, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1315167248249054, + "step": 2700, + "valid_targets_mean": 8320.2, + "valid_targets_min": 4323 + }, + { + "epoch": 4.584745762711864, + "grad_norm": 0.480923032502113, + "learning_rate": 1.2850792730961082e-05, + "loss": 0.2867, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10258597880601883, + "step": 2705, + "valid_targets_mean": 6287.9, + "valid_targets_min": 2432 + }, + { + "epoch": 4.593220338983051, + "grad_norm": 0.4053593691587642, + "learning_rate": 1.2771921579158728e-05, + "loss": 0.2853, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20100140571594238, + "step": 2710, + "valid_targets_mean": 11134.0, + "valid_targets_min": 5394 + }, + { + "epoch": 4.601694915254237, + "grad_norm": 0.5133696354264329, + "learning_rate": 1.26931795126721e-05, + "loss": 0.2653, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19328990578651428, + "step": 2715, + "valid_targets_mean": 8126.9, + "valid_targets_min": 2713 + }, + { + "epoch": 4.610169491525424, + "grad_norm": 0.40346643930406395, + "learning_rate": 1.2614567937745554e-05, + "loss": 0.2749, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12850111722946167, + "step": 2720, + "valid_targets_mean": 8410.1, + "valid_targets_min": 3309 + }, + { + "epoch": 4.61864406779661, + "grad_norm": 0.4112102027826456, + "learning_rate": 1.2536088258293018e-05, + "loss": 0.2723, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11901889741420746, + "step": 2725, + "valid_targets_mean": 7852.2, + "valid_targets_min": 3343 + }, + { + "epoch": 4.627118644067797, + "grad_norm": 0.43842191631154037, + "learning_rate": 1.2457741875872928e-05, + "loss": 0.2652, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12838314473628998, + "step": 2730, + "valid_targets_mean": 8761.0, + "valid_targets_min": 3660 + }, + { + "epoch": 4.635593220338983, + "grad_norm": 0.4232260475024782, + "learning_rate": 1.2379530189663156e-05, + "loss": 0.2686, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16140376031398773, + "step": 2735, + "valid_targets_mean": 7674.8, + "valid_targets_min": 1973 + }, + { + "epoch": 4.6440677966101696, + "grad_norm": 0.4001326172915943, + "learning_rate": 1.2301454596436076e-05, + "loss": 0.2578, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1508510857820511, + "step": 2740, + "valid_targets_mean": 8669.1, + "valid_targets_min": 3636 + }, + { + "epoch": 4.652542372881356, + "grad_norm": 0.46641967025775893, + "learning_rate": 1.222351649053359e-05, + "loss": 0.2457, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08667419850826263, + "step": 2745, + "valid_targets_mean": 6366.4, + "valid_targets_min": 2728 + }, + { + "epoch": 4.661016949152542, + "grad_norm": 0.41058878739853244, + "learning_rate": 1.2145717263842228e-05, + "loss": 0.2752, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14657464623451233, + "step": 2750, + "valid_targets_mean": 10316.6, + "valid_targets_min": 4889 + }, + { + "epoch": 4.669491525423728, + "grad_norm": 0.43047052682197245, + "learning_rate": 1.2068058305768298e-05, + "loss": 0.2773, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17472457885742188, + "step": 2755, + "valid_targets_mean": 8935.2, + "valid_targets_min": 1559 + }, + { + "epoch": 4.677966101694915, + "grad_norm": 0.48052761275513234, + "learning_rate": 1.1990541003213072e-05, + "loss": 0.2782, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1159568727016449, + "step": 2760, + "valid_targets_mean": 5699.4, + "valid_targets_min": 1794 + }, + { + "epoch": 4.686440677966102, + "grad_norm": 0.42086376935943387, + "learning_rate": 1.1913166740547999e-05, + "loss": 0.2616, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15755105018615723, + "step": 2765, + "valid_targets_mean": 8291.0, + "valid_targets_min": 2110 + }, + { + "epoch": 4.694915254237288, + "grad_norm": 0.4261819528196372, + "learning_rate": 1.1835936899590017e-05, + "loss": 0.2767, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12719427049160004, + "step": 2770, + "valid_targets_mean": 7391.2, + "valid_targets_min": 3754 + }, + { + "epoch": 4.703389830508475, + "grad_norm": 0.41188015404081924, + "learning_rate": 1.1758852859576842e-05, + "loss": 0.2791, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09580564498901367, + "step": 2775, + "valid_targets_mean": 6902.0, + "valid_targets_min": 4403 + }, + { + "epoch": 4.711864406779661, + "grad_norm": 0.42367310030699584, + "learning_rate": 1.1681915997142354e-05, + "loss": 0.2698, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1462278664112091, + "step": 2780, + "valid_targets_mean": 8892.1, + "valid_targets_min": 2956 + }, + { + "epoch": 4.720338983050848, + "grad_norm": 0.3983024142470498, + "learning_rate": 1.1605127686292009e-05, + "loss": 0.2685, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18142619729042053, + "step": 2785, + "valid_targets_mean": 11195.0, + "valid_targets_min": 4341 + }, + { + "epoch": 4.728813559322034, + "grad_norm": 0.43308748942127245, + "learning_rate": 1.15284892983783e-05, + "loss": 0.2784, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11833596974611282, + "step": 2790, + "valid_targets_mean": 7267.1, + "valid_targets_min": 3360 + }, + { + "epoch": 4.737288135593221, + "grad_norm": 0.42170297161536185, + "learning_rate": 1.1452002202076256e-05, + "loss": 0.289, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1312982141971588, + "step": 2795, + "valid_targets_mean": 8055.4, + "valid_targets_min": 2530 + }, + { + "epoch": 4.745762711864407, + "grad_norm": 0.3919530604528147, + "learning_rate": 1.1375667763359031e-05, + "loss": 0.2649, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14995722472667694, + "step": 2800, + "valid_targets_mean": 8652.5, + "valid_targets_min": 3923 + }, + { + "epoch": 4.754237288135593, + "grad_norm": 0.4210088857440684, + "learning_rate": 1.1299487345473457e-05, + "loss": 0.2776, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10921230912208557, + "step": 2805, + "valid_targets_mean": 7063.4, + "valid_targets_min": 3390 + }, + { + "epoch": 4.762711864406779, + "grad_norm": 0.46524547077364725, + "learning_rate": 1.1223462308915767e-05, + "loss": 0.2773, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16076411306858063, + "step": 2810, + "valid_targets_mean": 7103.1, + "valid_targets_min": 2713 + }, + { + "epoch": 4.771186440677966, + "grad_norm": 0.3987547098085568, + "learning_rate": 1.1147594011407203e-05, + "loss": 0.2921, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15100906789302826, + "step": 2815, + "valid_targets_mean": 9900.6, + "valid_targets_min": 4761 + }, + { + "epoch": 4.779661016949152, + "grad_norm": 0.4867606351030108, + "learning_rate": 1.1071883807869886e-05, + "loss": 0.2769, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1709168553352356, + "step": 2820, + "valid_targets_mean": 7995.1, + "valid_targets_min": 3848 + }, + { + "epoch": 4.788135593220339, + "grad_norm": 0.4243770648885672, + "learning_rate": 1.0996333050402503e-05, + "loss": 0.29, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11102272570133209, + "step": 2825, + "valid_targets_mean": 6283.8, + "valid_targets_min": 3432 + }, + { + "epoch": 4.796610169491525, + "grad_norm": 0.37807523819250266, + "learning_rate": 1.0920943088256266e-05, + "loss": 0.2929, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17590108513832092, + "step": 2830, + "valid_targets_mean": 11326.0, + "valid_targets_min": 3696 + }, + { + "epoch": 4.805084745762712, + "grad_norm": 0.5285744602943411, + "learning_rate": 1.0845715267810716e-05, + "loss": 0.2683, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16316203773021698, + "step": 2835, + "valid_targets_mean": 6556.4, + "valid_targets_min": 1843 + }, + { + "epoch": 4.813559322033898, + "grad_norm": 0.409867873854923, + "learning_rate": 1.0770650932549768e-05, + "loss": 0.2768, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16258347034454346, + "step": 2840, + "valid_targets_mean": 9091.2, + "valid_targets_min": 3104 + }, + { + "epoch": 4.822033898305085, + "grad_norm": 0.4612130048394203, + "learning_rate": 1.0695751423037639e-05, + "loss": 0.2593, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14501486718654633, + "step": 2845, + "valid_targets_mean": 9458.6, + "valid_targets_min": 5624 + }, + { + "epoch": 4.830508474576272, + "grad_norm": 0.4165122048257007, + "learning_rate": 1.0621018076894984e-05, + "loss": 0.2691, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1871585100889206, + "step": 2850, + "valid_targets_mean": 9650.6, + "valid_targets_min": 2319 + }, + { + "epoch": 4.838983050847458, + "grad_norm": 0.4447768666450171, + "learning_rate": 1.0546452228774919e-05, + "loss": 0.2932, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2016182541847229, + "step": 2855, + "valid_targets_mean": 9618.0, + "valid_targets_min": 2098 + }, + { + "epoch": 4.847457627118644, + "grad_norm": 0.45706910235659043, + "learning_rate": 1.047205521033928e-05, + "loss": 0.2659, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07524390518665314, + "step": 2860, + "valid_targets_mean": 5177.8, + "valid_targets_min": 1795 + }, + { + "epoch": 4.8559322033898304, + "grad_norm": 0.4082417794116573, + "learning_rate": 1.0397828350234765e-05, + "loss": 0.2715, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07515836507081985, + "step": 2865, + "valid_targets_mean": 5618.4, + "valid_targets_min": 3548 + }, + { + "epoch": 4.864406779661017, + "grad_norm": 0.43699485002864896, + "learning_rate": 1.032377297406926e-05, + "loss": 0.2669, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15624886751174927, + "step": 2870, + "valid_targets_mean": 8017.9, + "valid_targets_min": 3896 + }, + { + "epoch": 4.872881355932203, + "grad_norm": 0.4475219215390075, + "learning_rate": 1.0249890404388121e-05, + "loss": 0.2769, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13607046008110046, + "step": 2875, + "valid_targets_mean": 7762.4, + "valid_targets_min": 2731 + }, + { + "epoch": 4.88135593220339, + "grad_norm": 0.4010893872939635, + "learning_rate": 1.0176181960650595e-05, + "loss": 0.2606, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2050163745880127, + "step": 2880, + "valid_targets_mean": 10443.4, + "valid_targets_min": 4967 + }, + { + "epoch": 4.889830508474576, + "grad_norm": 0.43399489366456434, + "learning_rate": 1.0102648959206212e-05, + "loss": 0.2465, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09470526874065399, + "step": 2885, + "valid_targets_mean": 6960.6, + "valid_targets_min": 1501 + }, + { + "epoch": 4.898305084745763, + "grad_norm": 0.409246582546555, + "learning_rate": 1.0029292713271334e-05, + "loss": 0.265, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16161762177944183, + "step": 2890, + "valid_targets_mean": 7954.8, + "valid_targets_min": 3290 + }, + { + "epoch": 4.906779661016949, + "grad_norm": 0.43312261146531655, + "learning_rate": 9.956114532905625e-06, + "loss": 0.3058, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12446765601634979, + "step": 2895, + "valid_targets_mean": 7838.4, + "valid_targets_min": 4758 + }, + { + "epoch": 4.915254237288136, + "grad_norm": 0.4301864357851658, + "learning_rate": 9.883115724988743e-06, + "loss": 0.2753, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12632432579994202, + "step": 2900, + "valid_targets_mean": 7188.4, + "valid_targets_min": 2425 + }, + { + "epoch": 4.923728813559322, + "grad_norm": 0.5636109539825138, + "learning_rate": 9.810297593196922e-06, + "loss": 0.2839, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1164482980966568, + "step": 2905, + "valid_targets_mean": 7041.4, + "valid_targets_min": 1517 + }, + { + "epoch": 4.932203389830509, + "grad_norm": 0.41163855796829296, + "learning_rate": 9.73766143797976e-06, + "loss": 0.2975, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18512123823165894, + "step": 2910, + "valid_targets_mean": 9377.4, + "valid_targets_min": 3063 + }, + { + "epoch": 4.940677966101695, + "grad_norm": 0.3999145511854064, + "learning_rate": 9.665208556536918e-06, + "loss": 0.255, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15674389898777008, + "step": 2915, + "valid_targets_mean": 10361.1, + "valid_targets_min": 2778 + }, + { + "epoch": 4.9491525423728815, + "grad_norm": 0.41681357372277467, + "learning_rate": 9.592940242795035e-06, + "loss": 0.2692, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1276121735572815, + "step": 2920, + "valid_targets_mean": 7945.4, + "valid_targets_min": 4230 + }, + { + "epoch": 4.9576271186440675, + "grad_norm": 0.4103109872648721, + "learning_rate": 9.520857787384548e-06, + "loss": 0.2913, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2234308123588562, + "step": 2925, + "valid_targets_mean": 10142.1, + "valid_targets_min": 4081 + }, + { + "epoch": 4.966101694915254, + "grad_norm": 0.4773090185998591, + "learning_rate": 9.44896247761669e-06, + "loss": 0.2859, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11663774400949478, + "step": 2930, + "valid_targets_mean": 7561.9, + "valid_targets_min": 2388 + }, + { + "epoch": 4.97457627118644, + "grad_norm": 0.4519877157560931, + "learning_rate": 9.377255597460469e-06, + "loss": 0.2697, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14655426144599915, + "step": 2935, + "valid_targets_mean": 7012.6, + "valid_targets_min": 2452 + }, + { + "epoch": 4.983050847457627, + "grad_norm": 0.46442379360691927, + "learning_rate": 9.305738427519782e-06, + "loss": 0.2943, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10421495884656906, + "step": 2940, + "valid_targets_mean": 5663.6, + "valid_targets_min": 2072 + }, + { + "epoch": 4.991525423728813, + "grad_norm": 0.38014541504707516, + "learning_rate": 9.234412245010482e-06, + "loss": 0.2418, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16515886783599854, + "step": 2945, + "valid_targets_mean": 9815.4, + "valid_targets_min": 2340 + }, + { + "epoch": 5.0, + "grad_norm": 0.40418734474649126, + "learning_rate": 9.163278323737635e-06, + "loss": 0.2861, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17972296476364136, + "step": 2950, + "valid_targets_mean": 9544.8, + "valid_targets_min": 3286 + }, + { + "epoch": 5.008474576271187, + "grad_norm": 0.38884902460392823, + "learning_rate": 9.092337934072703e-06, + "loss": 0.27, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12223666906356812, + "step": 2955, + "valid_targets_mean": 8354.1, + "valid_targets_min": 3525 + }, + { + "epoch": 5.016949152542373, + "grad_norm": 0.4358731046466529, + "learning_rate": 9.021592342930928e-06, + "loss": 0.2311, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10257917642593384, + "step": 2960, + "valid_targets_mean": 8100.0, + "valid_targets_min": 4173 + }, + { + "epoch": 5.02542372881356, + "grad_norm": 0.43373781383804855, + "learning_rate": 8.951042813748645e-06, + "loss": 0.2664, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18158259987831116, + "step": 2965, + "valid_targets_mean": 10387.9, + "valid_targets_min": 5211 + }, + { + "epoch": 5.033898305084746, + "grad_norm": 0.5249679818676168, + "learning_rate": 8.880690606460754e-06, + "loss": 0.2915, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10569009184837341, + "step": 2970, + "valid_targets_mean": 6634.9, + "valid_targets_min": 2482 + }, + { + "epoch": 5.0423728813559325, + "grad_norm": 0.42560397590925436, + "learning_rate": 8.8105369774782e-06, + "loss": 0.2722, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.157941997051239, + "step": 2975, + "valid_targets_mean": 8599.6, + "valid_targets_min": 2981 + }, + { + "epoch": 5.0508474576271185, + "grad_norm": 0.4355648091689131, + "learning_rate": 8.74058317966556e-06, + "loss": 0.2488, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08466358482837677, + "step": 2980, + "valid_targets_mean": 5620.9, + "valid_targets_min": 3876 + }, + { + "epoch": 5.059322033898305, + "grad_norm": 0.4188697143373527, + "learning_rate": 8.670830462318633e-06, + "loss": 0.2516, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06649868935346603, + "step": 2985, + "valid_targets_mean": 5346.4, + "valid_targets_min": 2357 + }, + { + "epoch": 5.067796610169491, + "grad_norm": 0.43278797414764, + "learning_rate": 8.60128007114217e-06, + "loss": 0.2706, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1381576806306839, + "step": 2990, + "valid_targets_mean": 8565.6, + "valid_targets_min": 1759 + }, + { + "epoch": 5.076271186440678, + "grad_norm": 0.40143576428343275, + "learning_rate": 8.531933248227582e-06, + "loss": 0.2392, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10228410363197327, + "step": 2995, + "valid_targets_mean": 5543.6, + "valid_targets_min": 2229 + }, + { + "epoch": 5.084745762711864, + "grad_norm": 0.4286280311865031, + "learning_rate": 8.462791232030803e-06, + "loss": 0.2759, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13835610449314117, + "step": 3000, + "valid_targets_mean": 8272.5, + "valid_targets_min": 4373 + }, + { + "epoch": 5.093220338983051, + "grad_norm": 0.41785258691109217, + "learning_rate": 8.393855257350132e-06, + "loss": 0.2515, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11477389186620712, + "step": 3005, + "valid_targets_mean": 8371.8, + "valid_targets_min": 4218 + }, + { + "epoch": 5.101694915254237, + "grad_norm": 0.42839185232988447, + "learning_rate": 8.325126555304208e-06, + "loss": 0.2614, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1777895838022232, + "step": 3010, + "valid_targets_mean": 9394.4, + "valid_targets_min": 4110 + }, + { + "epoch": 5.110169491525424, + "grad_norm": 0.4337647626076782, + "learning_rate": 8.256606353310003e-06, + "loss": 0.2472, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14281994104385376, + "step": 3015, + "valid_targets_mean": 9484.0, + "valid_targets_min": 3434 + }, + { + "epoch": 5.11864406779661, + "grad_norm": 0.4295355742774288, + "learning_rate": 8.188295875060943e-06, + "loss": 0.2746, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0776737704873085, + "step": 3020, + "valid_targets_mean": 4949.9, + "valid_targets_min": 3294 + }, + { + "epoch": 5.127118644067797, + "grad_norm": 0.3676364308403277, + "learning_rate": 8.12019634050499e-06, + "loss": 0.2271, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08112052828073502, + "step": 3025, + "valid_targets_mean": 7908.5, + "valid_targets_min": 4680 + }, + { + "epoch": 5.135593220338983, + "grad_norm": 0.4454936935125421, + "learning_rate": 8.052308965822916e-06, + "loss": 0.2468, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1395069807767868, + "step": 3030, + "valid_targets_mean": 7846.9, + "valid_targets_min": 4498 + }, + { + "epoch": 5.1440677966101696, + "grad_norm": 0.4122037084305391, + "learning_rate": 7.984634963406537e-06, + "loss": 0.2499, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14162138104438782, + "step": 3035, + "valid_targets_mean": 8179.1, + "valid_targets_min": 4548 + }, + { + "epoch": 5.1525423728813555, + "grad_norm": 0.463084879888614, + "learning_rate": 7.917175541837101e-06, + "loss": 0.2842, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09783188998699188, + "step": 3040, + "valid_targets_mean": 5998.4, + "valid_targets_min": 2460 + }, + { + "epoch": 5.161016949152542, + "grad_norm": 0.4748887059748165, + "learning_rate": 7.849931905863672e-06, + "loss": 0.2885, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12707798182964325, + "step": 3045, + "valid_targets_mean": 6415.8, + "valid_targets_min": 3785 + }, + { + "epoch": 5.169491525423728, + "grad_norm": 0.45526749296808317, + "learning_rate": 7.78290525638163e-06, + "loss": 0.2575, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18409213423728943, + "step": 3050, + "valid_targets_mean": 11028.6, + "valid_targets_min": 3734 + }, + { + "epoch": 5.177966101694915, + "grad_norm": 0.4462181398544631, + "learning_rate": 7.71609679041121e-06, + "loss": 0.2503, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15138982236385345, + "step": 3055, + "valid_targets_mean": 7039.2, + "valid_targets_min": 3502 + }, + { + "epoch": 5.186440677966102, + "grad_norm": 0.3963924524169505, + "learning_rate": 7.649507701076164e-06, + "loss": 0.2633, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17887073755264282, + "step": 3060, + "valid_targets_mean": 10073.6, + "valid_targets_min": 2114 + }, + { + "epoch": 5.194915254237288, + "grad_norm": 0.5348841144000112, + "learning_rate": 7.583139177582395e-06, + "loss": 0.2634, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2061377465724945, + "step": 3065, + "valid_targets_mean": 7855.2, + "valid_targets_min": 3111 + }, + { + "epoch": 5.203389830508475, + "grad_norm": 0.41577883860215764, + "learning_rate": 7.516992405196772e-06, + "loss": 0.2662, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13540074229240417, + "step": 3070, + "valid_targets_mean": 8547.1, + "valid_targets_min": 4854 + }, + { + "epoch": 5.211864406779661, + "grad_norm": 0.4271021340563035, + "learning_rate": 7.45106856522593e-06, + "loss": 0.2686, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10686710476875305, + "step": 3075, + "valid_targets_mean": 5644.2, + "valid_targets_min": 2827 + }, + { + "epoch": 5.220338983050848, + "grad_norm": 0.4303321911070651, + "learning_rate": 7.385368834995168e-06, + "loss": 0.2305, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07251991331577301, + "step": 3080, + "valid_targets_mean": 5377.9, + "valid_targets_min": 2896 + }, + { + "epoch": 5.228813559322034, + "grad_norm": 0.4414950670458604, + "learning_rate": 7.319894387827473e-06, + "loss": 0.2513, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12613925337791443, + "step": 3085, + "valid_targets_mean": 7042.0, + "valid_targets_min": 3869 + }, + { + "epoch": 5.237288135593221, + "grad_norm": 0.42597819657193176, + "learning_rate": 7.254646393022502e-06, + "loss": 0.2804, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1456468105316162, + "step": 3090, + "valid_targets_mean": 8970.8, + "valid_targets_min": 2240 + }, + { + "epoch": 5.245762711864407, + "grad_norm": 0.3910096201156548, + "learning_rate": 7.189626015835733e-06, + "loss": 0.2832, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14637431502342224, + "step": 3095, + "valid_targets_mean": 9771.9, + "valid_targets_min": 2504 + }, + { + "epoch": 5.254237288135593, + "grad_norm": 0.4720410475372794, + "learning_rate": 7.124834417457664e-06, + "loss": 0.2499, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10337448865175247, + "step": 3100, + "valid_targets_mean": 6589.2, + "valid_targets_min": 2630 + }, + { + "epoch": 5.262711864406779, + "grad_norm": 0.4165414378767662, + "learning_rate": 7.060272754993051e-06, + "loss": 0.2528, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10730390250682831, + "step": 3105, + "valid_targets_mean": 7689.1, + "valid_targets_min": 3877 + }, + { + "epoch": 5.271186440677966, + "grad_norm": 0.4773925338374391, + "learning_rate": 6.9959421814402494e-06, + "loss": 0.2686, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09607205539941788, + "step": 3110, + "valid_targets_mean": 6103.0, + "valid_targets_min": 2958 + }, + { + "epoch": 5.279661016949152, + "grad_norm": 0.405934436370515, + "learning_rate": 6.931843845670647e-06, + "loss": 0.2782, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18584570288658142, + "step": 3115, + "valid_targets_mean": 11376.5, + "valid_targets_min": 6700 + }, + { + "epoch": 5.288135593220339, + "grad_norm": 0.40944718673488073, + "learning_rate": 6.867978892408101e-06, + "loss": 0.2812, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06526018679141998, + "step": 3120, + "valid_targets_mean": 5554.6, + "valid_targets_min": 1909 + }, + { + "epoch": 5.296610169491525, + "grad_norm": 0.3969787353916221, + "learning_rate": 6.804348462208548e-06, + "loss": 0.251, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14641955494880676, + "step": 3125, + "valid_targets_mean": 10160.4, + "valid_targets_min": 4904 + }, + { + "epoch": 5.305084745762712, + "grad_norm": 0.40381438825051413, + "learning_rate": 6.7409536914395866e-06, + "loss": 0.255, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12536650896072388, + "step": 3130, + "valid_targets_mean": 8634.0, + "valid_targets_min": 6440 + }, + { + "epoch": 5.313559322033898, + "grad_norm": 0.4407810032396024, + "learning_rate": 6.677795712260206e-06, + "loss": 0.2689, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10065967589616776, + "step": 3135, + "valid_targets_mean": 6554.6, + "valid_targets_min": 3413 + }, + { + "epoch": 5.322033898305085, + "grad_norm": 0.43225307653715944, + "learning_rate": 6.6148756526005855e-06, + "loss": 0.2621, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17093005776405334, + "step": 3140, + "valid_targets_mean": 7674.1, + "valid_targets_min": 2705 + }, + { + "epoch": 5.330508474576272, + "grad_norm": 0.42168841714997635, + "learning_rate": 6.552194636141909e-06, + "loss": 0.2444, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1504831612110138, + "step": 3145, + "valid_targets_mean": 8807.0, + "valid_targets_min": 3609 + }, + { + "epoch": 5.338983050847458, + "grad_norm": 0.4721877133160371, + "learning_rate": 6.489753782296315e-06, + "loss": 0.2603, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1312541961669922, + "step": 3150, + "valid_targets_mean": 6869.5, + "valid_targets_min": 2014 + }, + { + "epoch": 5.3474576271186445, + "grad_norm": 0.5627993433253363, + "learning_rate": 6.427554206186939e-06, + "loss": 0.2598, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12869901955127716, + "step": 3155, + "valid_targets_mean": 8781.0, + "valid_targets_min": 3073 + }, + { + "epoch": 5.3559322033898304, + "grad_norm": 0.5975905344692939, + "learning_rate": 6.3655970186279314e-06, + "loss": 0.279, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15334156155586243, + "step": 3160, + "valid_targets_mean": 7974.1, + "valid_targets_min": 4571 + }, + { + "epoch": 5.364406779661017, + "grad_norm": 0.4399240043257231, + "learning_rate": 6.30388332610469e-06, + "loss": 0.2482, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09615137428045273, + "step": 3165, + "valid_targets_mean": 6191.0, + "valid_targets_min": 2960 + }, + { + "epoch": 5.372881355932203, + "grad_norm": 0.43555573486472715, + "learning_rate": 6.242414230754044e-06, + "loss": 0.2651, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1269509643316269, + "step": 3170, + "valid_targets_mean": 7501.0, + "valid_targets_min": 2635 + }, + { + "epoch": 5.38135593220339, + "grad_norm": 0.4707060650067185, + "learning_rate": 6.181190830344601e-06, + "loss": 0.2865, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14338397979736328, + "step": 3175, + "valid_targets_mean": 6411.2, + "valid_targets_min": 3296 + }, + { + "epoch": 5.389830508474576, + "grad_norm": 0.42574272563993854, + "learning_rate": 6.120214218257128e-06, + "loss": 0.2553, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20924800634384155, + "step": 3180, + "valid_targets_mean": 9852.9, + "valid_targets_min": 4562 + }, + { + "epoch": 5.398305084745763, + "grad_norm": 0.39823088488510644, + "learning_rate": 6.059485483465048e-06, + "loss": 0.2489, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12313079833984375, + "step": 3185, + "valid_targets_mean": 7619.0, + "valid_targets_min": 3737 + }, + { + "epoch": 5.406779661016949, + "grad_norm": 0.9536002287476373, + "learning_rate": 5.999005710514956e-06, + "loss": 0.2446, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09335184842348099, + "step": 3190, + "valid_targets_mean": 5375.0, + "valid_targets_min": 1635 + }, + { + "epoch": 5.415254237288136, + "grad_norm": 0.431612528522527, + "learning_rate": 5.938775979507287e-06, + "loss": 0.2625, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13442601263523102, + "step": 3195, + "valid_targets_mean": 7720.2, + "valid_targets_min": 2911 + }, + { + "epoch": 5.423728813559322, + "grad_norm": 0.44860126013223406, + "learning_rate": 5.878797366076994e-06, + "loss": 0.2427, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12965793907642365, + "step": 3200, + "valid_targets_mean": 6444.4, + "valid_targets_min": 2340 + }, + { + "epoch": 5.432203389830509, + "grad_norm": 0.42018341577045487, + "learning_rate": 5.819070941374368e-06, + "loss": 0.2481, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14158044755458832, + "step": 3205, + "valid_targets_mean": 8188.9, + "valid_targets_min": 3917 + }, + { + "epoch": 5.440677966101695, + "grad_norm": 0.48422403137134756, + "learning_rate": 5.759597772045882e-06, + "loss": 0.2805, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1876494586467743, + "step": 3210, + "valid_targets_mean": 9145.9, + "valid_targets_min": 5285 + }, + { + "epoch": 5.4491525423728815, + "grad_norm": 0.46211420065830605, + "learning_rate": 5.700378920215159e-06, + "loss": 0.2735, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21201786398887634, + "step": 3215, + "valid_targets_mean": 7421.4, + "valid_targets_min": 2476 + }, + { + "epoch": 5.4576271186440675, + "grad_norm": 0.4264912650604428, + "learning_rate": 5.641415443463994e-06, + "loss": 0.2615, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1297842115163803, + "step": 3220, + "valid_targets_mean": 7719.5, + "valid_targets_min": 1584 + }, + { + "epoch": 5.466101694915254, + "grad_norm": 0.5482676590741974, + "learning_rate": 5.5827083948134876e-06, + "loss": 0.2821, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11752267181873322, + "step": 3225, + "valid_targets_mean": 6575.1, + "valid_targets_min": 1240 + }, + { + "epoch": 5.47457627118644, + "grad_norm": 0.5019414160677941, + "learning_rate": 5.524258822705202e-06, + "loss": 0.2297, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12094447016716003, + "step": 3230, + "valid_targets_mean": 7180.8, + "valid_targets_min": 4446 + }, + { + "epoch": 5.483050847457627, + "grad_norm": 0.4037586289857663, + "learning_rate": 5.466067770982482e-06, + "loss": 0.2937, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10668241232633591, + "step": 3235, + "valid_targets_mean": 6875.6, + "valid_targets_min": 2801 + }, + { + "epoch": 5.491525423728813, + "grad_norm": 0.4432879666748049, + "learning_rate": 5.4081362788717625e-06, + "loss": 0.2908, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09486261010169983, + "step": 3240, + "valid_targets_mean": 5720.0, + "valid_targets_min": 2827 + }, + { + "epoch": 5.5, + "grad_norm": 0.41525930005316086, + "learning_rate": 5.350465380964076e-06, + "loss": 0.2694, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12814128398895264, + "step": 3245, + "valid_targets_mean": 8286.4, + "valid_targets_min": 3278 + }, + { + "epoch": 5.508474576271187, + "grad_norm": 0.3967241521552427, + "learning_rate": 5.293056107196488e-06, + "loss": 0.2819, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10649764537811279, + "step": 3250, + "valid_targets_mean": 9235.5, + "valid_targets_min": 3054 + }, + { + "epoch": 5.516949152542373, + "grad_norm": 0.4104500751756487, + "learning_rate": 5.235909482833797e-06, + "loss": 0.2718, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07652749121189117, + "step": 3255, + "valid_targets_mean": 5837.8, + "valid_targets_min": 3543 + }, + { + "epoch": 5.52542372881356, + "grad_norm": 0.4548802593937043, + "learning_rate": 5.179026528450146e-06, + "loss": 0.2637, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10874311625957489, + "step": 3260, + "valid_targets_mean": 6713.8, + "valid_targets_min": 3128 + }, + { + "epoch": 5.533898305084746, + "grad_norm": 0.42626630165063617, + "learning_rate": 5.1224082599108584e-06, + "loss": 0.2444, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11963523179292679, + "step": 3265, + "valid_targets_mean": 7900.5, + "valid_targets_min": 4232 + }, + { + "epoch": 5.5423728813559325, + "grad_norm": 0.42226966542492606, + "learning_rate": 5.066055688354246e-06, + "loss": 0.2764, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1330696940422058, + "step": 3270, + "valid_targets_mean": 7405.2, + "valid_targets_min": 3859 + }, + { + "epoch": 5.5508474576271185, + "grad_norm": 0.41559115903205107, + "learning_rate": 5.0099698201735855e-06, + "loss": 0.2615, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18021991848945618, + "step": 3275, + "valid_targets_mean": 9442.4, + "valid_targets_min": 2425 + }, + { + "epoch": 5.559322033898305, + "grad_norm": 0.4473698575482938, + "learning_rate": 4.954151656999122e-06, + "loss": 0.2595, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18893000483512878, + "step": 3280, + "valid_targets_mean": 8873.5, + "valid_targets_min": 2503 + }, + { + "epoch": 5.567796610169491, + "grad_norm": 0.4126655990570961, + "learning_rate": 4.898602195680214e-06, + "loss": 0.257, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17205744981765747, + "step": 3285, + "valid_targets_mean": 10166.2, + "valid_targets_min": 2566 + }, + { + "epoch": 5.576271186440678, + "grad_norm": 0.4436803493070262, + "learning_rate": 4.843322428267465e-06, + "loss": 0.2574, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1269497573375702, + "step": 3290, + "valid_targets_mean": 7204.2, + "valid_targets_min": 2145 + }, + { + "epoch": 5.584745762711864, + "grad_norm": 0.41757091681380304, + "learning_rate": 4.788313341995096e-06, + "loss": 0.3007, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12728919088840485, + "step": 3295, + "valid_targets_mean": 7854.6, + "valid_targets_min": 3467 + }, + { + "epoch": 5.593220338983051, + "grad_norm": 0.4333169695340451, + "learning_rate": 4.733575919263238e-06, + "loss": 0.2715, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.197248175740242, + "step": 3300, + "valid_targets_mean": 9669.5, + "valid_targets_min": 2530 + }, + { + "epoch": 5.601694915254237, + "grad_norm": 0.4217198882582936, + "learning_rate": 4.679111137620442e-06, + "loss": 0.2766, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0994122177362442, + "step": 3305, + "valid_targets_mean": 7220.2, + "valid_targets_min": 2826 + }, + { + "epoch": 5.610169491525424, + "grad_norm": 0.45922876277681324, + "learning_rate": 4.624919969746171e-06, + "loss": 0.2755, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.143977552652359, + "step": 3310, + "valid_targets_mean": 7108.6, + "valid_targets_min": 3254 + }, + { + "epoch": 5.61864406779661, + "grad_norm": 0.4497468341605269, + "learning_rate": 4.571003383433481e-06, + "loss": 0.2898, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15260854363441467, + "step": 3315, + "valid_targets_mean": 7907.2, + "valid_targets_min": 2748 + }, + { + "epoch": 5.627118644067797, + "grad_norm": 0.45353082867834693, + "learning_rate": 4.517362341571687e-06, + "loss": 0.2759, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1295567750930786, + "step": 3320, + "valid_targets_mean": 7593.5, + "valid_targets_min": 2355 + }, + { + "epoch": 5.635593220338983, + "grad_norm": 0.4119838194637205, + "learning_rate": 4.463997802129221e-06, + "loss": 0.3005, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1388033777475357, + "step": 3325, + "valid_targets_mean": 8385.2, + "valid_targets_min": 4455 + }, + { + "epoch": 5.6440677966101696, + "grad_norm": 0.4140759472855946, + "learning_rate": 4.410910718136454e-06, + "loss": 0.2646, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15042278170585632, + "step": 3330, + "valid_targets_mean": 9002.2, + "valid_targets_min": 2717 + }, + { + "epoch": 5.652542372881356, + "grad_norm": 0.4400439343964711, + "learning_rate": 4.3581020376687566e-06, + "loss": 0.2625, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10155346989631653, + "step": 3335, + "valid_targets_mean": 7740.9, + "valid_targets_min": 3495 + }, + { + "epoch": 5.661016949152542, + "grad_norm": 0.45980924813766, + "learning_rate": 4.305572703829495e-06, + "loss": 0.2508, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11865295469760895, + "step": 3340, + "valid_targets_mean": 8350.5, + "valid_targets_min": 4097 + }, + { + "epoch": 5.669491525423728, + "grad_norm": 0.47385129359550743, + "learning_rate": 4.253323654733248e-06, + "loss": 0.2662, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10272833704948425, + "step": 3345, + "valid_targets_mean": 6288.5, + "valid_targets_min": 2754 + }, + { + "epoch": 5.677966101694915, + "grad_norm": 0.42022120557595954, + "learning_rate": 4.201355823488999e-06, + "loss": 0.2676, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14795033633708954, + "step": 3350, + "valid_targets_mean": 7618.1, + "valid_targets_min": 2832 + }, + { + "epoch": 5.686440677966102, + "grad_norm": 0.43924218046367447, + "learning_rate": 4.149670138183526e-06, + "loss": 0.2512, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08661969006061554, + "step": 3355, + "valid_targets_mean": 6429.2, + "valid_targets_min": 1434 + }, + { + "epoch": 5.694915254237288, + "grad_norm": 0.4633969763685704, + "learning_rate": 4.098267521864772e-06, + "loss": 0.2385, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1861276477575302, + "step": 3360, + "valid_targets_mean": 9499.4, + "valid_targets_min": 2276 + }, + { + "epoch": 5.703389830508475, + "grad_norm": 0.45898066026283985, + "learning_rate": 4.047148892525403e-06, + "loss": 0.229, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1299194097518921, + "step": 3365, + "valid_targets_mean": 6270.8, + "valid_targets_min": 2471 + }, + { + "epoch": 5.711864406779661, + "grad_norm": 0.43083386950054814, + "learning_rate": 3.996315163086391e-06, + "loss": 0.2581, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15286263823509216, + "step": 3370, + "valid_targets_mean": 8112.6, + "valid_targets_min": 1794 + }, + { + "epoch": 5.720338983050848, + "grad_norm": 0.467520944139597, + "learning_rate": 3.945767241380732e-06, + "loss": 0.2898, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18376997113227844, + "step": 3375, + "valid_targets_mean": 7821.9, + "valid_targets_min": 1652 + }, + { + "epoch": 5.728813559322034, + "grad_norm": 0.41645203978501605, + "learning_rate": 3.895506030137195e-06, + "loss": 0.2476, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12087373435497284, + "step": 3380, + "valid_targets_mean": 7218.1, + "valid_targets_min": 3939 + }, + { + "epoch": 5.737288135593221, + "grad_norm": 0.41823635458160535, + "learning_rate": 3.845532426964252e-06, + "loss": 0.2501, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10257397592067719, + "step": 3385, + "valid_targets_mean": 6861.1, + "valid_targets_min": 3023 + }, + { + "epoch": 5.745762711864407, + "grad_norm": 0.43232642787196573, + "learning_rate": 3.79584732433399e-06, + "loss": 0.2825, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12480692565441132, + "step": 3390, + "valid_targets_mean": 7853.9, + "valid_targets_min": 2572 + }, + { + "epoch": 5.754237288135593, + "grad_norm": 0.49325336882654114, + "learning_rate": 3.746451609566233e-06, + "loss": 0.267, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24762919545173645, + "step": 3395, + "valid_targets_mean": 9721.4, + "valid_targets_min": 5420 + }, + { + "epoch": 5.762711864406779, + "grad_norm": 0.4212695658266242, + "learning_rate": 3.697346164812643e-06, + "loss": 0.2424, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11336623877286911, + "step": 3400, + "valid_targets_mean": 7380.5, + "valid_targets_min": 3715 + }, + { + "epoch": 5.771186440677966, + "grad_norm": 0.4588086641728118, + "learning_rate": 3.6485318670409896e-06, + "loss": 0.2611, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10371188074350357, + "step": 3405, + "valid_targets_mean": 6874.6, + "valid_targets_min": 2581 + }, + { + "epoch": 5.779661016949152, + "grad_norm": 0.44398724002047824, + "learning_rate": 3.6000095880194905e-06, + "loss": 0.2979, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11031177639961243, + "step": 3410, + "valid_targets_mean": 7567.9, + "valid_targets_min": 4255 + }, + { + "epoch": 5.788135593220339, + "grad_norm": 0.42924629006736004, + "learning_rate": 3.5517801943012443e-06, + "loss": 0.2643, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1974351704120636, + "step": 3415, + "valid_targets_mean": 9567.6, + "valid_targets_min": 4475 + }, + { + "epoch": 5.796610169491525, + "grad_norm": 0.46016588572316125, + "learning_rate": 3.5038445472087324e-06, + "loss": 0.2755, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13061898946762085, + "step": 3420, + "valid_targets_mean": 7301.4, + "valid_targets_min": 2394 + }, + { + "epoch": 5.805084745762712, + "grad_norm": 0.4058426308160901, + "learning_rate": 3.456203502818476e-06, + "loss": 0.2596, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11977847665548325, + "step": 3425, + "valid_targets_mean": 7847.4, + "valid_targets_min": 3901 + }, + { + "epoch": 5.813559322033898, + "grad_norm": 0.48970336832788647, + "learning_rate": 3.408857911945702e-06, + "loss": 0.2906, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18240872025489807, + "step": 3430, + "valid_targets_mean": 9729.4, + "valid_targets_min": 2322 + }, + { + "epoch": 5.822033898305085, + "grad_norm": 0.39563623240144213, + "learning_rate": 3.36180862012919e-06, + "loss": 0.265, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20780718326568604, + "step": 3435, + "valid_targets_mean": 11158.8, + "valid_targets_min": 3305 + }, + { + "epoch": 5.830508474576272, + "grad_norm": 0.49787796279197905, + "learning_rate": 3.3150564676161402e-06, + "loss": 0.2354, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10818520188331604, + "step": 3440, + "valid_targets_mean": 5966.9, + "valid_targets_min": 3336 + }, + { + "epoch": 5.838983050847458, + "grad_norm": 0.43084579663109984, + "learning_rate": 3.268602289347185e-06, + "loss": 0.2569, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19690270721912384, + "step": 3445, + "valid_targets_mean": 11298.9, + "valid_targets_min": 7754 + }, + { + "epoch": 5.847457627118644, + "grad_norm": 0.4218069624746767, + "learning_rate": 3.222446914941468e-06, + "loss": 0.2746, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17221492528915405, + "step": 3450, + "valid_targets_mean": 8413.1, + "valid_targets_min": 3225 + }, + { + "epoch": 5.8559322033898304, + "grad_norm": 0.4671618570113744, + "learning_rate": 3.176591168681851e-06, + "loss": 0.2577, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13562491536140442, + "step": 3455, + "valid_targets_mean": 7066.1, + "valid_targets_min": 2472 + }, + { + "epoch": 5.864406779661017, + "grad_norm": 0.4590320225196124, + "learning_rate": 3.131035869500152e-06, + "loss": 0.2468, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09656020998954773, + "step": 3460, + "valid_targets_mean": 5605.9, + "valid_targets_min": 3660 + }, + { + "epoch": 5.872881355932203, + "grad_norm": 0.4238092707837205, + "learning_rate": 3.085781830962564e-06, + "loss": 0.26, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11015133559703827, + "step": 3465, + "valid_targets_mean": 6491.9, + "valid_targets_min": 2791 + }, + { + "epoch": 5.88135593220339, + "grad_norm": 0.4388528153492548, + "learning_rate": 3.0408298612550878e-06, + "loss": 0.2349, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17622537910938263, + "step": 3470, + "valid_targets_mean": 8512.5, + "valid_targets_min": 2873 + }, + { + "epoch": 5.889830508474576, + "grad_norm": 0.4306978345104024, + "learning_rate": 2.996180763169132e-06, + "loss": 0.2504, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09644504636526108, + "step": 3475, + "valid_targets_mean": 5898.6, + "valid_targets_min": 1697 + }, + { + "epoch": 5.898305084745763, + "grad_norm": 0.4429192567068347, + "learning_rate": 2.95183533408715e-06, + "loss": 0.2562, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09832319617271423, + "step": 3480, + "valid_targets_mean": 6330.5, + "valid_targets_min": 4248 + }, + { + "epoch": 5.906779661016949, + "grad_norm": 0.5042107811710015, + "learning_rate": 2.907794365968413e-06, + "loss": 0.2604, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14449542760849, + "step": 3485, + "valid_targets_mean": 7709.2, + "valid_targets_min": 4466 + }, + { + "epoch": 5.915254237288136, + "grad_norm": 0.38111377370566013, + "learning_rate": 2.864058645334853e-06, + "loss": 0.2441, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1592138707637787, + "step": 3490, + "valid_targets_mean": 9714.1, + "valid_targets_min": 4445 + }, + { + "epoch": 5.923728813559322, + "grad_norm": 0.4523598810623572, + "learning_rate": 2.820628953257052e-06, + "loss": 0.2723, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11317625641822815, + "step": 3495, + "valid_targets_mean": 6696.9, + "valid_targets_min": 1438 + }, + { + "epoch": 5.932203389830509, + "grad_norm": 0.38284023698249975, + "learning_rate": 2.7775060653402387e-06, + "loss": 0.2726, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1514039784669876, + "step": 3500, + "valid_targets_mean": 9845.6, + "valid_targets_min": 4052 + }, + { + "epoch": 5.940677966101695, + "grad_norm": 0.4164588979342514, + "learning_rate": 2.7346907517104894e-06, + "loss": 0.2939, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.209864541888237, + "step": 3505, + "valid_targets_mean": 11032.0, + "valid_targets_min": 5443 + }, + { + "epoch": 5.9491525423728815, + "grad_norm": 0.3835673805693966, + "learning_rate": 2.692183777000932e-06, + "loss": 0.2667, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12400268763303757, + "step": 3510, + "valid_targets_mean": 9057.1, + "valid_targets_min": 2882 + }, + { + "epoch": 5.9576271186440675, + "grad_norm": 0.48693557523835473, + "learning_rate": 2.64998590033813e-06, + "loss": 0.2685, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09107373654842377, + "step": 3515, + "valid_targets_mean": 5536.4, + "valid_targets_min": 1342 + }, + { + "epoch": 5.966101694915254, + "grad_norm": 0.46983127864689195, + "learning_rate": 2.608097875328488e-06, + "loss": 0.2467, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08910076320171356, + "step": 3520, + "valid_targets_mean": 4977.9, + "valid_targets_min": 1896 + }, + { + "epoch": 5.97457627118644, + "grad_norm": 0.45050680482743777, + "learning_rate": 2.5665204500448137e-06, + "loss": 0.2483, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06933078914880753, + "step": 3525, + "valid_targets_mean": 4338.5, + "valid_targets_min": 1973 + }, + { + "epoch": 5.983050847457627, + "grad_norm": 0.449771116335777, + "learning_rate": 2.525254367012955e-06, + "loss": 0.2675, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17051050066947937, + "step": 3530, + "valid_targets_mean": 8545.4, + "valid_targets_min": 3602 + }, + { + "epoch": 5.991525423728813, + "grad_norm": 0.46300251369792844, + "learning_rate": 2.4843003631985486e-06, + "loss": 0.2955, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07504920661449432, + "step": 3535, + "valid_targets_mean": 5244.5, + "valid_targets_min": 3387 + }, + { + "epoch": 6.0, + "grad_norm": 0.4255488380121361, + "learning_rate": 2.4436591699938305e-06, + "loss": 0.2468, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10396578907966614, + "step": 3540, + "valid_targets_mean": 8307.2, + "valid_targets_min": 3542 + }, + { + "epoch": 6.008474576271187, + "grad_norm": 0.4079638692535048, + "learning_rate": 2.403331513204612e-06, + "loss": 0.2447, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.132585346698761, + "step": 3545, + "valid_targets_mean": 8225.9, + "valid_targets_min": 3132 + }, + { + "epoch": 6.016949152542373, + "grad_norm": 0.42095335043120474, + "learning_rate": 2.363318113037283e-06, + "loss": 0.2426, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19237245619297028, + "step": 3550, + "valid_targets_mean": 8534.2, + "valid_targets_min": 2336 + }, + { + "epoch": 6.02542372881356, + "grad_norm": 0.4247831459112695, + "learning_rate": 2.323619684085976e-06, + "loss": 0.2412, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10242437571287155, + "step": 3555, + "valid_targets_mean": 8372.6, + "valid_targets_min": 3019 + }, + { + "epoch": 6.033898305084746, + "grad_norm": 0.5101711223801056, + "learning_rate": 2.2842369353197858e-06, + "loss": 0.2399, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10061325132846832, + "step": 3560, + "valid_targets_mean": 6458.5, + "valid_targets_min": 3200 + }, + { + "epoch": 6.0423728813559325, + "grad_norm": 0.46951651616591455, + "learning_rate": 2.2451705700701185e-06, + "loss": 0.2441, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09043577313423157, + "step": 3565, + "valid_targets_mean": 6405.8, + "valid_targets_min": 1973 + }, + { + "epoch": 6.0508474576271185, + "grad_norm": 0.43838570005499733, + "learning_rate": 2.2064212860181258e-06, + "loss": 0.2347, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1115138828754425, + "step": 3570, + "valid_targets_mean": 6562.5, + "valid_targets_min": 2966 + }, + { + "epoch": 6.059322033898305, + "grad_norm": 0.4105990788568166, + "learning_rate": 2.1679897751822532e-06, + "loss": 0.245, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14000532031059265, + "step": 3575, + "valid_targets_mean": 8664.9, + "valid_targets_min": 3036 + }, + { + "epoch": 6.067796610169491, + "grad_norm": 0.4000234466993258, + "learning_rate": 2.1298767239058684e-06, + "loss": 0.2781, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17599308490753174, + "step": 3580, + "valid_targets_mean": 10298.4, + "valid_targets_min": 3167 + }, + { + "epoch": 6.076271186440678, + "grad_norm": 0.4630894417075392, + "learning_rate": 2.0920828128450197e-06, + "loss": 0.2412, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16314397752285004, + "step": 3585, + "valid_targets_mean": 8534.8, + "valid_targets_min": 4293 + }, + { + "epoch": 6.084745762711864, + "grad_norm": 0.4227879675646018, + "learning_rate": 2.054608716956259e-06, + "loss": 0.2497, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1060272678732872, + "step": 3590, + "valid_targets_mean": 7418.1, + "valid_targets_min": 1916 + }, + { + "epoch": 6.093220338983051, + "grad_norm": 0.4463726939777628, + "learning_rate": 2.0174551054846158e-06, + "loss": 0.2406, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11649863421916962, + "step": 3595, + "valid_targets_mean": 6681.9, + "valid_targets_min": 2538 + }, + { + "epoch": 6.101694915254237, + "grad_norm": 0.44505007275052016, + "learning_rate": 1.9806226419516195e-06, + "loss": 0.2847, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10530796647071838, + "step": 3600, + "valid_targets_mean": 7766.4, + "valid_targets_min": 5614 + }, + { + "epoch": 6.110169491525424, + "grad_norm": 0.38470113587130134, + "learning_rate": 1.94411198414346e-06, + "loss": 0.2665, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14323177933692932, + "step": 3605, + "valid_targets_mean": 10445.9, + "valid_targets_min": 2694 + }, + { + "epoch": 6.11864406779661, + "grad_norm": 0.5125177576701928, + "learning_rate": 1.9079237840992416e-06, + "loss": 0.2332, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09224593639373779, + "step": 3610, + "valid_targets_mean": 6256.4, + "valid_targets_min": 2591 + }, + { + "epoch": 6.127118644067797, + "grad_norm": 0.40141614645721524, + "learning_rate": 1.8720586880993452e-06, + "loss": 0.2753, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13916637003421783, + "step": 3615, + "valid_targets_mean": 8134.5, + "valid_targets_min": 1875 + }, + { + "epoch": 6.135593220338983, + "grad_norm": 0.4648377214616805, + "learning_rate": 1.8365173366538647e-06, + "loss": 0.2984, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1737988442182541, + "step": 3620, + "valid_targets_mean": 8593.6, + "valid_targets_min": 2950 + }, + { + "epoch": 6.1440677966101696, + "grad_norm": 0.3970149435933971, + "learning_rate": 1.8013003644911987e-06, + "loss": 0.2869, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1591392606496811, + "step": 3625, + "valid_targets_mean": 7797.2, + "valid_targets_min": 2927 + }, + { + "epoch": 6.1525423728813555, + "grad_norm": 0.4329881802584791, + "learning_rate": 1.7664084005466796e-06, + "loss": 0.2586, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1466069221496582, + "step": 3630, + "valid_targets_mean": 7398.9, + "valid_targets_min": 2493 + }, + { + "epoch": 6.161016949152542, + "grad_norm": 0.40044188924352225, + "learning_rate": 1.7318420679513725e-06, + "loss": 0.2675, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09767980873584747, + "step": 3635, + "valid_targets_mean": 7647.6, + "valid_targets_min": 5285 + }, + { + "epoch": 6.169491525423728, + "grad_norm": 0.4666515135940152, + "learning_rate": 1.6976019840209334e-06, + "loss": 0.2487, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13460057973861694, + "step": 3640, + "valid_targets_mean": 6764.6, + "valid_targets_min": 3017 + }, + { + "epoch": 6.177966101694915, + "grad_norm": 0.4310188952800369, + "learning_rate": 1.6636887602445839e-06, + "loss": 0.2494, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14499178528785706, + "step": 3645, + "valid_targets_mean": 8610.5, + "valid_targets_min": 4089 + }, + { + "epoch": 6.186440677966102, + "grad_norm": 0.47475101684614096, + "learning_rate": 1.6301030022741837e-06, + "loss": 0.265, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12736810743808746, + "step": 3650, + "valid_targets_mean": 6779.5, + "valid_targets_min": 2699 + }, + { + "epoch": 6.194915254237288, + "grad_norm": 0.5568318024157459, + "learning_rate": 1.596845309913444e-06, + "loss": 0.2766, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13458159565925598, + "step": 3655, + "valid_targets_mean": 6805.9, + "valid_targets_min": 1820 + }, + { + "epoch": 6.203389830508475, + "grad_norm": 0.4321942421836466, + "learning_rate": 1.5639162771071736e-06, + "loss": 0.2582, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17277520895004272, + "step": 3660, + "valid_targets_mean": 8875.1, + "valid_targets_min": 3888 + }, + { + "epoch": 6.211864406779661, + "grad_norm": 0.4459991928762019, + "learning_rate": 1.5313164919307033e-06, + "loss": 0.2631, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11502149701118469, + "step": 3665, + "valid_targets_mean": 7180.1, + "valid_targets_min": 4359 + }, + { + "epoch": 6.220338983050848, + "grad_norm": 0.42250806309461797, + "learning_rate": 1.499046536579374e-06, + "loss": 0.282, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17123055458068848, + "step": 3670, + "valid_targets_mean": 8993.6, + "valid_targets_min": 4613 + }, + { + "epoch": 6.228813559322034, + "grad_norm": 0.4108820724486728, + "learning_rate": 1.4671069873581312e-06, + "loss": 0.2852, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15709635615348816, + "step": 3675, + "valid_targets_mean": 9469.9, + "valid_targets_min": 5070 + }, + { + "epoch": 6.237288135593221, + "grad_norm": 0.4437412702980212, + "learning_rate": 1.4354984146712503e-06, + "loss": 0.2632, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11063840240240097, + "step": 3680, + "valid_targets_mean": 6998.9, + "valid_targets_min": 2213 + }, + { + "epoch": 6.245762711864407, + "grad_norm": 0.4733988446311304, + "learning_rate": 1.4042213830121344e-06, + "loss": 0.2515, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14029532670974731, + "step": 3685, + "valid_targets_mean": 6649.2, + "valid_targets_min": 3248 + }, + { + "epoch": 6.254237288135593, + "grad_norm": 0.38655289252851993, + "learning_rate": 1.3732764509532316e-06, + "loss": 0.2575, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13541369140148163, + "step": 3690, + "valid_targets_mean": 9996.2, + "valid_targets_min": 5577 + }, + { + "epoch": 6.262711864406779, + "grad_norm": 0.4419355294886104, + "learning_rate": 1.3426641711360788e-06, + "loss": 0.2543, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12257914245128632, + "step": 3695, + "valid_targets_mean": 7234.6, + "valid_targets_min": 3465 + }, + { + "epoch": 6.271186440677966, + "grad_norm": 0.4944609384643766, + "learning_rate": 1.3123850902614143e-06, + "loss": 0.2433, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09550976008176804, + "step": 3700, + "valid_targets_mean": 5357.8, + "valid_targets_min": 2337 + }, + { + "epoch": 6.279661016949152, + "grad_norm": 0.458073682292656, + "learning_rate": 1.2824397490794115e-06, + "loss": 0.2791, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12735655903816223, + "step": 3705, + "valid_targets_mean": 8300.4, + "valid_targets_min": 2948 + }, + { + "epoch": 6.288135593220339, + "grad_norm": 0.44512304664485036, + "learning_rate": 1.2528286823800495e-06, + "loss": 0.2496, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12010197341442108, + "step": 3710, + "valid_targets_mean": 6729.8, + "valid_targets_min": 2551 + }, + { + "epoch": 6.296610169491525, + "grad_norm": 0.4241959010800955, + "learning_rate": 1.223552418983518e-06, + "loss": 0.2651, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1606883406639099, + "step": 3715, + "valid_targets_mean": 8563.4, + "valid_targets_min": 2422 + }, + { + "epoch": 6.305084745762712, + "grad_norm": 0.4458826979380267, + "learning_rate": 1.1946114817308207e-06, + "loss": 0.2453, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.126150980591774, + "step": 3720, + "valid_targets_mean": 6960.0, + "valid_targets_min": 2437 + }, + { + "epoch": 6.313559322033898, + "grad_norm": 0.39768023598211966, + "learning_rate": 1.166006387474401e-06, + "loss": 0.2429, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1836184561252594, + "step": 3725, + "valid_targets_mean": 10689.0, + "valid_targets_min": 3353 + }, + { + "epoch": 6.322033898305085, + "grad_norm": 0.4787935493604884, + "learning_rate": 1.1377376470689328e-06, + "loss": 0.271, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12405265867710114, + "step": 3730, + "valid_targets_mean": 6661.1, + "valid_targets_min": 3367 + }, + { + "epoch": 6.330508474576272, + "grad_norm": 0.513993676048688, + "learning_rate": 1.1098057653621775e-06, + "loss": 0.2535, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16209466755390167, + "step": 3735, + "valid_targets_mean": 7460.2, + "valid_targets_min": 3795 + }, + { + "epoch": 6.338983050847458, + "grad_norm": 0.45485260063869304, + "learning_rate": 1.0822112411860042e-06, + "loss": 0.2653, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0905480831861496, + "step": 3740, + "valid_targets_mean": 5860.2, + "valid_targets_min": 2406 + }, + { + "epoch": 6.3474576271186445, + "grad_norm": 0.47528112960496416, + "learning_rate": 1.0549545673474304e-06, + "loss": 0.2461, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0847092866897583, + "step": 3745, + "valid_targets_mean": 6441.5, + "valid_targets_min": 3400 + }, + { + "epoch": 6.3559322033898304, + "grad_norm": 0.417189000217903, + "learning_rate": 1.0280362306198732e-06, + "loss": 0.2609, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1653599739074707, + "step": 3750, + "valid_targets_mean": 9874.0, + "valid_targets_min": 3847 + }, + { + "epoch": 6.364406779661017, + "grad_norm": 0.44496662963253514, + "learning_rate": 1.0014567117344121e-06, + "loss": 0.2689, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14929382503032684, + "step": 3755, + "valid_targets_mean": 6836.2, + "valid_targets_min": 2605 + }, + { + "epoch": 6.372881355932203, + "grad_norm": 0.4711935019321799, + "learning_rate": 9.752164853712355e-07, + "loss": 0.2432, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11264555901288986, + "step": 3760, + "valid_targets_mean": 7332.9, + "valid_targets_min": 3422 + }, + { + "epoch": 6.38135593220339, + "grad_norm": 0.503630625795691, + "learning_rate": 9.493160201511409e-07, + "loss": 0.2658, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11310052871704102, + "step": 3765, + "valid_targets_mean": 7008.2, + "valid_targets_min": 1707 + }, + { + "epoch": 6.389830508474576, + "grad_norm": 0.5778340405809688, + "learning_rate": 9.2375577862718e-07, + "loss": 0.2638, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09299856424331665, + "step": 3770, + "valid_targets_mean": 6915.5, + "valid_targets_min": 2350 + }, + { + "epoch": 6.398305084745763, + "grad_norm": 0.42295528500037055, + "learning_rate": 8.985362172763933e-07, + "loss": 0.2444, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09429045021533966, + "step": 3775, + "valid_targets_mean": 6875.8, + "valid_targets_min": 2364 + }, + { + "epoch": 6.406779661016949, + "grad_norm": 0.39896345678565265, + "learning_rate": 8.736577864916617e-07, + "loss": 0.2497, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11996320635080338, + "step": 3780, + "valid_targets_mean": 7433.8, + "valid_targets_min": 2417 + }, + { + "epoch": 6.415254237288136, + "grad_norm": 0.42165435770722925, + "learning_rate": 8.491209305736525e-07, + "loss": 0.2535, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13380880653858185, + "step": 3785, + "valid_targets_mean": 7627.2, + "valid_targets_min": 2303 + }, + { + "epoch": 6.423728813559322, + "grad_norm": 0.4505139819346616, + "learning_rate": 8.249260877228993e-07, + "loss": 0.2862, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14228764176368713, + "step": 3790, + "valid_targets_mean": 8098.2, + "valid_targets_min": 3002 + }, + { + "epoch": 6.432203389830509, + "grad_norm": 0.4321271164525556, + "learning_rate": 8.010736900319615e-07, + "loss": 0.2721, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09055182337760925, + "step": 3795, + "valid_targets_mean": 6403.5, + "valid_targets_min": 2779 + }, + { + "epoch": 6.440677966101695, + "grad_norm": 0.4445613645730953, + "learning_rate": 7.775641634777198e-07, + "loss": 0.2607, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11796161532402039, + "step": 3800, + "valid_targets_mean": 7846.5, + "valid_targets_min": 3128 + }, + { + "epoch": 6.4491525423728815, + "grad_norm": 0.4983181318128694, + "learning_rate": 7.543979279137592e-07, + "loss": 0.2583, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11737058311700821, + "step": 3805, + "valid_targets_mean": 6364.1, + "valid_targets_min": 2068 + }, + { + "epoch": 6.4576271186440675, + "grad_norm": 0.4637887645159089, + "learning_rate": 7.315753970628825e-07, + "loss": 0.2487, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09322785586118698, + "step": 3810, + "valid_targets_mean": 6619.9, + "valid_targets_min": 2636 + }, + { + "epoch": 6.466101694915254, + "grad_norm": 0.40047532995209967, + "learning_rate": 7.090969785097046e-07, + "loss": 0.2647, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13654407858848572, + "step": 3815, + "valid_targets_mean": 9421.6, + "valid_targets_min": 5966 + }, + { + "epoch": 6.47457627118644, + "grad_norm": 0.4390708368570101, + "learning_rate": 6.869630736933963e-07, + "loss": 0.242, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07607319951057434, + "step": 3820, + "valid_targets_mean": 6052.5, + "valid_targets_min": 3828 + }, + { + "epoch": 6.483050847457627, + "grad_norm": 0.42364553715790104, + "learning_rate": 6.651740779004878e-07, + "loss": 0.2651, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1431792676448822, + "step": 3825, + "valid_targets_mean": 8558.6, + "valid_targets_min": 2566 + }, + { + "epoch": 6.491525423728813, + "grad_norm": 0.47872145294990065, + "learning_rate": 6.437303802578365e-07, + "loss": 0.2624, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09658294916152954, + "step": 3830, + "valid_targets_mean": 5816.0, + "valid_targets_min": 2772 + }, + { + "epoch": 6.5, + "grad_norm": 0.42695972686370715, + "learning_rate": 6.226323637256592e-07, + "loss": 0.2558, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09363295882940292, + "step": 3835, + "valid_targets_mean": 6977.9, + "valid_targets_min": 2840 + }, + { + "epoch": 6.508474576271187, + "grad_norm": 0.448749456041159, + "learning_rate": 6.018804050906957e-07, + "loss": 0.259, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1705683469772339, + "step": 3840, + "valid_targets_mean": 9966.0, + "valid_targets_min": 3703 + }, + { + "epoch": 6.516949152542373, + "grad_norm": 0.44110593342725196, + "learning_rate": 5.814748749594845e-07, + "loss": 0.2921, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15280672907829285, + "step": 3845, + "valid_targets_mean": 7834.5, + "valid_targets_min": 2385 + }, + { + "epoch": 6.52542372881356, + "grad_norm": 0.41011102728994003, + "learning_rate": 5.614161377517491e-07, + "loss": 0.2395, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10929296910762787, + "step": 3850, + "valid_targets_mean": 7395.1, + "valid_targets_min": 2328 + }, + { + "epoch": 6.533898305084746, + "grad_norm": 0.37684976767116324, + "learning_rate": 5.417045516938712e-07, + "loss": 0.2607, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15998807549476624, + "step": 3855, + "valid_targets_mean": 11794.1, + "valid_targets_min": 3559 + }, + { + "epoch": 6.5423728813559325, + "grad_norm": 0.4502091870017217, + "learning_rate": 5.223404688125189e-07, + "loss": 0.2652, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08542191982269287, + "step": 3860, + "valid_targets_mean": 5364.5, + "valid_targets_min": 1501 + }, + { + "epoch": 6.5508474576271185, + "grad_norm": 0.4518810494268951, + "learning_rate": 5.033242349283307e-07, + "loss": 0.2461, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13581258058547974, + "step": 3865, + "valid_targets_mean": 7274.4, + "valid_targets_min": 2654 + }, + { + "epoch": 6.559322033898305, + "grad_norm": 0.467029591171528, + "learning_rate": 4.846561896497682e-07, + "loss": 0.2871, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10872132331132889, + "step": 3870, + "valid_targets_mean": 7022.8, + "valid_targets_min": 4600 + }, + { + "epoch": 6.567796610169491, + "grad_norm": 0.4409609140769841, + "learning_rate": 4.6633666636703325e-07, + "loss": 0.256, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11535359919071198, + "step": 3875, + "valid_targets_mean": 7674.4, + "valid_targets_min": 4116 + }, + { + "epoch": 6.576271186440678, + "grad_norm": 0.42972659095916, + "learning_rate": 4.4836599224611586e-07, + "loss": 0.2518, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09469720721244812, + "step": 3880, + "valid_targets_mean": 7193.9, + "valid_targets_min": 712 + }, + { + "epoch": 6.584745762711864, + "grad_norm": 0.45334276617935493, + "learning_rate": 4.3074448822295165e-07, + "loss": 0.266, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23430021107196808, + "step": 3885, + "valid_targets_mean": 11505.8, + "valid_targets_min": 2009 + }, + { + "epoch": 6.593220338983051, + "grad_norm": 0.43929363356639645, + "learning_rate": 4.1347246899770435e-07, + "loss": 0.252, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16690164804458618, + "step": 3890, + "valid_targets_mean": 7407.8, + "valid_targets_min": 3494 + }, + { + "epoch": 6.601694915254237, + "grad_norm": 0.4147188602054449, + "learning_rate": 3.965502430291235e-07, + "loss": 0.2583, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16083547472953796, + "step": 3895, + "valid_targets_mean": 11111.1, + "valid_targets_min": 5126 + }, + { + "epoch": 6.610169491525424, + "grad_norm": 0.455809497113382, + "learning_rate": 3.7997811252905135e-07, + "loss": 0.2462, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10246642678976059, + "step": 3900, + "valid_targets_mean": 6430.8, + "valid_targets_min": 2509 + }, + { + "epoch": 6.61864406779661, + "grad_norm": 0.48481248655451537, + "learning_rate": 3.6375637345701376e-07, + "loss": 0.2921, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12926767766475677, + "step": 3905, + "valid_targets_mean": 8199.2, + "valid_targets_min": 3433 + }, + { + "epoch": 6.627118644067797, + "grad_norm": 0.42600486230878915, + "learning_rate": 3.4788531551495307e-07, + "loss": 0.2337, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1657295525074005, + "step": 3910, + "valid_targets_mean": 9773.5, + "valid_targets_min": 3644 + }, + { + "epoch": 6.635593220338983, + "grad_norm": 0.44131521564665016, + "learning_rate": 3.323652221420326e-07, + "loss": 0.2662, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11407070606946945, + "step": 3915, + "valid_targets_mean": 7225.0, + "valid_targets_min": 3796 + }, + { + "epoch": 6.6440677966101696, + "grad_norm": 0.4377236209372105, + "learning_rate": 3.1719637050958706e-07, + "loss": 0.2443, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16772839426994324, + "step": 3920, + "valid_targets_mean": 7740.8, + "valid_targets_min": 2711 + }, + { + "epoch": 6.652542372881356, + "grad_norm": 0.48773453863500077, + "learning_rate": 3.023790315161734e-07, + "loss": 0.234, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08592482656240463, + "step": 3925, + "valid_targets_mean": 5208.9, + "valid_targets_min": 2740 + }, + { + "epoch": 6.661016949152542, + "grad_norm": 0.4720937825623047, + "learning_rate": 2.8791346978273015e-07, + "loss": 0.2457, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14076513051986694, + "step": 3930, + "valid_targets_mean": 7652.5, + "valid_targets_min": 2939 + }, + { + "epoch": 6.669491525423728, + "grad_norm": 0.3859609875387887, + "learning_rate": 2.7379994364784556e-07, + "loss": 0.2748, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.149990051984787, + "step": 3935, + "valid_targets_mean": 10438.9, + "valid_targets_min": 6415 + }, + { + "epoch": 6.677966101694915, + "grad_norm": 0.5550308272010621, + "learning_rate": 2.60038705163157e-07, + "loss": 0.2458, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08144932985305786, + "step": 3940, + "valid_targets_mean": 5604.2, + "valid_targets_min": 3387 + }, + { + "epoch": 6.686440677966102, + "grad_norm": 0.3979338951489735, + "learning_rate": 2.4663000008883664e-07, + "loss": 0.2958, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16274738311767578, + "step": 3945, + "valid_targets_mean": 9629.6, + "valid_targets_min": 3399 + }, + { + "epoch": 6.694915254237288, + "grad_norm": 0.46083448051365644, + "learning_rate": 2.335740678892129e-07, + "loss": 0.2563, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14789345860481262, + "step": 3950, + "valid_targets_mean": 7863.1, + "valid_targets_min": 2423 + }, + { + "epoch": 6.703389830508475, + "grad_norm": 0.41684119058343516, + "learning_rate": 2.20871141728487e-07, + "loss": 0.2757, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2013491988182068, + "step": 3955, + "valid_targets_mean": 10909.6, + "valid_targets_min": 3286 + }, + { + "epoch": 6.711864406779661, + "grad_norm": 0.40804130143632766, + "learning_rate": 2.0852144846656764e-07, + "loss": 0.254, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11485549807548523, + "step": 3960, + "valid_targets_mean": 7442.1, + "valid_targets_min": 1795 + }, + { + "epoch": 6.720338983050848, + "grad_norm": 0.41669778757995984, + "learning_rate": 1.9652520865502734e-07, + "loss": 0.2667, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11961879581212997, + "step": 3965, + "valid_targets_mean": 6853.5, + "valid_targets_min": 2648 + }, + { + "epoch": 6.728813559322034, + "grad_norm": 0.4152131127329952, + "learning_rate": 1.848826365331613e-07, + "loss": 0.2728, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09015417098999023, + "step": 3970, + "valid_targets_mean": 6583.1, + "valid_targets_min": 3468 + }, + { + "epoch": 6.737288135593221, + "grad_norm": 0.40715982611325285, + "learning_rate": 1.7359394002415265e-07, + "loss": 0.2537, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0808727890253067, + "step": 3975, + "valid_targets_mean": 7092.9, + "valid_targets_min": 2970 + }, + { + "epoch": 6.745762711864407, + "grad_norm": 0.5044552290709712, + "learning_rate": 1.626593207313709e-07, + "loss": 0.2494, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08215104788541794, + "step": 3980, + "valid_targets_mean": 5966.9, + "valid_targets_min": 2607 + }, + { + "epoch": 6.754237288135593, + "grad_norm": 0.43110120943383057, + "learning_rate": 1.520789739347617e-07, + "loss": 0.2726, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14837504923343658, + "step": 3985, + "valid_targets_mean": 8823.1, + "valid_targets_min": 4021 + }, + { + "epoch": 6.762711864406779, + "grad_norm": 0.4055433819445956, + "learning_rate": 1.4185308858737367e-07, + "loss": 0.2864, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1624079942703247, + "step": 3990, + "valid_targets_mean": 7929.6, + "valid_targets_min": 2855 + }, + { + "epoch": 6.771186440677966, + "grad_norm": 0.477581742178108, + "learning_rate": 1.3198184731196162e-07, + "loss": 0.2545, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10930319130420685, + "step": 3995, + "valid_targets_mean": 7842.5, + "valid_targets_min": 3884 + }, + { + "epoch": 6.779661016949152, + "grad_norm": 0.46632621619817743, + "learning_rate": 1.2246542639774871e-07, + "loss": 0.2893, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08825379610061646, + "step": 4000, + "valid_targets_mean": 5714.2, + "valid_targets_min": 2503 + }, + { + "epoch": 6.788135593220339, + "grad_norm": 0.40822795025329855, + "learning_rate": 1.1330399579725814e-07, + "loss": 0.2502, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12100020796060562, + "step": 4005, + "valid_targets_mean": 7386.6, + "valid_targets_min": 2520 + }, + { + "epoch": 6.796610169491525, + "grad_norm": 0.4869071996289484, + "learning_rate": 1.0449771912329543e-07, + "loss": 0.2679, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13639283180236816, + "step": 4010, + "valid_targets_mean": 6874.1, + "valid_targets_min": 3308 + }, + { + "epoch": 6.805084745762712, + "grad_norm": 0.4514466969309618, + "learning_rate": 9.604675364601079e-08, + "loss": 0.2802, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16514557600021362, + "step": 4015, + "valid_targets_mean": 8557.4, + "valid_targets_min": 2551 + }, + { + "epoch": 6.813559322033898, + "grad_norm": 0.45927796348806976, + "learning_rate": 8.795125029010587e-08, + "loss": 0.2344, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14747881889343262, + "step": 4020, + "valid_targets_mean": 7801.5, + "valid_targets_min": 1934 + }, + { + "epoch": 6.822033898305085, + "grad_norm": 0.4736824137520606, + "learning_rate": 8.021135363212252e-08, + "loss": 0.2668, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1297898292541504, + "step": 4025, + "valid_targets_mean": 7571.8, + "valid_targets_min": 3105 + }, + { + "epoch": 6.830508474576272, + "grad_norm": 0.44820578616508494, + "learning_rate": 7.282720189787374e-08, + "loss": 0.2582, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11103338748216629, + "step": 4030, + "valid_targets_mean": 7009.0, + "valid_targets_min": 2167 + }, + { + "epoch": 6.838983050847458, + "grad_norm": 0.41724902537057335, + "learning_rate": 6.579892695996571e-08, + "loss": 0.2534, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11125913262367249, + "step": 4035, + "valid_targets_mean": 7157.2, + "valid_targets_min": 4536 + }, + { + "epoch": 6.847457627118644, + "grad_norm": 0.43675935476999767, + "learning_rate": 5.912665433545517e-08, + "loss": 0.2585, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13949739933013916, + "step": 4040, + "valid_targets_mean": 7369.8, + "valid_targets_min": 2319 + }, + { + "epoch": 6.8559322033898304, + "grad_norm": 0.3967356930940284, + "learning_rate": 5.281050318358683e-08, + "loss": 0.2403, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11958187818527222, + "step": 4045, + "valid_targets_mean": 9524.0, + "valid_targets_min": 3222 + }, + { + "epoch": 6.864406779661017, + "grad_norm": 0.3764643187198624, + "learning_rate": 4.685058630369055e-08, + "loss": 0.2759, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14520995318889618, + "step": 4050, + "valid_targets_mean": 10037.6, + "valid_targets_min": 3726 + }, + { + "epoch": 6.872881355932203, + "grad_norm": 0.4472913726578498, + "learning_rate": 4.124701013314969e-08, + "loss": 0.2816, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13814541697502136, + "step": 4055, + "valid_targets_mean": 8044.9, + "valid_targets_min": 1559 + }, + { + "epoch": 6.88135593220339, + "grad_norm": 0.4304758387859473, + "learning_rate": 3.599987474550259e-08, + "loss": 0.2661, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17096751928329468, + "step": 4060, + "valid_targets_mean": 8318.6, + "valid_targets_min": 2625 + }, + { + "epoch": 6.889830508474576, + "grad_norm": 0.4255133064645767, + "learning_rate": 3.110927384865958e-08, + "loss": 0.2771, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18236063420772552, + "step": 4065, + "valid_targets_mean": 10562.4, + "valid_targets_min": 4446 + }, + { + "epoch": 6.898305084745763, + "grad_norm": 0.42579147928580874, + "learning_rate": 2.6575294783230954e-08, + "loss": 0.232, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0787440836429596, + "step": 4070, + "valid_targets_mean": 5780.5, + "valid_targets_min": 2433 + }, + { + "epoch": 6.906779661016949, + "grad_norm": 0.41394744030559266, + "learning_rate": 2.239801852095935e-08, + "loss": 0.2446, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.160111665725708, + "step": 4075, + "valid_targets_mean": 10663.0, + "valid_targets_min": 4448 + }, + { + "epoch": 6.915254237288136, + "grad_norm": 0.4398804522507922, + "learning_rate": 1.8577519663278697e-08, + "loss": 0.2397, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11937999725341797, + "step": 4080, + "valid_targets_mean": 8688.0, + "valid_targets_min": 4993 + }, + { + "epoch": 6.923728813559322, + "grad_norm": 0.4242647115439553, + "learning_rate": 1.5113866439986357e-08, + "loss": 0.2832, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16489309072494507, + "step": 4085, + "valid_targets_mean": 8224.9, + "valid_targets_min": 2579 + }, + { + "epoch": 6.932203389830509, + "grad_norm": 0.4463993067738115, + "learning_rate": 1.2007120708015241e-08, + "loss": 0.2719, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13091351091861725, + "step": 4090, + "valid_targets_mean": 6447.1, + "valid_targets_min": 2442 + }, + { + "epoch": 6.940677966101695, + "grad_norm": 0.3869465593180131, + "learning_rate": 9.257337950332456e-09, + "loss": 0.2656, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12474340200424194, + "step": 4095, + "valid_targets_mean": 8366.1, + "valid_targets_min": 3401 + }, + { + "epoch": 6.9491525423728815, + "grad_norm": 0.4310417118559466, + "learning_rate": 6.864567274955658e-09, + "loss": 0.2695, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1725938618183136, + "step": 4100, + "valid_targets_mean": 8291.4, + "valid_targets_min": 2433 + }, + { + "epoch": 6.9576271186440675, + "grad_norm": 0.495997210458029, + "learning_rate": 4.828851414062641e-09, + "loss": 0.2767, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15047688782215118, + "step": 4105, + "valid_targets_mean": 9112.9, + "valid_targets_min": 4448 + }, + { + "epoch": 6.966101694915254, + "grad_norm": 0.40916895754360966, + "learning_rate": 3.150226723243055e-09, + "loss": 0.2685, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12793532013893127, + "step": 4110, + "valid_targets_mean": 8339.1, + "valid_targets_min": 2695 + }, + { + "epoch": 6.97457627118644, + "grad_norm": 0.4136374005938968, + "learning_rate": 1.8287231808322702e-09, + "loss": 0.2591, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14656734466552734, + "step": 4115, + "valid_targets_mean": 10133.8, + "valid_targets_min": 6907 + }, + { + "epoch": 6.983050847457627, + "grad_norm": 0.44077122285507164, + "learning_rate": 8.643643873962326e-10, + "loss": 0.2447, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10336880385875702, + "step": 4120, + "valid_targets_mean": 7540.5, + "valid_targets_min": 4074 + }, + { + "epoch": 6.991525423728813, + "grad_norm": 1.279550969019676, + "learning_rate": 2.5716756528959553e-10, + "loss": 0.2545, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16964712738990784, + "step": 4125, + "valid_targets_mean": 9376.9, + "valid_targets_min": 3622 + }, + { + "epoch": 7.0, + "grad_norm": 0.42781761566450044, + "learning_rate": 7.143558364841597e-12, + "loss": 0.2477, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07686486095190048, + "step": 4130, + "valid_targets_mean": 6255.1, + "valid_targets_min": 3251 + }, + { + "epoch": 7.0, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07686486095190048, + "step": 4130, + "total_flos": 2.65446196155043e+18, + "train_loss": 0.30306281665335555, + "train_runtime": 64515.1665, + "train_samples_per_second": 1.024, + "train_steps_per_second": 0.064, + "valid_targets_mean": 6255.1, + "valid_targets_min": 3251 + } + ], + "logging_steps": 5, + "max_steps": 4130, + "num_input_tokens_seen": 0, + "num_train_epochs": 7, + "save_steps": 1500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": true + }, + "attributes": {} + } + }, + "total_flos": 2.65446196155043e+18, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +}