{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 5.0, "eval_steps": 500, "global_step": 4940, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.005063291139240506, "grad_norm": 4.609051043616223, "learning_rate": 3.238866396761134e-07, "loss": 0.5035, "loss_nan_ranks": 0, "loss_rank_avg": 0.25989317893981934, "step": 5, "valid_targets_mean": 3288.2, "valid_targets_min": 815 }, { "epoch": 0.010126582278481013, "grad_norm": 3.6056753367980687, "learning_rate": 7.287449392712551e-07, "loss": 0.4979, "loss_nan_ranks": 0, "loss_rank_avg": 0.23132257163524628, "step": 10, "valid_targets_mean": 4994.0, "valid_targets_min": 1103 }, { "epoch": 0.015189873417721518, "grad_norm": 3.75046312941662, "learning_rate": 1.133603238866397e-06, "loss": 0.5107, "loss_nan_ranks": 0, "loss_rank_avg": 0.23433995246887207, "step": 15, "valid_targets_mean": 4084.1, "valid_targets_min": 1248 }, { "epoch": 0.020253164556962026, "grad_norm": 4.009323566522028, "learning_rate": 1.5384615384615387e-06, "loss": 0.4757, "loss_nan_ranks": 0, "loss_rank_avg": 0.19289864599704742, "step": 20, "valid_targets_mean": 4351.0, "valid_targets_min": 1208 }, { "epoch": 0.02531645569620253, "grad_norm": 3.857687726883038, "learning_rate": 1.9433198380566803e-06, "loss": 0.4795, "loss_nan_ranks": 0, "loss_rank_avg": 0.25582650303840637, "step": 25, "valid_targets_mean": 4894.1, "valid_targets_min": 1784 }, { "epoch": 0.030379746835443037, "grad_norm": 2.431783748480512, "learning_rate": 2.348178137651822e-06, "loss": 0.4538, "loss_nan_ranks": 0, "loss_rank_avg": 0.21279120445251465, "step": 30, "valid_targets_mean": 4872.4, "valid_targets_min": 1107 }, { "epoch": 0.035443037974683546, "grad_norm": 2.0913610531108153, "learning_rate": 2.7530364372469636e-06, "loss": 0.4576, "loss_nan_ranks": 0, "loss_rank_avg": 0.21099823713302612, "step": 35, "valid_targets_mean": 4177.9, "valid_targets_min": 1173 }, { "epoch": 0.04050632911392405, "grad_norm": 2.1267526423567826, "learning_rate": 3.157894736842105e-06, "loss": 0.4362, "loss_nan_ranks": 0, "loss_rank_avg": 0.21998053789138794, "step": 40, "valid_targets_mean": 5318.6, "valid_targets_min": 1431 }, { "epoch": 0.04556962025316456, "grad_norm": 1.8229308674567508, "learning_rate": 3.562753036437247e-06, "loss": 0.4107, "loss_nan_ranks": 0, "loss_rank_avg": 0.21922659873962402, "step": 45, "valid_targets_mean": 3793.9, "valid_targets_min": 1470 }, { "epoch": 0.05063291139240506, "grad_norm": 1.1764023018227465, "learning_rate": 3.967611336032389e-06, "loss": 0.3992, "loss_nan_ranks": 0, "loss_rank_avg": 0.1912367194890976, "step": 50, "valid_targets_mean": 4403.0, "valid_targets_min": 1320 }, { "epoch": 0.05569620253164557, "grad_norm": 1.0017414517719199, "learning_rate": 4.372469635627531e-06, "loss": 0.3867, "loss_nan_ranks": 0, "loss_rank_avg": 0.19108061492443085, "step": 55, "valid_targets_mean": 4060.0, "valid_targets_min": 1137 }, { "epoch": 0.060759493670886074, "grad_norm": 0.7507852394561627, "learning_rate": 4.7773279352226725e-06, "loss": 0.3841, "loss_nan_ranks": 0, "loss_rank_avg": 0.16387608647346497, "step": 60, "valid_targets_mean": 4424.5, "valid_targets_min": 1409 }, { "epoch": 0.06582278481012659, "grad_norm": 0.557594133353884, "learning_rate": 5.1821862348178145e-06, "loss": 0.3711, "loss_nan_ranks": 0, "loss_rank_avg": 0.16386422514915466, "step": 65, "valid_targets_mean": 3916.2, "valid_targets_min": 1045 }, { "epoch": 0.07088607594936709, "grad_norm": 0.421043632829371, "learning_rate": 5.5870445344129565e-06, "loss": 0.3875, "loss_nan_ranks": 0, "loss_rank_avg": 0.19452455639839172, "step": 70, "valid_targets_mean": 5656.6, "valid_targets_min": 1746 }, { "epoch": 0.0759493670886076, "grad_norm": 0.41166529544187236, "learning_rate": 5.991902834008098e-06, "loss": 0.3747, "loss_nan_ranks": 0, "loss_rank_avg": 0.2017640769481659, "step": 75, "valid_targets_mean": 5565.6, "valid_targets_min": 1301 }, { "epoch": 0.0810126582278481, "grad_norm": 0.37589937170078513, "learning_rate": 6.39676113360324e-06, "loss": 0.3707, "loss_nan_ranks": 0, "loss_rank_avg": 0.13995295763015747, "step": 80, "valid_targets_mean": 3588.8, "valid_targets_min": 994 }, { "epoch": 0.08607594936708861, "grad_norm": 0.3714038081964425, "learning_rate": 6.801619433198381e-06, "loss": 0.3691, "loss_nan_ranks": 0, "loss_rank_avg": 0.21744906902313232, "step": 85, "valid_targets_mean": 5115.6, "valid_targets_min": 898 }, { "epoch": 0.09113924050632911, "grad_norm": 0.34597741271059124, "learning_rate": 7.206477732793523e-06, "loss": 0.3564, "loss_nan_ranks": 0, "loss_rank_avg": 0.17021265625953674, "step": 90, "valid_targets_mean": 5033.3, "valid_targets_min": 886 }, { "epoch": 0.09620253164556962, "grad_norm": 0.3172791695402959, "learning_rate": 7.611336032388664e-06, "loss": 0.3739, "loss_nan_ranks": 0, "loss_rank_avg": 0.16697894036769867, "step": 95, "valid_targets_mean": 5135.7, "valid_targets_min": 776 }, { "epoch": 0.10126582278481013, "grad_norm": 0.3605571673212477, "learning_rate": 8.016194331983806e-06, "loss": 0.3609, "loss_nan_ranks": 0, "loss_rank_avg": 0.17649498581886292, "step": 100, "valid_targets_mean": 4052.9, "valid_targets_min": 1407 }, { "epoch": 0.10632911392405063, "grad_norm": 0.3126393081213533, "learning_rate": 8.421052631578948e-06, "loss": 0.3512, "loss_nan_ranks": 0, "loss_rank_avg": 0.14957275986671448, "step": 105, "valid_targets_mean": 4704.9, "valid_targets_min": 1914 }, { "epoch": 0.11139240506329114, "grad_norm": 0.3531313178759686, "learning_rate": 8.82591093117409e-06, "loss": 0.3726, "loss_nan_ranks": 0, "loss_rank_avg": 0.16743913292884827, "step": 110, "valid_targets_mean": 3947.0, "valid_targets_min": 1052 }, { "epoch": 0.11645569620253164, "grad_norm": 0.361312795641348, "learning_rate": 9.230769230769232e-06, "loss": 0.3633, "loss_nan_ranks": 0, "loss_rank_avg": 0.1453179121017456, "step": 115, "valid_targets_mean": 2979.1, "valid_targets_min": 1042 }, { "epoch": 0.12151898734177215, "grad_norm": 0.3118010440427671, "learning_rate": 9.635627530364373e-06, "loss": 0.3533, "loss_nan_ranks": 0, "loss_rank_avg": 0.1923716962337494, "step": 120, "valid_targets_mean": 5371.9, "valid_targets_min": 1279 }, { "epoch": 0.12658227848101267, "grad_norm": 0.35948459926380516, "learning_rate": 1.0040485829959515e-05, "loss": 0.348, "loss_nan_ranks": 0, "loss_rank_avg": 0.2048473060131073, "step": 125, "valid_targets_mean": 4750.8, "valid_targets_min": 990 }, { "epoch": 0.13164556962025317, "grad_norm": 0.31537572490184773, "learning_rate": 1.0445344129554658e-05, "loss": 0.3713, "loss_nan_ranks": 0, "loss_rank_avg": 0.20135825872421265, "step": 130, "valid_targets_mean": 4831.9, "valid_targets_min": 1663 }, { "epoch": 0.13670886075949368, "grad_norm": 0.36436085249069955, "learning_rate": 1.0850202429149799e-05, "loss": 0.3511, "loss_nan_ranks": 0, "loss_rank_avg": 0.21216928958892822, "step": 135, "valid_targets_mean": 4523.4, "valid_targets_min": 1238 }, { "epoch": 0.14177215189873418, "grad_norm": 0.3366824015027373, "learning_rate": 1.1255060728744939e-05, "loss": 0.3567, "loss_nan_ranks": 0, "loss_rank_avg": 0.17111346125602722, "step": 140, "valid_targets_mean": 3792.1, "valid_targets_min": 1100 }, { "epoch": 0.1468354430379747, "grad_norm": 0.35533807007148477, "learning_rate": 1.1659919028340081e-05, "loss": 0.3589, "loss_nan_ranks": 0, "loss_rank_avg": 0.1642487645149231, "step": 145, "valid_targets_mean": 4016.7, "valid_targets_min": 1556 }, { "epoch": 0.1518987341772152, "grad_norm": 0.31790675871917146, "learning_rate": 1.2064777327935225e-05, "loss": 0.3429, "loss_nan_ranks": 0, "loss_rank_avg": 0.197759211063385, "step": 150, "valid_targets_mean": 5829.0, "valid_targets_min": 1509 }, { "epoch": 0.1569620253164557, "grad_norm": 0.32375174058174566, "learning_rate": 1.2469635627530365e-05, "loss": 0.3571, "loss_nan_ranks": 0, "loss_rank_avg": 0.1860826313495636, "step": 155, "valid_targets_mean": 4697.8, "valid_targets_min": 1042 }, { "epoch": 0.1620253164556962, "grad_norm": 0.971603737593077, "learning_rate": 1.2874493927125507e-05, "loss": 0.3655, "loss_nan_ranks": 0, "loss_rank_avg": 0.2078309953212738, "step": 160, "valid_targets_mean": 5384.2, "valid_targets_min": 1144 }, { "epoch": 0.1670886075949367, "grad_norm": 0.47966039195161064, "learning_rate": 1.327935222672065e-05, "loss": 0.3588, "loss_nan_ranks": 0, "loss_rank_avg": 0.18700364232063293, "step": 165, "valid_targets_mean": 4719.9, "valid_targets_min": 1071 }, { "epoch": 0.17215189873417722, "grad_norm": 0.2955436571363374, "learning_rate": 1.3684210526315791e-05, "loss": 0.3413, "loss_nan_ranks": 0, "loss_rank_avg": 0.16040512919425964, "step": 170, "valid_targets_mean": 5175.4, "valid_targets_min": 1035 }, { "epoch": 0.17721518987341772, "grad_norm": 0.2909056024011537, "learning_rate": 1.4089068825910932e-05, "loss": 0.3611, "loss_nan_ranks": 0, "loss_rank_avg": 0.14239881932735443, "step": 175, "valid_targets_mean": 4601.9, "valid_targets_min": 1236 }, { "epoch": 0.18227848101265823, "grad_norm": 0.3684074269197893, "learning_rate": 1.4493927125506074e-05, "loss": 0.3607, "loss_nan_ranks": 0, "loss_rank_avg": 0.17205636203289032, "step": 180, "valid_targets_mean": 3363.9, "valid_targets_min": 899 }, { "epoch": 0.18734177215189873, "grad_norm": 0.2978543096994537, "learning_rate": 1.4898785425101216e-05, "loss": 0.3606, "loss_nan_ranks": 0, "loss_rank_avg": 0.1950611174106598, "step": 185, "valid_targets_mean": 5937.9, "valid_targets_min": 1368 }, { "epoch": 0.19240506329113924, "grad_norm": 0.30414263404359004, "learning_rate": 1.5303643724696356e-05, "loss": 0.3478, "loss_nan_ranks": 0, "loss_rank_avg": 0.18548183143138885, "step": 190, "valid_targets_mean": 5815.7, "valid_targets_min": 1087 }, { "epoch": 0.19746835443037974, "grad_norm": 0.3751151244554016, "learning_rate": 1.5708502024291498e-05, "loss": 0.3638, "loss_nan_ranks": 0, "loss_rank_avg": 0.2703745365142822, "step": 195, "valid_targets_mean": 5632.3, "valid_targets_min": 1444 }, { "epoch": 0.20253164556962025, "grad_norm": 0.3183245241372493, "learning_rate": 1.6113360323886644e-05, "loss": 0.3597, "loss_nan_ranks": 0, "loss_rank_avg": 0.15712594985961914, "step": 200, "valid_targets_mean": 4035.7, "valid_targets_min": 1064 }, { "epoch": 0.20759493670886076, "grad_norm": 0.3632627857891178, "learning_rate": 1.6518218623481782e-05, "loss": 0.3525, "loss_nan_ranks": 0, "loss_rank_avg": 0.17240820825099945, "step": 205, "valid_targets_mean": 4021.2, "valid_targets_min": 1114 }, { "epoch": 0.21265822784810126, "grad_norm": 0.34057034041346584, "learning_rate": 1.6923076923076924e-05, "loss": 0.3621, "loss_nan_ranks": 0, "loss_rank_avg": 0.22665713727474213, "step": 210, "valid_targets_mean": 5157.8, "valid_targets_min": 1706 }, { "epoch": 0.21772151898734177, "grad_norm": 0.32892662546524415, "learning_rate": 1.7327935222672066e-05, "loss": 0.3516, "loss_nan_ranks": 0, "loss_rank_avg": 0.1358383297920227, "step": 215, "valid_targets_mean": 3612.9, "valid_targets_min": 1015 }, { "epoch": 0.22278481012658227, "grad_norm": 0.3323805458845017, "learning_rate": 1.7732793522267208e-05, "loss": 0.3405, "loss_nan_ranks": 0, "loss_rank_avg": 0.14480899274349213, "step": 220, "valid_targets_mean": 6220.1, "valid_targets_min": 1090 }, { "epoch": 0.22784810126582278, "grad_norm": 0.2969456771010524, "learning_rate": 1.813765182186235e-05, "loss": 0.345, "loss_nan_ranks": 0, "loss_rank_avg": 0.16806533932685852, "step": 225, "valid_targets_mean": 5594.2, "valid_targets_min": 1290 }, { "epoch": 0.23291139240506328, "grad_norm": 0.35442807757680916, "learning_rate": 1.8542510121457492e-05, "loss": 0.3466, "loss_nan_ranks": 0, "loss_rank_avg": 0.20088203251361847, "step": 230, "valid_targets_mean": 4364.5, "valid_targets_min": 1537 }, { "epoch": 0.2379746835443038, "grad_norm": 0.32766837251688363, "learning_rate": 1.894736842105263e-05, "loss": 0.3597, "loss_nan_ranks": 0, "loss_rank_avg": 0.12136702239513397, "step": 235, "valid_targets_mean": 2704.7, "valid_targets_min": 1252 }, { "epoch": 0.2430379746835443, "grad_norm": 0.3298038015043137, "learning_rate": 1.9352226720647776e-05, "loss": 0.3312, "loss_nan_ranks": 0, "loss_rank_avg": 0.17166192829608917, "step": 240, "valid_targets_mean": 4605.7, "valid_targets_min": 1445 }, { "epoch": 0.2481012658227848, "grad_norm": 0.2811058024334916, "learning_rate": 1.9757085020242915e-05, "loss": 0.3647, "loss_nan_ranks": 0, "loss_rank_avg": 0.17767693102359772, "step": 245, "valid_targets_mean": 5949.4, "valid_targets_min": 992 }, { "epoch": 0.25316455696202533, "grad_norm": 0.3238895469625763, "learning_rate": 2.016194331983806e-05, "loss": 0.3542, "loss_nan_ranks": 0, "loss_rank_avg": 0.1756962537765503, "step": 250, "valid_targets_mean": 4702.4, "valid_targets_min": 1101 }, { "epoch": 0.2582278481012658, "grad_norm": 0.30654096002239845, "learning_rate": 2.05668016194332e-05, "loss": 0.3556, "loss_nan_ranks": 0, "loss_rank_avg": 0.18253913521766663, "step": 255, "valid_targets_mean": 5601.0, "valid_targets_min": 977 }, { "epoch": 0.26329113924050634, "grad_norm": 0.33818696625352207, "learning_rate": 2.097165991902834e-05, "loss": 0.3604, "loss_nan_ranks": 0, "loss_rank_avg": 0.20197951793670654, "step": 260, "valid_targets_mean": 4999.4, "valid_targets_min": 859 }, { "epoch": 0.2683544303797468, "grad_norm": 0.3221593835641881, "learning_rate": 2.1376518218623487e-05, "loss": 0.3356, "loss_nan_ranks": 0, "loss_rank_avg": 0.1421291083097458, "step": 265, "valid_targets_mean": 3732.8, "valid_targets_min": 1159 }, { "epoch": 0.27341772151898736, "grad_norm": 0.3467001085595146, "learning_rate": 2.1781376518218625e-05, "loss": 0.3541, "loss_nan_ranks": 0, "loss_rank_avg": 0.19689059257507324, "step": 270, "valid_targets_mean": 4544.8, "valid_targets_min": 1627 }, { "epoch": 0.27848101265822783, "grad_norm": 0.3893966405259359, "learning_rate": 2.2186234817813767e-05, "loss": 0.3502, "loss_nan_ranks": 0, "loss_rank_avg": 0.17629346251487732, "step": 275, "valid_targets_mean": 3116.6, "valid_targets_min": 1066 }, { "epoch": 0.28354430379746837, "grad_norm": 0.34248011251805455, "learning_rate": 2.2591093117408906e-05, "loss": 0.3517, "loss_nan_ranks": 0, "loss_rank_avg": 0.1394365131855011, "step": 280, "valid_targets_mean": 3400.1, "valid_targets_min": 1015 }, { "epoch": 0.28860759493670884, "grad_norm": 0.34292015860444375, "learning_rate": 2.299595141700405e-05, "loss": 0.3441, "loss_nan_ranks": 0, "loss_rank_avg": 0.18773144483566284, "step": 285, "valid_targets_mean": 4286.1, "valid_targets_min": 1425 }, { "epoch": 0.2936708860759494, "grad_norm": 0.3527832328000518, "learning_rate": 2.3400809716599193e-05, "loss": 0.3441, "loss_nan_ranks": 0, "loss_rank_avg": 0.18093225359916687, "step": 290, "valid_targets_mean": 4568.9, "valid_targets_min": 1281 }, { "epoch": 0.29873417721518986, "grad_norm": 0.3222755455970598, "learning_rate": 2.3805668016194332e-05, "loss": 0.3363, "loss_nan_ranks": 0, "loss_rank_avg": 0.13850252330303192, "step": 295, "valid_targets_mean": 3603.9, "valid_targets_min": 1101 }, { "epoch": 0.3037974683544304, "grad_norm": 0.3081645393207173, "learning_rate": 2.4210526315789474e-05, "loss": 0.3523, "loss_nan_ranks": 0, "loss_rank_avg": 0.1911936104297638, "step": 300, "valid_targets_mean": 6009.3, "valid_targets_min": 840 }, { "epoch": 0.30886075949367087, "grad_norm": 0.29187368241351513, "learning_rate": 2.461538461538462e-05, "loss": 0.3484, "loss_nan_ranks": 0, "loss_rank_avg": 0.17911839485168457, "step": 305, "valid_targets_mean": 7036.5, "valid_targets_min": 1310 }, { "epoch": 0.3139240506329114, "grad_norm": 0.49985981352299386, "learning_rate": 2.5020242914979758e-05, "loss": 0.3363, "loss_nan_ranks": 0, "loss_rank_avg": 0.16296392679214478, "step": 310, "valid_targets_mean": 3887.8, "valid_targets_min": 1192 }, { "epoch": 0.3189873417721519, "grad_norm": 0.38261294484090613, "learning_rate": 2.54251012145749e-05, "loss": 0.3454, "loss_nan_ranks": 0, "loss_rank_avg": 0.15782615542411804, "step": 315, "valid_targets_mean": 3376.2, "valid_targets_min": 1185 }, { "epoch": 0.3240506329113924, "grad_norm": 0.45061664130339874, "learning_rate": 2.5829959514170046e-05, "loss": 0.3502, "loss_nan_ranks": 0, "loss_rank_avg": 0.1975603699684143, "step": 320, "valid_targets_mean": 5570.6, "valid_targets_min": 1866 }, { "epoch": 0.3291139240506329, "grad_norm": 0.3182602149268292, "learning_rate": 2.6234817813765184e-05, "loss": 0.3351, "loss_nan_ranks": 0, "loss_rank_avg": 0.14342699944972992, "step": 325, "valid_targets_mean": 3784.2, "valid_targets_min": 849 }, { "epoch": 0.3341772151898734, "grad_norm": 0.3254644437199896, "learning_rate": 2.6639676113360326e-05, "loss": 0.3501, "loss_nan_ranks": 0, "loss_rank_avg": 0.16729095578193665, "step": 330, "valid_targets_mean": 3966.9, "valid_targets_min": 1392 }, { "epoch": 0.3392405063291139, "grad_norm": 0.32206841245268697, "learning_rate": 2.704453441295547e-05, "loss": 0.3476, "loss_nan_ranks": 0, "loss_rank_avg": 0.1826034039258957, "step": 335, "valid_targets_mean": 4157.9, "valid_targets_min": 1092 }, { "epoch": 0.34430379746835443, "grad_norm": 0.3602273548100487, "learning_rate": 2.744939271255061e-05, "loss": 0.3625, "loss_nan_ranks": 0, "loss_rank_avg": 0.2222571074962616, "step": 340, "valid_targets_mean": 4895.1, "valid_targets_min": 1074 }, { "epoch": 0.3493670886075949, "grad_norm": 0.3392767743330912, "learning_rate": 2.7854251012145752e-05, "loss": 0.3455, "loss_nan_ranks": 0, "loss_rank_avg": 0.13851270079612732, "step": 345, "valid_targets_mean": 3250.4, "valid_targets_min": 1001 }, { "epoch": 0.35443037974683544, "grad_norm": 0.32803869222957094, "learning_rate": 2.825910931174089e-05, "loss": 0.362, "loss_nan_ranks": 0, "loss_rank_avg": 0.18585026264190674, "step": 350, "valid_targets_mean": 4607.0, "valid_targets_min": 1164 }, { "epoch": 0.3594936708860759, "grad_norm": 0.2960837838285842, "learning_rate": 2.8663967611336033e-05, "loss": 0.3539, "loss_nan_ranks": 0, "loss_rank_avg": 0.23394142091274261, "step": 355, "valid_targets_mean": 8210.9, "valid_targets_min": 1637 }, { "epoch": 0.36455696202531646, "grad_norm": 0.3694811833098562, "learning_rate": 2.906882591093118e-05, "loss": 0.3468, "loss_nan_ranks": 0, "loss_rank_avg": 0.16552570462226868, "step": 360, "valid_targets_mean": 2960.9, "valid_targets_min": 1184 }, { "epoch": 0.369620253164557, "grad_norm": 0.31999701209701786, "learning_rate": 2.9473684210526317e-05, "loss": 0.3466, "loss_nan_ranks": 0, "loss_rank_avg": 0.16295602917671204, "step": 365, "valid_targets_mean": 3841.0, "valid_targets_min": 1068 }, { "epoch": 0.37468354430379747, "grad_norm": 0.29571436256727346, "learning_rate": 2.987854251012146e-05, "loss": 0.3567, "loss_nan_ranks": 0, "loss_rank_avg": 0.19385173916816711, "step": 370, "valid_targets_mean": 5434.1, "valid_targets_min": 904 }, { "epoch": 0.379746835443038, "grad_norm": 0.2794237498150064, "learning_rate": 3.0283400809716605e-05, "loss": 0.3384, "loss_nan_ranks": 0, "loss_rank_avg": 0.17324280738830566, "step": 375, "valid_targets_mean": 6533.0, "valid_targets_min": 914 }, { "epoch": 0.3848101265822785, "grad_norm": 0.46097531086569304, "learning_rate": 3.068825910931174e-05, "loss": 0.3441, "loss_nan_ranks": 0, "loss_rank_avg": 0.1612202525138855, "step": 380, "valid_targets_mean": 4019.0, "valid_targets_min": 1578 }, { "epoch": 0.389873417721519, "grad_norm": 0.33386509179906093, "learning_rate": 3.1093117408906885e-05, "loss": 0.3495, "loss_nan_ranks": 0, "loss_rank_avg": 0.14520494639873505, "step": 385, "valid_targets_mean": 3415.9, "valid_targets_min": 1118 }, { "epoch": 0.3949367088607595, "grad_norm": 0.3319526543378725, "learning_rate": 3.149797570850203e-05, "loss": 0.3487, "loss_nan_ranks": 0, "loss_rank_avg": 0.1795864999294281, "step": 390, "valid_targets_mean": 4239.8, "valid_targets_min": 991 }, { "epoch": 0.4, "grad_norm": 0.3406949335779596, "learning_rate": 3.190283400809717e-05, "loss": 0.3384, "loss_nan_ranks": 0, "loss_rank_avg": 0.16871468722820282, "step": 395, "valid_targets_mean": 3474.5, "valid_targets_min": 1133 }, { "epoch": 0.4050632911392405, "grad_norm": 0.36838681719013816, "learning_rate": 3.230769230769231e-05, "loss": 0.3522, "loss_nan_ranks": 0, "loss_rank_avg": 0.1932060271501541, "step": 400, "valid_targets_mean": 3488.6, "valid_targets_min": 1164 }, { "epoch": 0.41012658227848103, "grad_norm": 0.35042164458126773, "learning_rate": 3.271255060728745e-05, "loss": 0.3588, "loss_nan_ranks": 0, "loss_rank_avg": 0.17853647470474243, "step": 405, "valid_targets_mean": 3956.2, "valid_targets_min": 1293 }, { "epoch": 0.4151898734177215, "grad_norm": 0.3489327841744588, "learning_rate": 3.311740890688259e-05, "loss": 0.3585, "loss_nan_ranks": 0, "loss_rank_avg": 0.16795890033245087, "step": 410, "valid_targets_mean": 3783.9, "valid_targets_min": 1206 }, { "epoch": 0.42025316455696204, "grad_norm": 0.3454446525690692, "learning_rate": 3.352226720647774e-05, "loss": 0.3516, "loss_nan_ranks": 0, "loss_rank_avg": 0.2117060422897339, "step": 415, "valid_targets_mean": 4945.9, "valid_targets_min": 1096 }, { "epoch": 0.4253164556962025, "grad_norm": 0.3098825126338765, "learning_rate": 3.3927125506072876e-05, "loss": 0.3574, "loss_nan_ranks": 0, "loss_rank_avg": 0.20046228170394897, "step": 420, "valid_targets_mean": 6020.4, "valid_targets_min": 1220 }, { "epoch": 0.43037974683544306, "grad_norm": 0.37532962252838115, "learning_rate": 3.433198380566802e-05, "loss": 0.3467, "loss_nan_ranks": 0, "loss_rank_avg": 0.1575276255607605, "step": 425, "valid_targets_mean": 3148.8, "valid_targets_min": 1434 }, { "epoch": 0.43544303797468353, "grad_norm": 0.41731233709453813, "learning_rate": 3.473684210526316e-05, "loss": 0.3536, "loss_nan_ranks": 0, "loss_rank_avg": 0.18151873350143433, "step": 430, "valid_targets_mean": 4121.1, "valid_targets_min": 882 }, { "epoch": 0.44050632911392407, "grad_norm": 0.2834549547224196, "learning_rate": 3.51417004048583e-05, "loss": 0.3347, "loss_nan_ranks": 0, "loss_rank_avg": 0.21482950448989868, "step": 435, "valid_targets_mean": 7190.4, "valid_targets_min": 980 }, { "epoch": 0.44556962025316454, "grad_norm": 0.30073688146062255, "learning_rate": 3.5546558704453444e-05, "loss": 0.3511, "loss_nan_ranks": 0, "loss_rank_avg": 0.1362500786781311, "step": 440, "valid_targets_mean": 4360.6, "valid_targets_min": 1118 }, { "epoch": 0.4506329113924051, "grad_norm": 0.3750594432228394, "learning_rate": 3.595141700404859e-05, "loss": 0.3531, "loss_nan_ranks": 0, "loss_rank_avg": 0.20675930380821228, "step": 445, "valid_targets_mean": 4531.2, "valid_targets_min": 1680 }, { "epoch": 0.45569620253164556, "grad_norm": 0.3568782095433956, "learning_rate": 3.635627530364373e-05, "loss": 0.3454, "loss_nan_ranks": 0, "loss_rank_avg": 0.17187099158763885, "step": 450, "valid_targets_mean": 4279.3, "valid_targets_min": 1210 }, { "epoch": 0.4607594936708861, "grad_norm": 0.31010973542926373, "learning_rate": 3.676113360323887e-05, "loss": 0.349, "loss_nan_ranks": 0, "loss_rank_avg": 0.1888793706893921, "step": 455, "valid_targets_mean": 5464.9, "valid_targets_min": 540 }, { "epoch": 0.46582278481012657, "grad_norm": 0.30672819186326156, "learning_rate": 3.716599190283401e-05, "loss": 0.3369, "loss_nan_ranks": 0, "loss_rank_avg": 0.19805072247982025, "step": 460, "valid_targets_mean": 5570.1, "valid_targets_min": 1257 }, { "epoch": 0.4708860759493671, "grad_norm": 0.33237701694635524, "learning_rate": 3.757085020242915e-05, "loss": 0.3443, "loss_nan_ranks": 0, "loss_rank_avg": 0.17327673733234406, "step": 465, "valid_targets_mean": 4441.7, "valid_targets_min": 1062 }, { "epoch": 0.4759493670886076, "grad_norm": 0.3157269440092307, "learning_rate": 3.7975708502024296e-05, "loss": 0.3523, "loss_nan_ranks": 0, "loss_rank_avg": 0.2036791741847992, "step": 470, "valid_targets_mean": 5480.2, "valid_targets_min": 1147 }, { "epoch": 0.4810126582278481, "grad_norm": 0.3385448591385259, "learning_rate": 3.8380566801619435e-05, "loss": 0.3254, "loss_nan_ranks": 0, "loss_rank_avg": 0.18548253178596497, "step": 475, "valid_targets_mean": 5158.2, "valid_targets_min": 1322 }, { "epoch": 0.4860759493670886, "grad_norm": 0.3229813339259753, "learning_rate": 3.878542510121458e-05, "loss": 0.3539, "loss_nan_ranks": 0, "loss_rank_avg": 0.19486048817634583, "step": 480, "valid_targets_mean": 5207.5, "valid_targets_min": 1234 }, { "epoch": 0.4911392405063291, "grad_norm": 0.39888632177896866, "learning_rate": 3.919028340080972e-05, "loss": 0.3367, "loss_nan_ranks": 0, "loss_rank_avg": 0.15041330456733704, "step": 485, "valid_targets_mean": 2910.4, "valid_targets_min": 826 }, { "epoch": 0.4962025316455696, "grad_norm": 0.3216838457166851, "learning_rate": 3.959514170040486e-05, "loss": 0.3535, "loss_nan_ranks": 0, "loss_rank_avg": 0.18031927943229675, "step": 490, "valid_targets_mean": 5146.9, "valid_targets_min": 1318 }, { "epoch": 0.5012658227848101, "grad_norm": 0.3463812343689675, "learning_rate": 4e-05, "loss": 0.3538, "loss_nan_ranks": 0, "loss_rank_avg": 0.13655783236026764, "step": 495, "valid_targets_mean": 3592.6, "valid_targets_min": 977 }, { "epoch": 0.5063291139240507, "grad_norm": 0.36468197040198047, "learning_rate": 3.999987517534179e-05, "loss": 0.3298, "loss_nan_ranks": 0, "loss_rank_avg": 0.17994073033332825, "step": 500, "valid_targets_mean": 3419.4, "valid_targets_min": 997 }, { "epoch": 0.5113924050632911, "grad_norm": 0.3123011360513197, "learning_rate": 3.999950070292526e-05, "loss": 0.3514, "loss_nan_ranks": 0, "loss_rank_avg": 0.13850685954093933, "step": 505, "valid_targets_mean": 4406.6, "valid_targets_min": 1006 }, { "epoch": 0.5164556962025316, "grad_norm": 0.3110207165348701, "learning_rate": 3.9998876587424764e-05, "loss": 0.3437, "loss_nan_ranks": 0, "loss_rank_avg": 0.13691280782222748, "step": 510, "valid_targets_mean": 4396.4, "valid_targets_min": 1417 }, { "epoch": 0.5215189873417722, "grad_norm": 0.32363025722531935, "learning_rate": 3.99980028366308e-05, "loss": 0.3569, "loss_nan_ranks": 0, "loss_rank_avg": 0.24637667834758759, "step": 515, "valid_targets_mean": 5892.6, "valid_targets_min": 1208 }, { "epoch": 0.5265822784810127, "grad_norm": 0.3650846632854969, "learning_rate": 3.999687946144992e-05, "loss": 0.3581, "loss_nan_ranks": 0, "loss_rank_avg": 0.18719391524791718, "step": 520, "valid_targets_mean": 4166.3, "valid_targets_min": 1384 }, { "epoch": 0.5316455696202531, "grad_norm": 0.380513757297641, "learning_rate": 3.999550647590464e-05, "loss": 0.3508, "loss_nan_ranks": 0, "loss_rank_avg": 0.21175450086593628, "step": 525, "valid_targets_mean": 3908.1, "valid_targets_min": 1057 }, { "epoch": 0.5367088607594936, "grad_norm": 0.3303089638050748, "learning_rate": 3.9993883897133174e-05, "loss": 0.3344, "loss_nan_ranks": 0, "loss_rank_avg": 0.1324310302734375, "step": 530, "valid_targets_mean": 3035.0, "valid_targets_min": 1176 }, { "epoch": 0.5417721518987342, "grad_norm": 0.3065345335498946, "learning_rate": 3.9992011745389335e-05, "loss": 0.3564, "loss_nan_ranks": 0, "loss_rank_avg": 0.18349391222000122, "step": 535, "valid_targets_mean": 5569.8, "valid_targets_min": 1419 }, { "epoch": 0.5468354430379747, "grad_norm": 0.3593697878507127, "learning_rate": 3.998989004404217e-05, "loss": 0.3477, "loss_nan_ranks": 0, "loss_rank_avg": 0.1619454324245453, "step": 540, "valid_targets_mean": 3932.5, "valid_targets_min": 1196 }, { "epoch": 0.5518987341772152, "grad_norm": 0.25234558053757633, "learning_rate": 3.998751881957576e-05, "loss": 0.3363, "loss_nan_ranks": 0, "loss_rank_avg": 0.16338235139846802, "step": 545, "valid_targets_mean": 5379.0, "valid_targets_min": 977 }, { "epoch": 0.5569620253164557, "grad_norm": 0.3445664068863559, "learning_rate": 3.998489810158883e-05, "loss": 0.3475, "loss_nan_ranks": 0, "loss_rank_avg": 0.1785704791545868, "step": 550, "valid_targets_mean": 3962.2, "valid_targets_min": 1209 }, { "epoch": 0.5620253164556962, "grad_norm": 0.3556936347323425, "learning_rate": 3.99820279227944e-05, "loss": 0.3345, "loss_nan_ranks": 0, "loss_rank_avg": 0.18062683939933777, "step": 555, "valid_targets_mean": 4593.2, "valid_targets_min": 1615 }, { "epoch": 0.5670886075949367, "grad_norm": 0.3792686598578621, "learning_rate": 3.997890831901938e-05, "loss": 0.3413, "loss_nan_ranks": 0, "loss_rank_avg": 0.19577497243881226, "step": 560, "valid_targets_mean": 4658.2, "valid_targets_min": 1474 }, { "epoch": 0.5721518987341773, "grad_norm": 0.32913492636939423, "learning_rate": 3.9975539329204116e-05, "loss": 0.3387, "loss_nan_ranks": 0, "loss_rank_avg": 0.17351575195789337, "step": 565, "valid_targets_mean": 4210.6, "valid_targets_min": 743 }, { "epoch": 0.5772151898734177, "grad_norm": 0.296950123523885, "learning_rate": 3.9971920995401905e-05, "loss": 0.3443, "loss_nan_ranks": 0, "loss_rank_avg": 0.20880410075187683, "step": 570, "valid_targets_mean": 6590.1, "valid_targets_min": 1899 }, { "epoch": 0.5822784810126582, "grad_norm": 0.34173998557875557, "learning_rate": 3.996805336277848e-05, "loss": 0.3508, "loss_nan_ranks": 0, "loss_rank_avg": 0.1291336864233017, "step": 575, "valid_targets_mean": 4007.8, "valid_targets_min": 1380 }, { "epoch": 0.5873417721518988, "grad_norm": 0.30049566187413324, "learning_rate": 3.996393647961143e-05, "loss": 0.34, "loss_nan_ranks": 0, "loss_rank_avg": 0.13710632920265198, "step": 580, "valid_targets_mean": 4320.4, "valid_targets_min": 1110 }, { "epoch": 0.5924050632911393, "grad_norm": 0.3451273067980245, "learning_rate": 3.995957039728962e-05, "loss": 0.3456, "loss_nan_ranks": 0, "loss_rank_avg": 0.18673017621040344, "step": 585, "valid_targets_mean": 4318.7, "valid_targets_min": 1318 }, { "epoch": 0.5974683544303797, "grad_norm": 0.3248655593711836, "learning_rate": 3.9954955170312504e-05, "loss": 0.335, "loss_nan_ranks": 0, "loss_rank_avg": 0.15301413834095, "step": 590, "valid_targets_mean": 4103.9, "valid_targets_min": 1260 }, { "epoch": 0.6025316455696202, "grad_norm": 0.3874469407061254, "learning_rate": 3.995009085628951e-05, "loss": 0.3417, "loss_nan_ranks": 0, "loss_rank_avg": 0.17825846374034882, "step": 595, "valid_targets_mean": 3280.8, "valid_targets_min": 1303 }, { "epoch": 0.6075949367088608, "grad_norm": 0.32514023580791557, "learning_rate": 3.994497751593927e-05, "loss": 0.3417, "loss_nan_ranks": 0, "loss_rank_avg": 0.17784975469112396, "step": 600, "valid_targets_mean": 4897.2, "valid_targets_min": 1343 }, { "epoch": 0.6126582278481013, "grad_norm": 0.32015309031323297, "learning_rate": 3.9939615213088865e-05, "loss": 0.3461, "loss_nan_ranks": 0, "loss_rank_avg": 0.1702687293291092, "step": 605, "valid_targets_mean": 5160.1, "valid_targets_min": 787 }, { "epoch": 0.6177215189873417, "grad_norm": 0.29531423820767827, "learning_rate": 3.993400401467308e-05, "loss": 0.362, "loss_nan_ranks": 0, "loss_rank_avg": 0.1590127795934677, "step": 610, "valid_targets_mean": 5178.2, "valid_targets_min": 1187 }, { "epoch": 0.6227848101265823, "grad_norm": 0.30956228742996816, "learning_rate": 3.992814399073349e-05, "loss": 0.3358, "loss_nan_ranks": 0, "loss_rank_avg": 0.1777225136756897, "step": 615, "valid_targets_mean": 5224.1, "valid_targets_min": 1044 }, { "epoch": 0.6278481012658228, "grad_norm": 0.2946569197224124, "learning_rate": 3.992203521441765e-05, "loss": 0.3566, "loss_nan_ranks": 0, "loss_rank_avg": 0.16454584896564484, "step": 620, "valid_targets_mean": 5873.6, "valid_targets_min": 1522 }, { "epoch": 0.6329113924050633, "grad_norm": 0.3566548256792116, "learning_rate": 3.991567776197815e-05, "loss": 0.3423, "loss_nan_ranks": 0, "loss_rank_avg": 0.1757839322090149, "step": 625, "valid_targets_mean": 5280.0, "valid_targets_min": 1179 }, { "epoch": 0.6379746835443038, "grad_norm": 0.34702302453822725, "learning_rate": 3.990907171277168e-05, "loss": 0.3406, "loss_nan_ranks": 0, "loss_rank_avg": 0.16491375863552094, "step": 630, "valid_targets_mean": 3738.1, "valid_targets_min": 1437 }, { "epoch": 0.6430379746835443, "grad_norm": 0.3122025130697409, "learning_rate": 3.990221714925802e-05, "loss": 0.3425, "loss_nan_ranks": 0, "loss_rank_avg": 0.19272474944591522, "step": 635, "valid_targets_mean": 5090.6, "valid_targets_min": 858 }, { "epoch": 0.6481012658227848, "grad_norm": 0.3289259973223097, "learning_rate": 3.989511415699901e-05, "loss": 0.3492, "loss_nan_ranks": 0, "loss_rank_avg": 0.21416299045085907, "step": 640, "valid_targets_mean": 5687.4, "valid_targets_min": 1558 }, { "epoch": 0.6531645569620254, "grad_norm": 0.31628182785649794, "learning_rate": 3.988776282465752e-05, "loss": 0.3472, "loss_nan_ranks": 0, "loss_rank_avg": 0.16229850053787231, "step": 645, "valid_targets_mean": 5641.7, "valid_targets_min": 1228 }, { "epoch": 0.6582278481012658, "grad_norm": 0.32370069272186214, "learning_rate": 3.9880163243996314e-05, "loss": 0.3439, "loss_nan_ranks": 0, "loss_rank_avg": 0.1790936440229416, "step": 650, "valid_targets_mean": 4757.5, "valid_targets_min": 828 }, { "epoch": 0.6632911392405063, "grad_norm": 0.331462646919884, "learning_rate": 3.9872315509876885e-05, "loss": 0.3465, "loss_nan_ranks": 0, "loss_rank_avg": 0.2034873068332672, "step": 655, "valid_targets_mean": 6825.2, "valid_targets_min": 1430 }, { "epoch": 0.6683544303797468, "grad_norm": 0.2773031962593845, "learning_rate": 3.986421972025831e-05, "loss": 0.3362, "loss_nan_ranks": 0, "loss_rank_avg": 0.13872382044792175, "step": 660, "valid_targets_mean": 5178.6, "valid_targets_min": 1303 }, { "epoch": 0.6734177215189874, "grad_norm": 0.3282605048208077, "learning_rate": 3.9855875976196e-05, "loss": 0.3336, "loss_nan_ranks": 0, "loss_rank_avg": 0.1442852020263672, "step": 665, "valid_targets_mean": 3767.0, "valid_targets_min": 1309 }, { "epoch": 0.6784810126582278, "grad_norm": 0.5817158484637879, "learning_rate": 3.984728438184047e-05, "loss": 0.348, "loss_nan_ranks": 0, "loss_rank_avg": 0.1867026388645172, "step": 670, "valid_targets_mean": 4197.3, "valid_targets_min": 1119 }, { "epoch": 0.6835443037974683, "grad_norm": 0.3539656970185502, "learning_rate": 3.9838445044435997e-05, "loss": 0.3543, "loss_nan_ranks": 0, "loss_rank_avg": 0.16187211871147156, "step": 675, "valid_targets_mean": 4067.3, "valid_targets_min": 1024 }, { "epoch": 0.6886075949367089, "grad_norm": 0.33229865798563013, "learning_rate": 3.9829358074319295e-05, "loss": 0.343, "loss_nan_ranks": 0, "loss_rank_avg": 0.17157503962516785, "step": 680, "valid_targets_mean": 4686.7, "valid_targets_min": 1496 }, { "epoch": 0.6936708860759494, "grad_norm": 0.2791093667927135, "learning_rate": 3.982002358491817e-05, "loss": 0.3385, "loss_nan_ranks": 0, "loss_rank_avg": 0.1936018466949463, "step": 685, "valid_targets_mean": 6395.1, "valid_targets_min": 1038 }, { "epoch": 0.6987341772151898, "grad_norm": 0.3350209099910488, "learning_rate": 3.981044169275006e-05, "loss": 0.3363, "loss_nan_ranks": 0, "loss_rank_avg": 0.1778436303138733, "step": 690, "valid_targets_mean": 4567.5, "valid_targets_min": 1080 }, { "epoch": 0.7037974683544304, "grad_norm": 0.3531099254353881, "learning_rate": 3.9800612517420626e-05, "loss": 0.3469, "loss_nan_ranks": 0, "loss_rank_avg": 0.16938315331935883, "step": 695, "valid_targets_mean": 3896.1, "valid_targets_min": 1641 }, { "epoch": 0.7088607594936709, "grad_norm": 0.318049795345604, "learning_rate": 3.979053618162219e-05, "loss": 0.3564, "loss_nan_ranks": 0, "loss_rank_avg": 0.1946740746498108, "step": 700, "valid_targets_mean": 5408.9, "valid_targets_min": 1410 }, { "epoch": 0.7139240506329114, "grad_norm": 0.3320763821369659, "learning_rate": 3.978021281113228e-05, "loss": 0.3393, "loss_nan_ranks": 0, "loss_rank_avg": 0.17016340792179108, "step": 705, "valid_targets_mean": 4967.0, "valid_targets_min": 882 }, { "epoch": 0.7189873417721518, "grad_norm": 0.2847828838514781, "learning_rate": 3.9769642534812e-05, "loss": 0.3414, "loss_nan_ranks": 0, "loss_rank_avg": 0.1707335114479065, "step": 710, "valid_targets_mean": 6450.3, "valid_targets_min": 1014 }, { "epoch": 0.7240506329113924, "grad_norm": 0.3321384385821899, "learning_rate": 3.9758825484604494e-05, "loss": 0.3447, "loss_nan_ranks": 0, "loss_rank_avg": 0.1961357295513153, "step": 715, "valid_targets_mean": 4652.9, "valid_targets_min": 1387 }, { "epoch": 0.7291139240506329, "grad_norm": 0.3032184720855355, "learning_rate": 3.9747761795533194e-05, "loss": 0.3451, "loss_nan_ranks": 0, "loss_rank_avg": 0.1426798403263092, "step": 720, "valid_targets_mean": 6012.8, "valid_targets_min": 1966 }, { "epoch": 0.7341772151898734, "grad_norm": 0.3448777606898466, "learning_rate": 3.973645160570023e-05, "loss": 0.3546, "loss_nan_ranks": 0, "loss_rank_avg": 0.1586744487285614, "step": 725, "valid_targets_mean": 4090.4, "valid_targets_min": 1678 }, { "epoch": 0.739240506329114, "grad_norm": 0.3156506831386379, "learning_rate": 3.9724895056284665e-05, "loss": 0.3376, "loss_nan_ranks": 0, "loss_rank_avg": 0.1619202196598053, "step": 730, "valid_targets_mean": 4218.2, "valid_targets_min": 1064 }, { "epoch": 0.7443037974683544, "grad_norm": 0.35504669537877936, "learning_rate": 3.971309229154072e-05, "loss": 0.3336, "loss_nan_ranks": 0, "loss_rank_avg": 0.21181583404541016, "step": 735, "valid_targets_mean": 4926.1, "valid_targets_min": 1207 }, { "epoch": 0.7493670886075949, "grad_norm": 0.3201734939222349, "learning_rate": 3.9701043458796015e-05, "loss": 0.3356, "loss_nan_ranks": 0, "loss_rank_avg": 0.22177475690841675, "step": 740, "valid_targets_mean": 6330.8, "valid_targets_min": 1448 }, { "epoch": 0.7544303797468355, "grad_norm": 0.3323013925433624, "learning_rate": 3.9688748708449686e-05, "loss": 0.3383, "loss_nan_ranks": 0, "loss_rank_avg": 0.15360356867313385, "step": 745, "valid_targets_mean": 4397.9, "valid_targets_min": 1528 }, { "epoch": 0.759493670886076, "grad_norm": 0.2700426394697059, "learning_rate": 3.967620819397053e-05, "loss": 0.3308, "loss_nan_ranks": 0, "loss_rank_avg": 0.15975482761859894, "step": 750, "valid_targets_mean": 5138.0, "valid_targets_min": 1494 }, { "epoch": 0.7645569620253164, "grad_norm": 0.32491869195537754, "learning_rate": 3.9663422071895103e-05, "loss": 0.3534, "loss_nan_ranks": 0, "loss_rank_avg": 0.1329491138458252, "step": 755, "valid_targets_mean": 3496.6, "valid_targets_min": 1333 }, { "epoch": 0.769620253164557, "grad_norm": 0.30201583766650153, "learning_rate": 3.965039050182573e-05, "loss": 0.3444, "loss_nan_ranks": 0, "loss_rank_avg": 0.17797686159610748, "step": 760, "valid_targets_mean": 5996.1, "valid_targets_min": 1405 }, { "epoch": 0.7746835443037975, "grad_norm": 0.28815946203036474, "learning_rate": 3.963711364642854e-05, "loss": 0.3397, "loss_nan_ranks": 0, "loss_rank_avg": 0.19754289090633392, "step": 765, "valid_targets_mean": 6895.8, "valid_targets_min": 1767 }, { "epoch": 0.779746835443038, "grad_norm": 0.3154202174762482, "learning_rate": 3.9623591671431416e-05, "loss": 0.355, "loss_nan_ranks": 0, "loss_rank_avg": 0.18379993736743927, "step": 770, "valid_targets_mean": 5009.2, "valid_targets_min": 1303 }, { "epoch": 0.7848101265822784, "grad_norm": 0.3575700176888927, "learning_rate": 3.960982474562196e-05, "loss": 0.3389, "loss_nan_ranks": 0, "loss_rank_avg": 0.17523907124996185, "step": 775, "valid_targets_mean": 4694.8, "valid_targets_min": 1661 }, { "epoch": 0.789873417721519, "grad_norm": 0.3310517991000096, "learning_rate": 3.959581304084536e-05, "loss": 0.345, "loss_nan_ranks": 0, "loss_rank_avg": 0.1610376238822937, "step": 780, "valid_targets_mean": 4332.1, "valid_targets_min": 863 }, { "epoch": 0.7949367088607595, "grad_norm": 0.31363025202931233, "learning_rate": 3.958155673200223e-05, "loss": 0.3547, "loss_nan_ranks": 0, "loss_rank_avg": 0.2106252908706665, "step": 785, "valid_targets_mean": 5876.1, "valid_targets_min": 1285 }, { "epoch": 0.8, "grad_norm": 0.2999707270623021, "learning_rate": 3.956705599704645e-05, "loss": 0.3307, "loss_nan_ranks": 0, "loss_rank_avg": 0.19507791101932526, "step": 790, "valid_targets_mean": 5528.2, "valid_targets_min": 1012 }, { "epoch": 0.8050632911392405, "grad_norm": 0.34798398865892316, "learning_rate": 3.9552311016982964e-05, "loss": 0.3301, "loss_nan_ranks": 0, "loss_rank_avg": 0.1592869609594345, "step": 795, "valid_targets_mean": 3994.4, "valid_targets_min": 1020 }, { "epoch": 0.810126582278481, "grad_norm": 0.3486093165843197, "learning_rate": 3.953732197586549e-05, "loss": 0.3299, "loss_nan_ranks": 0, "loss_rank_avg": 0.14387521147727966, "step": 800, "valid_targets_mean": 3136.8, "valid_targets_min": 969 }, { "epoch": 0.8151898734177215, "grad_norm": 0.34294729405636676, "learning_rate": 3.952208906079419e-05, "loss": 0.339, "loss_nan_ranks": 0, "loss_rank_avg": 0.14744120836257935, "step": 805, "valid_targets_mean": 3541.7, "valid_targets_min": 1023 }, { "epoch": 0.8202531645569621, "grad_norm": 0.29811481034198406, "learning_rate": 3.950661246191344e-05, "loss": 0.3327, "loss_nan_ranks": 0, "loss_rank_avg": 0.20451560616493225, "step": 810, "valid_targets_mean": 5959.1, "valid_targets_min": 1170 }, { "epoch": 0.8253164556962025, "grad_norm": 0.29859308801266926, "learning_rate": 3.949089237240933e-05, "loss": 0.3261, "loss_nan_ranks": 0, "loss_rank_avg": 0.17102043330669403, "step": 815, "valid_targets_mean": 5425.9, "valid_targets_min": 1281 }, { "epoch": 0.830379746835443, "grad_norm": 0.33822208957438105, "learning_rate": 3.947492898850736e-05, "loss": 0.3379, "loss_nan_ranks": 0, "loss_rank_avg": 0.12047713249921799, "step": 820, "valid_targets_mean": 2989.9, "valid_targets_min": 1525 }, { "epoch": 0.8354430379746836, "grad_norm": 0.30589016543655284, "learning_rate": 3.94587225094699e-05, "loss": 0.3466, "loss_nan_ranks": 0, "loss_rank_avg": 0.16248869895935059, "step": 825, "valid_targets_mean": 4684.8, "valid_targets_min": 1392 }, { "epoch": 0.8405063291139241, "grad_norm": 0.2936931469479608, "learning_rate": 3.94422731375938e-05, "loss": 0.3185, "loss_nan_ranks": 0, "loss_rank_avg": 0.12211855500936508, "step": 830, "valid_targets_mean": 3796.8, "valid_targets_min": 1392 }, { "epoch": 0.8455696202531645, "grad_norm": 0.37559686297102585, "learning_rate": 3.9425581078207764e-05, "loss": 0.3532, "loss_nan_ranks": 0, "loss_rank_avg": 0.12265650928020477, "step": 835, "valid_targets_mean": 2870.8, "valid_targets_min": 1300 }, { "epoch": 0.850632911392405, "grad_norm": 0.35124796916797185, "learning_rate": 3.940864653966985e-05, "loss": 0.3336, "loss_nan_ranks": 0, "loss_rank_avg": 0.1492408812046051, "step": 840, "valid_targets_mean": 3748.4, "valid_targets_min": 1108 }, { "epoch": 0.8556962025316456, "grad_norm": 0.3196010195709303, "learning_rate": 3.939146973336487e-05, "loss": 0.3411, "loss_nan_ranks": 0, "loss_rank_avg": 0.21070614457130432, "step": 845, "valid_targets_mean": 5815.2, "valid_targets_min": 1741 }, { "epoch": 0.8607594936708861, "grad_norm": 0.278654689286952, "learning_rate": 3.937405087370171e-05, "loss": 0.3373, "loss_nan_ranks": 0, "loss_rank_avg": 0.16281408071517944, "step": 850, "valid_targets_mean": 6301.6, "valid_targets_min": 1867 }, { "epoch": 0.8658227848101265, "grad_norm": 0.32174716361043904, "learning_rate": 3.9356390178110694e-05, "loss": 0.346, "loss_nan_ranks": 0, "loss_rank_avg": 0.11544165015220642, "step": 855, "valid_targets_mean": 3471.2, "valid_targets_min": 1247 }, { "epoch": 0.8708860759493671, "grad_norm": 0.31597886690897176, "learning_rate": 3.9338487867040855e-05, "loss": 0.3514, "loss_nan_ranks": 0, "loss_rank_avg": 0.1751353144645691, "step": 860, "valid_targets_mean": 4752.5, "valid_targets_min": 1271 }, { "epoch": 0.8759493670886076, "grad_norm": 0.3376382881344058, "learning_rate": 3.9320344163957177e-05, "loss": 0.3505, "loss_nan_ranks": 0, "loss_rank_avg": 0.1628148853778839, "step": 865, "valid_targets_mean": 4121.5, "valid_targets_min": 1412 }, { "epoch": 0.8810126582278481, "grad_norm": 0.3174487269237297, "learning_rate": 3.9301959295337816e-05, "loss": 0.3381, "loss_nan_ranks": 0, "loss_rank_avg": 0.19904953241348267, "step": 870, "valid_targets_mean": 6095.4, "valid_targets_min": 1694 }, { "epoch": 0.8860759493670886, "grad_norm": 0.29589750599326486, "learning_rate": 3.928333349067125e-05, "loss": 0.3319, "loss_nan_ranks": 0, "loss_rank_avg": 0.22740904986858368, "step": 875, "valid_targets_mean": 6433.5, "valid_targets_min": 979 }, { "epoch": 0.8911392405063291, "grad_norm": 0.28879537949688816, "learning_rate": 3.926446698245347e-05, "loss": 0.3262, "loss_nan_ranks": 0, "loss_rank_avg": 0.1922253668308258, "step": 880, "valid_targets_mean": 5540.3, "valid_targets_min": 1526 }, { "epoch": 0.8962025316455696, "grad_norm": 0.3183527697451739, "learning_rate": 3.924536000618501e-05, "loss": 0.3435, "loss_nan_ranks": 0, "loss_rank_avg": 0.1510843187570572, "step": 885, "valid_targets_mean": 4520.7, "valid_targets_min": 1446 }, { "epoch": 0.9012658227848102, "grad_norm": 0.3190560534322978, "learning_rate": 3.922601280036805e-05, "loss": 0.328, "loss_nan_ranks": 0, "loss_rank_avg": 0.19017574191093445, "step": 890, "valid_targets_mean": 4967.6, "valid_targets_min": 1199 }, { "epoch": 0.9063291139240506, "grad_norm": 0.4456031002758009, "learning_rate": 3.920642560650343e-05, "loss": 0.3351, "loss_nan_ranks": 0, "loss_rank_avg": 0.22871103882789612, "step": 895, "valid_targets_mean": 5971.6, "valid_targets_min": 1331 }, { "epoch": 0.9113924050632911, "grad_norm": 0.30090137054069316, "learning_rate": 3.918659866908762e-05, "loss": 0.3296, "loss_nan_ranks": 0, "loss_rank_avg": 0.15791599452495575, "step": 900, "valid_targets_mean": 5456.4, "valid_targets_min": 1469 }, { "epoch": 0.9164556962025316, "grad_norm": 0.33133512730966574, "learning_rate": 3.9166532235609695e-05, "loss": 0.3397, "loss_nan_ranks": 0, "loss_rank_avg": 0.21240505576133728, "step": 905, "valid_targets_mean": 5933.7, "valid_targets_min": 1591 }, { "epoch": 0.9215189873417722, "grad_norm": 0.3573450052442163, "learning_rate": 3.914622655654822e-05, "loss": 0.3434, "loss_nan_ranks": 0, "loss_rank_avg": 0.13716688752174377, "step": 910, "valid_targets_mean": 5188.8, "valid_targets_min": 1591 }, { "epoch": 0.9265822784810127, "grad_norm": 0.3538932529953643, "learning_rate": 3.912568188536814e-05, "loss": 0.3537, "loss_nan_ranks": 0, "loss_rank_avg": 0.16137436032295227, "step": 915, "valid_targets_mean": 3634.4, "valid_targets_min": 1339 }, { "epoch": 0.9316455696202531, "grad_norm": 0.3208113773796828, "learning_rate": 3.910489847851761e-05, "loss": 0.3444, "loss_nan_ranks": 0, "loss_rank_avg": 0.17828276753425598, "step": 920, "valid_targets_mean": 4550.2, "valid_targets_min": 1178 }, { "epoch": 0.9367088607594937, "grad_norm": 0.3094131187909477, "learning_rate": 3.908387659542481e-05, "loss": 0.3457, "loss_nan_ranks": 0, "loss_rank_avg": 0.14312776923179626, "step": 925, "valid_targets_mean": 4335.3, "valid_targets_min": 1291 }, { "epoch": 0.9417721518987342, "grad_norm": 0.33010185993106733, "learning_rate": 3.9062616498494656e-05, "loss": 0.3354, "loss_nan_ranks": 0, "loss_rank_avg": 0.17049264907836914, "step": 930, "valid_targets_mean": 3559.0, "valid_targets_min": 1428 }, { "epoch": 0.9468354430379747, "grad_norm": 0.3152672156222691, "learning_rate": 3.904111845310559e-05, "loss": 0.3347, "loss_nan_ranks": 0, "loss_rank_avg": 0.16469566524028778, "step": 935, "valid_targets_mean": 4357.5, "valid_targets_min": 1218 }, { "epoch": 0.9518987341772152, "grad_norm": 0.3201518158080734, "learning_rate": 3.901938272760623e-05, "loss": 0.3452, "loss_nan_ranks": 0, "loss_rank_avg": 0.1640382707118988, "step": 940, "valid_targets_mean": 4409.8, "valid_targets_min": 696 }, { "epoch": 0.9569620253164557, "grad_norm": 0.3422558014341276, "learning_rate": 3.899740959331204e-05, "loss": 0.3411, "loss_nan_ranks": 0, "loss_rank_avg": 0.14299672842025757, "step": 945, "valid_targets_mean": 3149.9, "valid_targets_min": 866 }, { "epoch": 0.9620253164556962, "grad_norm": 0.3039490414348751, "learning_rate": 3.897519932450189e-05, "loss": 0.3421, "loss_nan_ranks": 0, "loss_rank_avg": 0.14147335290908813, "step": 950, "valid_targets_mean": 4333.5, "valid_targets_min": 1238 }, { "epoch": 0.9670886075949368, "grad_norm": 0.3264243877990281, "learning_rate": 3.8952752198414716e-05, "loss": 0.3515, "loss_nan_ranks": 0, "loss_rank_avg": 0.17327773571014404, "step": 955, "valid_targets_mean": 4177.0, "valid_targets_min": 1111 }, { "epoch": 0.9721518987341772, "grad_norm": 0.3108694369949979, "learning_rate": 3.893006849524601e-05, "loss": 0.3335, "loss_nan_ranks": 0, "loss_rank_avg": 0.16756384074687958, "step": 960, "valid_targets_mean": 4619.9, "valid_targets_min": 1156 }, { "epoch": 0.9772151898734177, "grad_norm": 0.3448421182167878, "learning_rate": 3.890714849814431e-05, "loss": 0.343, "loss_nan_ranks": 0, "loss_rank_avg": 0.15267406404018402, "step": 965, "valid_targets_mean": 4085.4, "valid_targets_min": 1188 }, { "epoch": 0.9822784810126582, "grad_norm": 0.30352124369356204, "learning_rate": 3.8883992493207696e-05, "loss": 0.3489, "loss_nan_ranks": 0, "loss_rank_avg": 0.2034776359796524, "step": 970, "valid_targets_mean": 5403.8, "valid_targets_min": 1133 }, { "epoch": 0.9873417721518988, "grad_norm": 0.2876598919430634, "learning_rate": 3.8860600769480215e-05, "loss": 0.3446, "loss_nan_ranks": 0, "loss_rank_avg": 0.17782637476921082, "step": 975, "valid_targets_mean": 5421.9, "valid_targets_min": 876 }, { "epoch": 0.9924050632911392, "grad_norm": 0.33380559486032607, "learning_rate": 3.883697361894825e-05, "loss": 0.3439, "loss_nan_ranks": 0, "loss_rank_avg": 0.2117309868335724, "step": 980, "valid_targets_mean": 4499.0, "valid_targets_min": 1184 }, { "epoch": 0.9974683544303797, "grad_norm": 0.3618917728963476, "learning_rate": 3.881311133653691e-05, "loss": 0.3412, "loss_nan_ranks": 0, "loss_rank_avg": 0.16749724745750427, "step": 985, "valid_targets_mean": 3879.4, "valid_targets_min": 966 }, { "epoch": 1.0020253164556963, "grad_norm": 0.3195092960965727, "learning_rate": 3.878901422010632e-05, "loss": 0.3347, "loss_nan_ranks": 0, "loss_rank_avg": 0.21217718720436096, "step": 990, "valid_targets_mean": 6226.9, "valid_targets_min": 1827 }, { "epoch": 1.0070886075949368, "grad_norm": 0.32404855006530575, "learning_rate": 3.87646825704479e-05, "loss": 0.3259, "loss_nan_ranks": 0, "loss_rank_avg": 0.1381339430809021, "step": 995, "valid_targets_mean": 3916.4, "valid_targets_min": 1401 }, { "epoch": 1.0121518987341773, "grad_norm": 0.3141166003779331, "learning_rate": 3.874011669128065e-05, "loss": 0.3446, "loss_nan_ranks": 0, "loss_rank_avg": 0.1709311306476593, "step": 1000, "valid_targets_mean": 4634.4, "valid_targets_min": 1322 }, { "epoch": 1.0172151898734176, "grad_norm": 0.33255131568231555, "learning_rate": 3.871531688924731e-05, "loss": 0.3176, "loss_nan_ranks": 0, "loss_rank_avg": 0.11075881123542786, "step": 1005, "valid_targets_mean": 2777.5, "valid_targets_min": 899 }, { "epoch": 1.0222784810126582, "grad_norm": 0.3551119238834457, "learning_rate": 3.8690283473910555e-05, "loss": 0.3343, "loss_nan_ranks": 0, "loss_rank_avg": 0.18998833000659943, "step": 1010, "valid_targets_mean": 5065.8, "valid_targets_min": 1392 }, { "epoch": 1.0273417721518987, "grad_norm": 0.36295431013252033, "learning_rate": 3.866501675774914e-05, "loss": 0.3282, "loss_nan_ranks": 0, "loss_rank_avg": 0.1773543804883957, "step": 1015, "valid_targets_mean": 3819.9, "valid_targets_min": 1174 }, { "epoch": 1.0324050632911392, "grad_norm": 0.33540491774621956, "learning_rate": 3.8639517056153997e-05, "loss": 0.3362, "loss_nan_ranks": 0, "loss_rank_avg": 0.16152143478393555, "step": 1020, "valid_targets_mean": 4223.1, "valid_targets_min": 858 }, { "epoch": 1.0374683544303798, "grad_norm": 0.32077100355601573, "learning_rate": 3.8613784687424275e-05, "loss": 0.3378, "loss_nan_ranks": 0, "loss_rank_avg": 0.19795547425746918, "step": 1025, "valid_targets_mean": 5295.2, "valid_targets_min": 1496 }, { "epoch": 1.0425316455696203, "grad_norm": 0.3216906551189178, "learning_rate": 3.858781997276337e-05, "loss": 0.3318, "loss_nan_ranks": 0, "loss_rank_avg": 0.16188682615756989, "step": 1030, "valid_targets_mean": 5138.4, "valid_targets_min": 947 }, { "epoch": 1.0475949367088608, "grad_norm": 0.4486889227248024, "learning_rate": 3.856162323627497e-05, "loss": 0.3251, "loss_nan_ranks": 0, "loss_rank_avg": 0.09634960442781448, "step": 1035, "valid_targets_mean": 3724.6, "valid_targets_min": 934 }, { "epoch": 1.0526582278481014, "grad_norm": 0.2934117207565638, "learning_rate": 3.8535194804958924e-05, "loss": 0.3367, "loss_nan_ranks": 0, "loss_rank_avg": 0.1526038944721222, "step": 1040, "valid_targets_mean": 4829.0, "valid_targets_min": 1401 }, { "epoch": 1.0577215189873417, "grad_norm": 0.2931878952686227, "learning_rate": 3.8508535008707236e-05, "loss": 0.346, "loss_nan_ranks": 0, "loss_rank_avg": 0.20354345440864563, "step": 1045, "valid_targets_mean": 6153.3, "valid_targets_min": 1336 }, { "epoch": 1.0627848101265822, "grad_norm": 0.322713813844516, "learning_rate": 3.848164418029989e-05, "loss": 0.3364, "loss_nan_ranks": 0, "loss_rank_avg": 0.1375882625579834, "step": 1050, "valid_targets_mean": 4300.9, "valid_targets_min": 1361 }, { "epoch": 1.0678481012658227, "grad_norm": 0.31096701689662554, "learning_rate": 3.845452265540074e-05, "loss": 0.3296, "loss_nan_ranks": 0, "loss_rank_avg": 0.1565578281879425, "step": 1055, "valid_targets_mean": 4115.1, "valid_targets_min": 1141 }, { "epoch": 1.0729113924050633, "grad_norm": 0.31792661099154035, "learning_rate": 3.842717077255329e-05, "loss": 0.3265, "loss_nan_ranks": 0, "loss_rank_avg": 0.18725517392158508, "step": 1060, "valid_targets_mean": 5399.2, "valid_targets_min": 1440 }, { "epoch": 1.0779746835443038, "grad_norm": 0.2966357451403385, "learning_rate": 3.839958887317649e-05, "loss": 0.3267, "loss_nan_ranks": 0, "loss_rank_avg": 0.1931026577949524, "step": 1065, "valid_targets_mean": 6788.4, "valid_targets_min": 1285 }, { "epoch": 1.0830379746835443, "grad_norm": 0.32526509145376603, "learning_rate": 3.837177730156045e-05, "loss": 0.3283, "loss_nan_ranks": 0, "loss_rank_avg": 0.18849416077136993, "step": 1070, "valid_targets_mean": 5493.9, "valid_targets_min": 884 }, { "epoch": 1.0881012658227849, "grad_norm": 0.3176994766517001, "learning_rate": 3.834373640486216e-05, "loss": 0.329, "loss_nan_ranks": 0, "loss_rank_avg": 0.13460056483745575, "step": 1075, "valid_targets_mean": 3655.2, "valid_targets_min": 1173 }, { "epoch": 1.0931645569620254, "grad_norm": 0.3802547345823635, "learning_rate": 3.8315466533101154e-05, "loss": 0.3191, "loss_nan_ranks": 0, "loss_rank_avg": 0.1390688419342041, "step": 1080, "valid_targets_mean": 3724.8, "valid_targets_min": 686 }, { "epoch": 1.0982278481012657, "grad_norm": 0.30409901587440336, "learning_rate": 3.828696803915515e-05, "loss": 0.3295, "loss_nan_ranks": 0, "loss_rank_avg": 0.19093772768974304, "step": 1085, "valid_targets_mean": 5509.2, "valid_targets_min": 1316 }, { "epoch": 1.1032911392405063, "grad_norm": 0.31857188574561196, "learning_rate": 3.8258241278755613e-05, "loss": 0.3259, "loss_nan_ranks": 0, "loss_rank_avg": 0.18015238642692566, "step": 1090, "valid_targets_mean": 5178.9, "valid_targets_min": 1381 }, { "epoch": 1.1083544303797468, "grad_norm": 0.32050011818280044, "learning_rate": 3.8229286610483356e-05, "loss": 0.3233, "loss_nan_ranks": 0, "loss_rank_avg": 0.18884283304214478, "step": 1095, "valid_targets_mean": 5116.2, "valid_targets_min": 1159 }, { "epoch": 1.1134177215189873, "grad_norm": 0.3113272756450795, "learning_rate": 3.820010439576403e-05, "loss": 0.3164, "loss_nan_ranks": 0, "loss_rank_avg": 0.16775749623775482, "step": 1100, "valid_targets_mean": 4514.6, "valid_targets_min": 1605 }, { "epoch": 1.1184810126582279, "grad_norm": 0.33153340730169845, "learning_rate": 3.817069499886364e-05, "loss": 0.3196, "loss_nan_ranks": 0, "loss_rank_avg": 0.12046626210212708, "step": 1105, "valid_targets_mean": 3291.4, "valid_targets_min": 962 }, { "epoch": 1.1235443037974684, "grad_norm": 0.3013874756589958, "learning_rate": 3.814105878688397e-05, "loss": 0.3325, "loss_nan_ranks": 0, "loss_rank_avg": 0.16391009092330933, "step": 1110, "valid_targets_mean": 6036.4, "valid_targets_min": 1055 }, { "epoch": 1.128607594936709, "grad_norm": 0.331804851918644, "learning_rate": 3.8111196129758025e-05, "loss": 0.3281, "loss_nan_ranks": 0, "loss_rank_avg": 0.1217694953083992, "step": 1115, "valid_targets_mean": 2960.4, "valid_targets_min": 1255 }, { "epoch": 1.1336708860759495, "grad_norm": 0.35058089757688515, "learning_rate": 3.808110740024541e-05, "loss": 0.3189, "loss_nan_ranks": 0, "loss_rank_avg": 0.18976081907749176, "step": 1120, "valid_targets_mean": 4311.5, "valid_targets_min": 1573 }, { "epoch": 1.13873417721519, "grad_norm": 0.2598654453403866, "learning_rate": 3.8050792973927654e-05, "loss": 0.3227, "loss_nan_ranks": 0, "loss_rank_avg": 0.16648131608963013, "step": 1125, "valid_targets_mean": 6690.9, "valid_targets_min": 1006 }, { "epoch": 1.1437974683544303, "grad_norm": 0.36580297380970445, "learning_rate": 3.8020253229203555e-05, "loss": 0.327, "loss_nan_ranks": 0, "loss_rank_avg": 0.173434779047966, "step": 1130, "valid_targets_mean": 3429.3, "valid_targets_min": 1217 }, { "epoch": 1.1488607594936708, "grad_norm": 0.3170699501916741, "learning_rate": 3.798948854728441e-05, "loss": 0.3303, "loss_nan_ranks": 0, "loss_rank_avg": 0.12679925560951233, "step": 1135, "valid_targets_mean": 3721.6, "valid_targets_min": 726 }, { "epoch": 1.1539240506329114, "grad_norm": 0.3315048726728199, "learning_rate": 3.7958499312189344e-05, "loss": 0.3389, "loss_nan_ranks": 0, "loss_rank_avg": 0.11187270283699036, "step": 1140, "valid_targets_mean": 3303.8, "valid_targets_min": 954 }, { "epoch": 1.158987341772152, "grad_norm": 0.2969536976332786, "learning_rate": 3.792728591074041e-05, "loss": 0.3199, "loss_nan_ranks": 0, "loss_rank_avg": 0.11002499610185623, "step": 1145, "valid_targets_mean": 4168.6, "valid_targets_min": 1316 }, { "epoch": 1.1640506329113924, "grad_norm": 0.29906816062312314, "learning_rate": 3.7895848732557815e-05, "loss": 0.3329, "loss_nan_ranks": 0, "loss_rank_avg": 0.1309490203857422, "step": 1150, "valid_targets_mean": 4264.5, "valid_targets_min": 945 }, { "epoch": 1.169113924050633, "grad_norm": 0.3373393294160328, "learning_rate": 3.786418817005507e-05, "loss": 0.3299, "loss_nan_ranks": 0, "loss_rank_avg": 0.16449810564517975, "step": 1155, "valid_targets_mean": 4430.1, "valid_targets_min": 1548 }, { "epoch": 1.1741772151898735, "grad_norm": 0.31814918332777564, "learning_rate": 3.783230461843406e-05, "loss": 0.3211, "loss_nan_ranks": 0, "loss_rank_avg": 0.1603396236896515, "step": 1160, "valid_targets_mean": 4611.4, "valid_targets_min": 1192 }, { "epoch": 1.1792405063291138, "grad_norm": 0.37957067548492934, "learning_rate": 3.7800198475680136e-05, "loss": 0.3264, "loss_nan_ranks": 0, "loss_rank_avg": 0.09246158599853516, "step": 1165, "valid_targets_mean": 2677.1, "valid_targets_min": 1357 }, { "epoch": 1.1843037974683543, "grad_norm": 0.3094282166752189, "learning_rate": 3.776787014255712e-05, "loss": 0.3292, "loss_nan_ranks": 0, "loss_rank_avg": 0.1497591733932495, "step": 1170, "valid_targets_mean": 4014.9, "valid_targets_min": 1510 }, { "epoch": 1.1893670886075949, "grad_norm": 0.35082198305199175, "learning_rate": 3.773532002260233e-05, "loss": 0.3276, "loss_nan_ranks": 0, "loss_rank_avg": 0.1902400553226471, "step": 1175, "valid_targets_mean": 4051.2, "valid_targets_min": 926 }, { "epoch": 1.1944303797468354, "grad_norm": 0.3363300235759021, "learning_rate": 3.770254852212152e-05, "loss": 0.3236, "loss_nan_ranks": 0, "loss_rank_avg": 0.1484481394290924, "step": 1180, "valid_targets_mean": 4022.1, "valid_targets_min": 949 }, { "epoch": 1.199493670886076, "grad_norm": 0.2959219712023686, "learning_rate": 3.766955605018384e-05, "loss": 0.3197, "loss_nan_ranks": 0, "loss_rank_avg": 0.17988604307174683, "step": 1185, "valid_targets_mean": 5788.9, "valid_targets_min": 927 }, { "epoch": 1.2045569620253165, "grad_norm": 0.30513862700761135, "learning_rate": 3.7636343018616675e-05, "loss": 0.3243, "loss_nan_ranks": 0, "loss_rank_avg": 0.162398099899292, "step": 1190, "valid_targets_mean": 4152.4, "valid_targets_min": 1183 }, { "epoch": 1.209620253164557, "grad_norm": 0.3256099867852839, "learning_rate": 3.7602909842000565e-05, "loss": 0.3255, "loss_nan_ranks": 0, "loss_rank_avg": 0.1604665219783783, "step": 1195, "valid_targets_mean": 4510.4, "valid_targets_min": 1107 }, { "epoch": 1.2146835443037975, "grad_norm": 0.31652452857276137, "learning_rate": 3.7569256937663995e-05, "loss": 0.3228, "loss_nan_ranks": 0, "loss_rank_avg": 0.11722761392593384, "step": 1200, "valid_targets_mean": 3867.2, "valid_targets_min": 1428 }, { "epoch": 1.219746835443038, "grad_norm": 0.3570058144248121, "learning_rate": 3.753538472567819e-05, "loss": 0.3343, "loss_nan_ranks": 0, "loss_rank_avg": 0.132009819149971, "step": 1205, "valid_targets_mean": 3776.8, "valid_targets_min": 1444 }, { "epoch": 1.2248101265822784, "grad_norm": 0.3253492095946553, "learning_rate": 3.750129362885188e-05, "loss": 0.3491, "loss_nan_ranks": 0, "loss_rank_avg": 0.20971378684043884, "step": 1210, "valid_targets_mean": 5854.2, "valid_targets_min": 895 }, { "epoch": 1.229873417721519, "grad_norm": 0.31813799271358817, "learning_rate": 3.7466984072726014e-05, "loss": 0.3278, "loss_nan_ranks": 0, "loss_rank_avg": 0.14392566680908203, "step": 1215, "valid_targets_mean": 4255.3, "valid_targets_min": 1377 }, { "epoch": 1.2349367088607595, "grad_norm": 0.3161090773410782, "learning_rate": 3.743245648556845e-05, "loss": 0.333, "loss_nan_ranks": 0, "loss_rank_avg": 0.15600383281707764, "step": 1220, "valid_targets_mean": 4627.6, "valid_targets_min": 1186 }, { "epoch": 1.24, "grad_norm": 0.3383098606932185, "learning_rate": 3.739771129836863e-05, "loss": 0.3106, "loss_nan_ranks": 0, "loss_rank_avg": 0.15630879998207092, "step": 1225, "valid_targets_mean": 3907.4, "valid_targets_min": 1318 }, { "epoch": 1.2450632911392405, "grad_norm": 0.380311170159032, "learning_rate": 3.736274894483215e-05, "loss": 0.3443, "loss_nan_ranks": 0, "loss_rank_avg": 0.17396849393844604, "step": 1230, "valid_targets_mean": 3654.8, "valid_targets_min": 1228 }, { "epoch": 1.250126582278481, "grad_norm": 0.29633634831203143, "learning_rate": 3.7327569861375404e-05, "loss": 0.3368, "loss_nan_ranks": 0, "loss_rank_avg": 0.20720690488815308, "step": 1235, "valid_targets_mean": 6698.7, "valid_targets_min": 1554 }, { "epoch": 1.2551898734177216, "grad_norm": 0.32181581382324975, "learning_rate": 3.729217448712009e-05, "loss": 0.31, "loss_nan_ranks": 0, "loss_rank_avg": 0.15546496212482452, "step": 1240, "valid_targets_mean": 4598.5, "valid_targets_min": 1081 }, { "epoch": 1.260253164556962, "grad_norm": 0.2876370801591027, "learning_rate": 3.725656326388776e-05, "loss": 0.312, "loss_nan_ranks": 0, "loss_rank_avg": 0.12497955560684204, "step": 1245, "valid_targets_mean": 4425.2, "valid_targets_min": 1167 }, { "epoch": 1.2653164556962024, "grad_norm": 0.3193054610028216, "learning_rate": 3.722073663619429e-05, "loss": 0.3268, "loss_nan_ranks": 0, "loss_rank_avg": 0.15073925256729126, "step": 1250, "valid_targets_mean": 4511.2, "valid_targets_min": 1143 }, { "epoch": 1.270379746835443, "grad_norm": 0.39145813292181675, "learning_rate": 3.718469505124434e-05, "loss": 0.3246, "loss_nan_ranks": 0, "loss_rank_avg": 0.15670371055603027, "step": 1255, "valid_targets_mean": 4593.4, "valid_targets_min": 885 }, { "epoch": 1.2754430379746835, "grad_norm": 0.3007158793143366, "learning_rate": 3.714843895892576e-05, "loss": 0.332, "loss_nan_ranks": 0, "loss_rank_avg": 0.14526674151420593, "step": 1260, "valid_targets_mean": 4201.2, "valid_targets_min": 1015 }, { "epoch": 1.280506329113924, "grad_norm": 0.3431473760602178, "learning_rate": 3.7111968811803985e-05, "loss": 0.3374, "loss_nan_ranks": 0, "loss_rank_avg": 0.11407409608364105, "step": 1265, "valid_targets_mean": 2609.9, "valid_targets_min": 1008 }, { "epoch": 1.2855696202531646, "grad_norm": 0.31430226120597105, "learning_rate": 3.7075285065116376e-05, "loss": 0.3255, "loss_nan_ranks": 0, "loss_rank_avg": 0.21788525581359863, "step": 1270, "valid_targets_mean": 5227.1, "valid_targets_min": 1159 }, { "epoch": 1.290632911392405, "grad_norm": 0.2942207875130029, "learning_rate": 3.703838817676654e-05, "loss": 0.3248, "loss_nan_ranks": 0, "loss_rank_avg": 0.16078102588653564, "step": 1275, "valid_targets_mean": 5179.4, "valid_targets_min": 966 }, { "epoch": 1.2956962025316456, "grad_norm": 0.33801133523700155, "learning_rate": 3.7001278607318646e-05, "loss": 0.3293, "loss_nan_ranks": 0, "loss_rank_avg": 0.13204364478588104, "step": 1280, "valid_targets_mean": 3593.9, "valid_targets_min": 1351 }, { "epoch": 1.3007594936708862, "grad_norm": 0.36194997437445076, "learning_rate": 3.696395681999161e-05, "loss": 0.3315, "loss_nan_ranks": 0, "loss_rank_avg": 0.15205729007720947, "step": 1285, "valid_targets_mean": 3709.8, "valid_targets_min": 1456 }, { "epoch": 1.3058227848101267, "grad_norm": 0.37635182260044775, "learning_rate": 3.692642328065337e-05, "loss": 0.3373, "loss_nan_ranks": 0, "loss_rank_avg": 0.12143959850072861, "step": 1290, "valid_targets_mean": 3222.8, "valid_targets_min": 1077 }, { "epoch": 1.310886075949367, "grad_norm": 0.3080355652465348, "learning_rate": 3.688867845781506e-05, "loss": 0.327, "loss_nan_ranks": 0, "loss_rank_avg": 0.14508505165576935, "step": 1295, "valid_targets_mean": 3859.7, "valid_targets_min": 1113 }, { "epoch": 1.3159493670886075, "grad_norm": 0.3439159780043492, "learning_rate": 3.685072282262511e-05, "loss": 0.3302, "loss_nan_ranks": 0, "loss_rank_avg": 0.14666421711444855, "step": 1300, "valid_targets_mean": 3587.8, "valid_targets_min": 1142 }, { "epoch": 1.321012658227848, "grad_norm": 0.30506292484752023, "learning_rate": 3.6812556848863474e-05, "loss": 0.3253, "loss_nan_ranks": 0, "loss_rank_avg": 0.15456736087799072, "step": 1305, "valid_targets_mean": 3908.8, "valid_targets_min": 1305 }, { "epoch": 1.3260759493670886, "grad_norm": 0.32896698136778196, "learning_rate": 3.6774181012935595e-05, "loss": 0.3302, "loss_nan_ranks": 0, "loss_rank_avg": 0.14750021696090698, "step": 1310, "valid_targets_mean": 3579.4, "valid_targets_min": 696 }, { "epoch": 1.3311392405063291, "grad_norm": 0.3494681443588045, "learning_rate": 3.673559579386653e-05, "loss": 0.3329, "loss_nan_ranks": 0, "loss_rank_avg": 0.16966864466667175, "step": 1315, "valid_targets_mean": 3639.5, "valid_targets_min": 1136 }, { "epoch": 1.3362025316455697, "grad_norm": 0.3191056529939702, "learning_rate": 3.6696801673294984e-05, "loss": 0.3274, "loss_nan_ranks": 0, "loss_rank_avg": 0.2022847682237625, "step": 1320, "valid_targets_mean": 6126.2, "valid_targets_min": 1760 }, { "epoch": 1.34126582278481, "grad_norm": 0.40439808049151743, "learning_rate": 3.665779913546721e-05, "loss": 0.3207, "loss_nan_ranks": 0, "loss_rank_avg": 0.1815149486064911, "step": 1325, "valid_targets_mean": 3929.4, "valid_targets_min": 1092 }, { "epoch": 1.3463291139240505, "grad_norm": 0.29566683990417303, "learning_rate": 3.6618588667231064e-05, "loss": 0.3244, "loss_nan_ranks": 0, "loss_rank_avg": 0.1440686285495758, "step": 1330, "valid_targets_mean": 4236.4, "valid_targets_min": 1086 }, { "epoch": 1.351392405063291, "grad_norm": 0.3344359616665295, "learning_rate": 3.6579170758029885e-05, "loss": 0.324, "loss_nan_ranks": 0, "loss_rank_avg": 0.15648147463798523, "step": 1335, "valid_targets_mean": 3588.6, "valid_targets_min": 1635 }, { "epoch": 1.3564556962025316, "grad_norm": 0.2879031761545053, "learning_rate": 3.653954589989637e-05, "loss": 0.3215, "loss_nan_ranks": 0, "loss_rank_avg": 0.16395555436611176, "step": 1340, "valid_targets_mean": 4903.5, "valid_targets_min": 1401 }, { "epoch": 1.3615189873417721, "grad_norm": 0.3076034430138629, "learning_rate": 3.649971458744645e-05, "loss": 0.3332, "loss_nan_ranks": 0, "loss_rank_avg": 0.14920540153980255, "step": 1345, "valid_targets_mean": 4404.3, "valid_targets_min": 1479 }, { "epoch": 1.3665822784810127, "grad_norm": 0.37728920822736073, "learning_rate": 3.645967731787313e-05, "loss": 0.3273, "loss_nan_ranks": 0, "loss_rank_avg": 0.16919684410095215, "step": 1350, "valid_targets_mean": 3916.3, "valid_targets_min": 1491 }, { "epoch": 1.3716455696202532, "grad_norm": 0.2944205665752948, "learning_rate": 3.641943459094026e-05, "loss": 0.32, "loss_nan_ranks": 0, "loss_rank_avg": 0.20011773705482483, "step": 1355, "valid_targets_mean": 6104.8, "valid_targets_min": 1110 }, { "epoch": 1.3767088607594937, "grad_norm": 0.31998862065193057, "learning_rate": 3.63789869089763e-05, "loss": 0.3281, "loss_nan_ranks": 0, "loss_rank_avg": 0.17156195640563965, "step": 1360, "valid_targets_mean": 4435.9, "valid_targets_min": 1056 }, { "epoch": 1.3817721518987343, "grad_norm": 0.3359058600132148, "learning_rate": 3.633833477686805e-05, "loss": 0.326, "loss_nan_ranks": 0, "loss_rank_avg": 0.1116013303399086, "step": 1365, "valid_targets_mean": 2720.7, "valid_targets_min": 1100 }, { "epoch": 1.3868354430379748, "grad_norm": 0.3167283899854193, "learning_rate": 3.629747870205438e-05, "loss": 0.3375, "loss_nan_ranks": 0, "loss_rank_avg": 0.15123698115348816, "step": 1370, "valid_targets_mean": 4809.0, "valid_targets_min": 1288 }, { "epoch": 1.3918987341772153, "grad_norm": 0.3176638421764831, "learning_rate": 3.625641919451982e-05, "loss": 0.3251, "loss_nan_ranks": 0, "loss_rank_avg": 0.116270050406456, "step": 1375, "valid_targets_mean": 3099.4, "valid_targets_min": 1302 }, { "epoch": 1.3969620253164556, "grad_norm": 0.3567607135105218, "learning_rate": 3.621515676678829e-05, "loss": 0.3403, "loss_nan_ranks": 0, "loss_rank_avg": 0.18901550769805908, "step": 1380, "valid_targets_mean": 4234.6, "valid_targets_min": 1078 }, { "epoch": 1.4020253164556962, "grad_norm": 0.33150001426521647, "learning_rate": 3.617369193391663e-05, "loss": 0.3257, "loss_nan_ranks": 0, "loss_rank_avg": 0.14285731315612793, "step": 1385, "valid_targets_mean": 3883.8, "valid_targets_min": 1292 }, { "epoch": 1.4070886075949367, "grad_norm": 0.32040861152447253, "learning_rate": 3.61320252134882e-05, "loss": 0.3202, "loss_nan_ranks": 0, "loss_rank_avg": 0.15014925599098206, "step": 1390, "valid_targets_mean": 4633.4, "valid_targets_min": 1150 }, { "epoch": 1.4121518987341772, "grad_norm": 0.3364407178912512, "learning_rate": 3.6090157125606405e-05, "loss": 0.3308, "loss_nan_ranks": 0, "loss_rank_avg": 0.19701796770095825, "step": 1395, "valid_targets_mean": 4298.4, "valid_targets_min": 1055 }, { "epoch": 1.4172151898734178, "grad_norm": 0.2998592984370577, "learning_rate": 3.604808819288823e-05, "loss": 0.3213, "loss_nan_ranks": 0, "loss_rank_avg": 0.21334891021251678, "step": 1400, "valid_targets_mean": 6774.6, "valid_targets_min": 1471 }, { "epoch": 1.4222784810126583, "grad_norm": 0.32266679078127786, "learning_rate": 3.600581894045768e-05, "loss": 0.3162, "loss_nan_ranks": 0, "loss_rank_avg": 0.10229863971471786, "step": 1405, "valid_targets_mean": 2818.3, "valid_targets_min": 1002 }, { "epoch": 1.4273417721518986, "grad_norm": 0.2989355644726402, "learning_rate": 3.596334989593927e-05, "loss": 0.3324, "loss_nan_ranks": 0, "loss_rank_avg": 0.16216593980789185, "step": 1410, "valid_targets_mean": 4271.4, "valid_targets_min": 773 }, { "epoch": 1.4324050632911391, "grad_norm": 0.33686789223908364, "learning_rate": 3.5920681589451385e-05, "loss": 0.3177, "loss_nan_ranks": 0, "loss_rank_avg": 0.16129520535469055, "step": 1415, "valid_targets_mean": 3987.1, "valid_targets_min": 776 }, { "epoch": 1.4374683544303797, "grad_norm": 0.2948991655130385, "learning_rate": 3.58778145535997e-05, "loss": 0.3152, "loss_nan_ranks": 0, "loss_rank_avg": 0.14479148387908936, "step": 1420, "valid_targets_mean": 4191.2, "valid_targets_min": 1049 }, { "epoch": 1.4425316455696202, "grad_norm": 0.278153706236472, "learning_rate": 3.583474932347054e-05, "loss": 0.3194, "loss_nan_ranks": 0, "loss_rank_avg": 0.15073184669017792, "step": 1425, "valid_targets_mean": 5600.0, "valid_targets_min": 978 }, { "epoch": 1.4475949367088607, "grad_norm": 0.2989703152632012, "learning_rate": 3.5791486436624145e-05, "loss": 0.322, "loss_nan_ranks": 0, "loss_rank_avg": 0.1581433117389679, "step": 1430, "valid_targets_mean": 4557.4, "valid_targets_min": 1311 }, { "epoch": 1.4526582278481013, "grad_norm": 0.3156763543957603, "learning_rate": 3.5748026433088036e-05, "loss": 0.3234, "loss_nan_ranks": 0, "loss_rank_avg": 0.1554793417453766, "step": 1435, "valid_targets_mean": 5105.0, "valid_targets_min": 1086 }, { "epoch": 1.4577215189873418, "grad_norm": 0.30549649598454104, "learning_rate": 3.5704369855350226e-05, "loss": 0.3285, "loss_nan_ranks": 0, "loss_rank_avg": 0.10838840901851654, "step": 1440, "valid_targets_mean": 2855.1, "valid_targets_min": 1382 }, { "epoch": 1.4627848101265823, "grad_norm": 0.37394597619150627, "learning_rate": 3.566051724835245e-05, "loss": 0.3409, "loss_nan_ranks": 0, "loss_rank_avg": 0.13602185249328613, "step": 1445, "valid_targets_mean": 3419.4, "valid_targets_min": 1146 }, { "epoch": 1.4678481012658229, "grad_norm": 0.3156375413907948, "learning_rate": 3.5616469159483363e-05, "loss": 0.3224, "loss_nan_ranks": 0, "loss_rank_avg": 0.14657479524612427, "step": 1450, "valid_targets_mean": 4287.6, "valid_targets_min": 1162 }, { "epoch": 1.4729113924050634, "grad_norm": 0.32282455141307365, "learning_rate": 3.5572226138571753e-05, "loss": 0.3428, "loss_nan_ranks": 0, "loss_rank_avg": 0.21434099972248077, "step": 1455, "valid_targets_mean": 6099.5, "valid_targets_min": 1650 }, { "epoch": 1.4779746835443037, "grad_norm": 0.3934165636040704, "learning_rate": 3.5527788737879595e-05, "loss": 0.3293, "loss_nan_ranks": 0, "loss_rank_avg": 0.13554619252681732, "step": 1460, "valid_targets_mean": 3898.6, "valid_targets_min": 749 }, { "epoch": 1.4830379746835443, "grad_norm": 0.3532333332147838, "learning_rate": 3.548315751209524e-05, "loss": 0.3211, "loss_nan_ranks": 0, "loss_rank_avg": 0.1423749029636383, "step": 1465, "valid_targets_mean": 3396.2, "valid_targets_min": 1245 }, { "epoch": 1.4881012658227848, "grad_norm": 0.3046035862379382, "learning_rate": 3.543833301832642e-05, "loss": 0.3092, "loss_nan_ranks": 0, "loss_rank_avg": 0.11005077511072159, "step": 1470, "valid_targets_mean": 3165.8, "valid_targets_min": 1018 }, { "epoch": 1.4931645569620253, "grad_norm": 0.2934515113132098, "learning_rate": 3.539331581609337e-05, "loss": 0.3228, "loss_nan_ranks": 0, "loss_rank_avg": 0.16373209655284882, "step": 1475, "valid_targets_mean": 5422.3, "valid_targets_min": 938 }, { "epoch": 1.4982278481012659, "grad_norm": 0.29330851366159866, "learning_rate": 3.5348106467321756e-05, "loss": 0.3204, "loss_nan_ranks": 0, "loss_rank_avg": 0.1334601640701294, "step": 1480, "valid_targets_mean": 4623.2, "valid_targets_min": 1060 }, { "epoch": 1.5032911392405062, "grad_norm": 0.3494149115756711, "learning_rate": 3.530270553633574e-05, "loss": 0.3347, "loss_nan_ranks": 0, "loss_rank_avg": 0.14463084936141968, "step": 1485, "valid_targets_mean": 3681.4, "valid_targets_min": 1175 }, { "epoch": 1.5083544303797467, "grad_norm": 0.34094476372572885, "learning_rate": 3.5257113589850895e-05, "loss": 0.3283, "loss_nan_ranks": 0, "loss_rank_avg": 0.13542452454566956, "step": 1490, "valid_targets_mean": 3142.8, "valid_targets_min": 1338 }, { "epoch": 1.5134177215189872, "grad_norm": 0.33689606267312805, "learning_rate": 3.521133119696712e-05, "loss": 0.3264, "loss_nan_ranks": 0, "loss_rank_avg": 0.16328886151313782, "step": 1495, "valid_targets_mean": 4708.0, "valid_targets_min": 1214 }, { "epoch": 1.5184810126582278, "grad_norm": 0.8587040130178458, "learning_rate": 3.516535892916159e-05, "loss": 0.3199, "loss_nan_ranks": 0, "loss_rank_avg": 0.166406512260437, "step": 1500, "valid_targets_mean": 4267.1, "valid_targets_min": 1066 }, { "epoch": 1.5235443037974683, "grad_norm": 0.31747165527732263, "learning_rate": 3.5119197360281553e-05, "loss": 0.332, "loss_nan_ranks": 0, "loss_rank_avg": 0.1378452181816101, "step": 1505, "valid_targets_mean": 3656.2, "valid_targets_min": 1064 }, { "epoch": 1.5286075949367088, "grad_norm": 0.3521429432867297, "learning_rate": 3.507284706653722e-05, "loss": 0.3369, "loss_nan_ranks": 0, "loss_rank_avg": 0.22082693874835968, "step": 1510, "valid_targets_mean": 4618.8, "valid_targets_min": 1392 }, { "epoch": 1.5336708860759494, "grad_norm": 0.3319407091362445, "learning_rate": 3.5026308626494545e-05, "loss": 0.3134, "loss_nan_ranks": 0, "loss_rank_avg": 0.18031668663024902, "step": 1515, "valid_targets_mean": 3750.2, "valid_targets_min": 977 }, { "epoch": 1.53873417721519, "grad_norm": 0.33498834727615584, "learning_rate": 3.497958262106801e-05, "loss": 0.3205, "loss_nan_ranks": 0, "loss_rank_avg": 0.1643165647983551, "step": 1520, "valid_targets_mean": 3328.2, "valid_targets_min": 1474 }, { "epoch": 1.5437974683544304, "grad_norm": 0.3537186281988192, "learning_rate": 3.493266963351339e-05, "loss": 0.3115, "loss_nan_ranks": 0, "loss_rank_avg": 0.1584773063659668, "step": 1525, "valid_targets_mean": 3274.9, "valid_targets_min": 1245 }, { "epoch": 1.548860759493671, "grad_norm": 0.30657928098680826, "learning_rate": 3.4885570249420454e-05, "loss": 0.3272, "loss_nan_ranks": 0, "loss_rank_avg": 0.1703530102968216, "step": 1530, "valid_targets_mean": 5461.6, "valid_targets_min": 1154 }, { "epoch": 1.5539240506329115, "grad_norm": 0.338680368171272, "learning_rate": 3.483828505670563e-05, "loss": 0.3255, "loss_nan_ranks": 0, "loss_rank_avg": 0.15479744970798492, "step": 1535, "valid_targets_mean": 4522.8, "valid_targets_min": 1326 }, { "epoch": 1.558987341772152, "grad_norm": 0.369309200288726, "learning_rate": 3.479081464560475e-05, "loss": 0.3191, "loss_nan_ranks": 0, "loss_rank_avg": 0.12721368670463562, "step": 1540, "valid_targets_mean": 2568.1, "valid_targets_min": 1187 }, { "epoch": 1.5640506329113926, "grad_norm": 0.3519884099657949, "learning_rate": 3.474315960866558e-05, "loss": 0.326, "loss_nan_ranks": 0, "loss_rank_avg": 0.21022453904151917, "step": 1545, "valid_targets_mean": 5003.4, "valid_targets_min": 1333 }, { "epoch": 1.5691139240506329, "grad_norm": 0.33365501094495986, "learning_rate": 3.469532054074049e-05, "loss": 0.3275, "loss_nan_ranks": 0, "loss_rank_avg": 0.11454639583826065, "step": 1550, "valid_targets_mean": 3473.1, "valid_targets_min": 1181 }, { "epoch": 1.5741772151898734, "grad_norm": 0.3487036569312814, "learning_rate": 3.464729803897902e-05, "loss": 0.3207, "loss_nan_ranks": 0, "loss_rank_avg": 0.0789409726858139, "step": 1555, "valid_targets_mean": 2519.6, "valid_targets_min": 1102 }, { "epoch": 1.579240506329114, "grad_norm": 0.33603816281790033, "learning_rate": 3.4599092702820394e-05, "loss": 0.3031, "loss_nan_ranks": 0, "loss_rank_avg": 0.11025889217853546, "step": 1560, "valid_targets_mean": 2999.4, "valid_targets_min": 1318 }, { "epoch": 1.5843037974683545, "grad_norm": 0.33746214929234886, "learning_rate": 3.4550705133986085e-05, "loss": 0.3297, "loss_nan_ranks": 0, "loss_rank_avg": 0.1540479212999344, "step": 1565, "valid_targets_mean": 3550.0, "valid_targets_min": 1130 }, { "epoch": 1.5893670886075948, "grad_norm": 0.3700007824527567, "learning_rate": 3.450213593647226e-05, "loss": 0.3235, "loss_nan_ranks": 0, "loss_rank_avg": 0.179176926612854, "step": 1570, "valid_targets_mean": 3797.9, "valid_targets_min": 1468 }, { "epoch": 1.5944303797468353, "grad_norm": 0.43557784622964635, "learning_rate": 3.445338571654227e-05, "loss": 0.3245, "loss_nan_ranks": 0, "loss_rank_avg": 0.12111867964267731, "step": 1575, "valid_targets_mean": 3459.7, "valid_targets_min": 1321 }, { "epoch": 1.5994936708860759, "grad_norm": 0.3234005911683535, "learning_rate": 3.440445508271907e-05, "loss": 0.3303, "loss_nan_ranks": 0, "loss_rank_avg": 0.11545059829950333, "step": 1580, "valid_targets_mean": 3151.1, "valid_targets_min": 966 }, { "epoch": 1.6045569620253164, "grad_norm": 0.31481487050082757, "learning_rate": 3.435534464577762e-05, "loss": 0.3185, "loss_nan_ranks": 0, "loss_rank_avg": 0.14349615573883057, "step": 1585, "valid_targets_mean": 4098.8, "valid_targets_min": 1553 }, { "epoch": 1.609620253164557, "grad_norm": 0.3263020753319533, "learning_rate": 3.4306055018737274e-05, "loss": 0.3262, "loss_nan_ranks": 0, "loss_rank_avg": 0.1886909306049347, "step": 1590, "valid_targets_mean": 5531.9, "valid_targets_min": 1290 }, { "epoch": 1.6146835443037975, "grad_norm": 0.3440773642804762, "learning_rate": 3.425658681685412e-05, "loss": 0.3247, "loss_nan_ranks": 0, "loss_rank_avg": 0.17707081139087677, "step": 1595, "valid_targets_mean": 3534.2, "valid_targets_min": 1301 }, { "epoch": 1.619746835443038, "grad_norm": 0.32440177535383535, "learning_rate": 3.420694065761328e-05, "loss": 0.3282, "loss_nan_ranks": 0, "loss_rank_avg": 0.16896334290504456, "step": 1600, "valid_targets_mean": 4122.1, "valid_targets_min": 965 }, { "epoch": 1.6248101265822785, "grad_norm": 0.2928837040048521, "learning_rate": 3.415711716072126e-05, "loss": 0.3318, "loss_nan_ranks": 0, "loss_rank_avg": 0.17395883798599243, "step": 1605, "valid_targets_mean": 5510.7, "valid_targets_min": 1836 }, { "epoch": 1.629873417721519, "grad_norm": 0.29996111358110616, "learning_rate": 3.4107116948098155e-05, "loss": 0.3208, "loss_nan_ranks": 0, "loss_rank_avg": 0.16087687015533447, "step": 1610, "valid_targets_mean": 5291.1, "valid_targets_min": 812 }, { "epoch": 1.6349367088607596, "grad_norm": 0.3391636106718898, "learning_rate": 3.4056940643869905e-05, "loss": 0.328, "loss_nan_ranks": 0, "loss_rank_avg": 0.12102165073156357, "step": 1615, "valid_targets_mean": 2991.2, "valid_targets_min": 987 }, { "epoch": 1.6400000000000001, "grad_norm": 0.30250385799846535, "learning_rate": 3.400658887436051e-05, "loss": 0.3274, "loss_nan_ranks": 0, "loss_rank_avg": 0.15453828871250153, "step": 1620, "valid_targets_mean": 4200.3, "valid_targets_min": 1171 }, { "epoch": 1.6450632911392407, "grad_norm": 0.31602413877978186, "learning_rate": 3.3956062268084215e-05, "loss": 0.3167, "loss_nan_ranks": 0, "loss_rank_avg": 0.1669228971004486, "step": 1625, "valid_targets_mean": 4059.0, "valid_targets_min": 1494 }, { "epoch": 1.650126582278481, "grad_norm": 0.3430073741627476, "learning_rate": 3.390536145573766e-05, "loss": 0.3311, "loss_nan_ranks": 0, "loss_rank_avg": 0.15472730994224548, "step": 1630, "valid_targets_mean": 4020.9, "valid_targets_min": 1121 }, { "epoch": 1.6551898734177215, "grad_norm": 0.30844530157775457, "learning_rate": 3.385448707019199e-05, "loss": 0.3353, "loss_nan_ranks": 0, "loss_rank_avg": 0.13865000009536743, "step": 1635, "valid_targets_mean": 3493.1, "valid_targets_min": 1516 }, { "epoch": 1.660253164556962, "grad_norm": 0.29309820401088355, "learning_rate": 3.3803439746484996e-05, "loss": 0.3371, "loss_nan_ranks": 0, "loss_rank_avg": 0.18344934284687042, "step": 1640, "valid_targets_mean": 5938.8, "valid_targets_min": 1370 }, { "epoch": 1.6653164556962026, "grad_norm": 0.2917099753276015, "learning_rate": 3.375222012181315e-05, "loss": 0.3324, "loss_nan_ranks": 0, "loss_rank_avg": 0.15374572575092316, "step": 1645, "valid_targets_mean": 4424.8, "valid_targets_min": 1247 }, { "epoch": 1.6703797468354429, "grad_norm": 0.31174326634371047, "learning_rate": 3.370082883552366e-05, "loss": 0.3248, "loss_nan_ranks": 0, "loss_rank_avg": 0.18676675856113434, "step": 1650, "valid_targets_mean": 4577.7, "valid_targets_min": 1153 }, { "epoch": 1.6754430379746834, "grad_norm": 0.2937468748877549, "learning_rate": 3.364926652910651e-05, "loss": 0.328, "loss_nan_ranks": 0, "loss_rank_avg": 0.14714813232421875, "step": 1655, "valid_targets_mean": 4791.8, "valid_targets_min": 1213 }, { "epoch": 1.680506329113924, "grad_norm": 0.2879601888076102, "learning_rate": 3.359753384618641e-05, "loss": 0.3339, "loss_nan_ranks": 0, "loss_rank_avg": 0.19825273752212524, "step": 1660, "valid_targets_mean": 6597.8, "valid_targets_min": 1694 }, { "epoch": 1.6855696202531645, "grad_norm": 0.28734174588103684, "learning_rate": 3.354563143251483e-05, "loss": 0.3251, "loss_nan_ranks": 0, "loss_rank_avg": 0.13350191712379456, "step": 1665, "valid_targets_mean": 4193.6, "valid_targets_min": 1311 }, { "epoch": 1.690632911392405, "grad_norm": 0.3163624678749021, "learning_rate": 3.3493559935961854e-05, "loss": 0.3332, "loss_nan_ranks": 0, "loss_rank_avg": 0.19836895167827606, "step": 1670, "valid_targets_mean": 4911.9, "valid_targets_min": 1235 }, { "epoch": 1.6956962025316455, "grad_norm": 0.26723388677186943, "learning_rate": 3.344132000650817e-05, "loss": 0.3229, "loss_nan_ranks": 0, "loss_rank_avg": 0.14954085648059845, "step": 1675, "valid_targets_mean": 5300.8, "valid_targets_min": 1208 }, { "epoch": 1.700759493670886, "grad_norm": 0.3367011427653921, "learning_rate": 3.3388912296236906e-05, "loss": 0.3369, "loss_nan_ranks": 0, "loss_rank_avg": 0.15727460384368896, "step": 1680, "valid_targets_mean": 3988.7, "valid_targets_min": 1264 }, { "epoch": 1.7058227848101266, "grad_norm": 0.46226016366837236, "learning_rate": 3.3336337459325526e-05, "loss": 0.3267, "loss_nan_ranks": 0, "loss_rank_avg": 0.18564224243164062, "step": 1685, "valid_targets_mean": 6143.1, "valid_targets_min": 1246 }, { "epoch": 1.7108860759493671, "grad_norm": 0.3175894026472926, "learning_rate": 3.328359615203762e-05, "loss": 0.3183, "loss_nan_ranks": 0, "loss_rank_avg": 0.19139517843723297, "step": 1690, "valid_targets_mean": 5133.2, "valid_targets_min": 1080 }, { "epoch": 1.7159493670886077, "grad_norm": 0.27972490266827565, "learning_rate": 3.323068903271476e-05, "loss": 0.3344, "loss_nan_ranks": 0, "loss_rank_avg": 0.11912492662668228, "step": 1695, "valid_targets_mean": 4236.9, "valid_targets_min": 1213 }, { "epoch": 1.7210126582278482, "grad_norm": 0.28905133463909916, "learning_rate": 3.317761676176825e-05, "loss": 0.326, "loss_nan_ranks": 0, "loss_rank_avg": 0.1582462191581726, "step": 1700, "valid_targets_mean": 5365.8, "valid_targets_min": 1347 }, { "epoch": 1.7260759493670887, "grad_norm": 0.2928951231194897, "learning_rate": 3.31243800016709e-05, "loss": 0.3223, "loss_nan_ranks": 0, "loss_rank_avg": 0.16399666666984558, "step": 1705, "valid_targets_mean": 4478.1, "valid_targets_min": 913 }, { "epoch": 1.7311392405063293, "grad_norm": 0.3067909993527847, "learning_rate": 3.307097941694876e-05, "loss": 0.3203, "loss_nan_ranks": 0, "loss_rank_avg": 0.1793975532054901, "step": 1710, "valid_targets_mean": 4923.8, "valid_targets_min": 1793 }, { "epoch": 1.7362025316455696, "grad_norm": 0.29679310025747774, "learning_rate": 3.3017415674172795e-05, "loss": 0.3205, "loss_nan_ranks": 0, "loss_rank_avg": 0.1398848444223404, "step": 1715, "valid_targets_mean": 3729.8, "valid_targets_min": 1281 }, { "epoch": 1.7412658227848101, "grad_norm": 0.33157110353633035, "learning_rate": 3.296368944195059e-05, "loss": 0.3258, "loss_nan_ranks": 0, "loss_rank_avg": 0.16532516479492188, "step": 1720, "valid_targets_mean": 4614.5, "valid_targets_min": 1146 }, { "epoch": 1.7463291139240507, "grad_norm": 0.3237383031466305, "learning_rate": 3.2909801390918e-05, "loss": 0.3165, "loss_nan_ranks": 0, "loss_rank_avg": 0.16484834253787994, "step": 1725, "valid_targets_mean": 4277.1, "valid_targets_min": 1022 }, { "epoch": 1.7513924050632912, "grad_norm": 0.30303998742275196, "learning_rate": 3.285575219373079e-05, "loss": 0.3068, "loss_nan_ranks": 0, "loss_rank_avg": 0.1231764703989029, "step": 1730, "valid_targets_mean": 3492.9, "valid_targets_min": 908 }, { "epoch": 1.7564556962025315, "grad_norm": 0.3131204074959935, "learning_rate": 3.2801542525056204e-05, "loss": 0.3236, "loss_nan_ranks": 0, "loss_rank_avg": 0.16018734872341156, "step": 1735, "valid_targets_mean": 4216.1, "valid_targets_min": 909 }, { "epoch": 1.761518987341772, "grad_norm": 0.5226006047690179, "learning_rate": 3.27471730615646e-05, "loss": 0.3168, "loss_nan_ranks": 0, "loss_rank_avg": 0.13336879014968872, "step": 1740, "valid_targets_mean": 3926.2, "valid_targets_min": 1825 }, { "epoch": 1.7665822784810126, "grad_norm": 0.288468699839479, "learning_rate": 3.2692644481920926e-05, "loss": 0.3091, "loss_nan_ranks": 0, "loss_rank_avg": 0.1637478768825531, "step": 1745, "valid_targets_mean": 5375.8, "valid_targets_min": 1193 }, { "epoch": 1.771645569620253, "grad_norm": 0.3345448593431147, "learning_rate": 3.263795746677633e-05, "loss": 0.3169, "loss_nan_ranks": 0, "loss_rank_avg": 0.1924804151058197, "step": 1750, "valid_targets_mean": 4262.6, "valid_targets_min": 1246 }, { "epoch": 1.7767088607594936, "grad_norm": 0.31362215927542564, "learning_rate": 3.258311269875959e-05, "loss": 0.3295, "loss_nan_ranks": 0, "loss_rank_avg": 0.17079243063926697, "step": 1755, "valid_targets_mean": 4860.1, "valid_targets_min": 1270 }, { "epoch": 1.7817721518987342, "grad_norm": 0.2881402537381144, "learning_rate": 3.2528110862468664e-05, "loss": 0.3212, "loss_nan_ranks": 0, "loss_rank_avg": 0.1843501329421997, "step": 1760, "valid_targets_mean": 5736.6, "valid_targets_min": 1442 }, { "epoch": 1.7868354430379747, "grad_norm": 0.33940507923082636, "learning_rate": 3.247295264446209e-05, "loss": 0.332, "loss_nan_ranks": 0, "loss_rank_avg": 0.14896419644355774, "step": 1765, "valid_targets_mean": 4003.1, "valid_targets_min": 960 }, { "epoch": 1.7918987341772152, "grad_norm": 0.305481958944062, "learning_rate": 3.241763873325044e-05, "loss": 0.3321, "loss_nan_ranks": 0, "loss_rank_avg": 0.1464659869670868, "step": 1770, "valid_targets_mean": 4571.4, "valid_targets_min": 1342 }, { "epoch": 1.7969620253164558, "grad_norm": 0.3372959294620817, "learning_rate": 3.2362169819287714e-05, "loss": 0.3198, "loss_nan_ranks": 0, "loss_rank_avg": 0.17976534366607666, "step": 1775, "valid_targets_mean": 4028.4, "valid_targets_min": 1261 }, { "epoch": 1.8020253164556963, "grad_norm": 0.3104430678347615, "learning_rate": 3.2306546594962744e-05, "loss": 0.3274, "loss_nan_ranks": 0, "loss_rank_avg": 0.16419640183448792, "step": 1780, "valid_targets_mean": 4230.2, "valid_targets_min": 1132 }, { "epoch": 1.8070886075949368, "grad_norm": 0.3241781257834898, "learning_rate": 3.225076975459051e-05, "loss": 0.3243, "loss_nan_ranks": 0, "loss_rank_avg": 0.21455496549606323, "step": 1785, "valid_targets_mean": 7327.5, "valid_targets_min": 1343 }, { "epoch": 1.8121518987341774, "grad_norm": 0.3169044936479542, "learning_rate": 3.219483999440354e-05, "loss": 0.3169, "loss_nan_ranks": 0, "loss_rank_avg": 0.12079709023237228, "step": 1790, "valid_targets_mean": 3173.1, "valid_targets_min": 1329 }, { "epoch": 1.8172151898734177, "grad_norm": 0.331980276874436, "learning_rate": 3.213875801254314e-05, "loss": 0.3276, "loss_nan_ranks": 0, "loss_rank_avg": 0.14299997687339783, "step": 1795, "valid_targets_mean": 3476.8, "valid_targets_min": 942 }, { "epoch": 1.8222784810126582, "grad_norm": 0.25978521097127444, "learning_rate": 3.2082524509050723e-05, "loss": 0.3194, "loss_nan_ranks": 0, "loss_rank_avg": 0.14637430012226105, "step": 1800, "valid_targets_mean": 5356.4, "valid_targets_min": 1492 }, { "epoch": 1.8273417721518987, "grad_norm": 0.4563427674089283, "learning_rate": 3.20261401858591e-05, "loss": 0.3246, "loss_nan_ranks": 0, "loss_rank_avg": 0.16923454403877258, "step": 1805, "valid_targets_mean": 4621.6, "valid_targets_min": 954 }, { "epoch": 1.8324050632911393, "grad_norm": 0.28306126650762187, "learning_rate": 3.196960574678363e-05, "loss": 0.3335, "loss_nan_ranks": 0, "loss_rank_avg": 0.11796549707651138, "step": 1810, "valid_targets_mean": 4214.6, "valid_targets_min": 1296 }, { "epoch": 1.8374683544303796, "grad_norm": 0.32499866336342004, "learning_rate": 3.191292189751353e-05, "loss": 0.3441, "loss_nan_ranks": 0, "loss_rank_avg": 0.1776324212551117, "step": 1815, "valid_targets_mean": 5706.0, "valid_targets_min": 1377 }, { "epoch": 1.8425316455696201, "grad_norm": 0.29118017187843964, "learning_rate": 3.185608934560301e-05, "loss": 0.3105, "loss_nan_ranks": 0, "loss_rank_avg": 0.12048833072185516, "step": 1820, "valid_targets_mean": 3490.6, "valid_targets_min": 1465 }, { "epoch": 1.8475949367088607, "grad_norm": 0.3114271880772345, "learning_rate": 3.1799108800462466e-05, "loss": 0.3377, "loss_nan_ranks": 0, "loss_rank_avg": 0.14511121809482574, "step": 1825, "valid_targets_mean": 3770.2, "valid_targets_min": 1165 }, { "epoch": 1.8526582278481012, "grad_norm": 0.28385385385120393, "learning_rate": 3.174198097334959e-05, "loss": 0.3248, "loss_nan_ranks": 0, "loss_rank_avg": 0.16951501369476318, "step": 1830, "valid_targets_mean": 4812.1, "valid_targets_min": 995 }, { "epoch": 1.8577215189873417, "grad_norm": 0.33205815359378843, "learning_rate": 3.168470657736053e-05, "loss": 0.3306, "loss_nan_ranks": 0, "loss_rank_avg": 0.1585332751274109, "step": 1835, "valid_targets_mean": 5364.6, "valid_targets_min": 1166 }, { "epoch": 1.8627848101265823, "grad_norm": 0.31689534847164214, "learning_rate": 3.162728632742098e-05, "loss": 0.3115, "loss_nan_ranks": 0, "loss_rank_avg": 0.16908031702041626, "step": 1840, "valid_targets_mean": 4225.1, "valid_targets_min": 1101 }, { "epoch": 1.8678481012658228, "grad_norm": 0.3087921045352938, "learning_rate": 3.1569720940277267e-05, "loss": 0.3178, "loss_nan_ranks": 0, "loss_rank_avg": 0.17665991187095642, "step": 1845, "valid_targets_mean": 4580.1, "valid_targets_min": 1284 }, { "epoch": 1.8729113924050633, "grad_norm": 0.28162350739466746, "learning_rate": 3.151201113448735e-05, "loss": 0.3198, "loss_nan_ranks": 0, "loss_rank_avg": 0.16834816336631775, "step": 1850, "valid_targets_mean": 5581.1, "valid_targets_min": 1362 }, { "epoch": 1.8779746835443039, "grad_norm": 0.33622728572725646, "learning_rate": 3.1454157630411905e-05, "loss": 0.3297, "loss_nan_ranks": 0, "loss_rank_avg": 0.13378959894180298, "step": 1855, "valid_targets_mean": 3264.8, "valid_targets_min": 1178 }, { "epoch": 1.8830379746835444, "grad_norm": 0.2888883767197038, "learning_rate": 3.1396161150205324e-05, "loss": 0.3243, "loss_nan_ranks": 0, "loss_rank_avg": 0.15173028409481049, "step": 1860, "valid_targets_mean": 5245.6, "valid_targets_min": 1061 }, { "epoch": 1.888101265822785, "grad_norm": 0.3008873149690533, "learning_rate": 3.133802241780669e-05, "loss": 0.3417, "loss_nan_ranks": 0, "loss_rank_avg": 0.168132483959198, "step": 1865, "valid_targets_mean": 5342.9, "valid_targets_min": 1360 }, { "epoch": 1.8931645569620255, "grad_norm": 0.30961408751335806, "learning_rate": 3.127974215893075e-05, "loss": 0.3319, "loss_nan_ranks": 0, "loss_rank_avg": 0.15519672632217407, "step": 1870, "valid_targets_mean": 4829.4, "valid_targets_min": 1051 }, { "epoch": 1.8982278481012658, "grad_norm": 0.3375894079078535, "learning_rate": 3.1221321101058826e-05, "loss": 0.3233, "loss_nan_ranks": 0, "loss_rank_avg": 0.2031598687171936, "step": 1875, "valid_targets_mean": 4846.2, "valid_targets_min": 1616 }, { "epoch": 1.9032911392405063, "grad_norm": 0.30102939403192525, "learning_rate": 3.116275997342979e-05, "loss": 0.3328, "loss_nan_ranks": 0, "loss_rank_avg": 0.1768466830253601, "step": 1880, "valid_targets_mean": 5417.4, "valid_targets_min": 1149 }, { "epoch": 1.9083544303797468, "grad_norm": 0.31204461528240096, "learning_rate": 3.110405950703091e-05, "loss": 0.3286, "loss_nan_ranks": 0, "loss_rank_avg": 0.15786431729793549, "step": 1885, "valid_targets_mean": 4424.1, "valid_targets_min": 1590 }, { "epoch": 1.9134177215189874, "grad_norm": 0.3212411559315451, "learning_rate": 3.104522043458875e-05, "loss": 0.3326, "loss_nan_ranks": 0, "loss_rank_avg": 0.15173178911209106, "step": 1890, "valid_targets_mean": 3546.5, "valid_targets_min": 1048 }, { "epoch": 1.918481012658228, "grad_norm": 0.3477054279687247, "learning_rate": 3.098624349056003e-05, "loss": 0.3131, "loss_nan_ranks": 0, "loss_rank_avg": 0.09834770858287811, "step": 1895, "valid_targets_mean": 3314.4, "valid_targets_min": 1081 }, { "epoch": 1.9235443037974682, "grad_norm": 0.3224350947488976, "learning_rate": 3.0927129411122433e-05, "loss": 0.3307, "loss_nan_ranks": 0, "loss_rank_avg": 0.1967785656452179, "step": 1900, "valid_targets_mean": 5401.0, "valid_targets_min": 1631 }, { "epoch": 1.9286075949367087, "grad_norm": 0.3407210065894635, "learning_rate": 3.086787893416543e-05, "loss": 0.3344, "loss_nan_ranks": 0, "loss_rank_avg": 0.15977072715759277, "step": 1905, "valid_targets_mean": 3843.9, "valid_targets_min": 1465 }, { "epoch": 1.9336708860759493, "grad_norm": 0.3048824087454436, "learning_rate": 3.080849279928108e-05, "loss": 0.3186, "loss_nan_ranks": 0, "loss_rank_avg": 0.21388033032417297, "step": 1910, "valid_targets_mean": 5811.2, "valid_targets_min": 735 }, { "epoch": 1.9387341772151898, "grad_norm": 0.3220507717171466, "learning_rate": 3.074897174775478e-05, "loss": 0.3231, "loss_nan_ranks": 0, "loss_rank_avg": 0.17468535900115967, "step": 1915, "valid_targets_mean": 4189.4, "valid_targets_min": 1442 }, { "epoch": 1.9437974683544303, "grad_norm": 0.33220201972445723, "learning_rate": 3.0689316522556026e-05, "loss": 0.3242, "loss_nan_ranks": 0, "loss_rank_avg": 0.1948956400156021, "step": 1920, "valid_targets_mean": 4742.3, "valid_targets_min": 1598 }, { "epoch": 1.9488607594936709, "grad_norm": 0.32448507249493624, "learning_rate": 3.062952786832912e-05, "loss": 0.3189, "loss_nan_ranks": 0, "loss_rank_avg": 0.1440562605857849, "step": 1925, "valid_targets_mean": 4186.6, "valid_targets_min": 1640 }, { "epoch": 1.9539240506329114, "grad_norm": 0.29766519811078285, "learning_rate": 3.05696065313839e-05, "loss": 0.3306, "loss_nan_ranks": 0, "loss_rank_avg": 0.18304754793643951, "step": 1930, "valid_targets_mean": 6132.7, "valid_targets_min": 1516 }, { "epoch": 1.958987341772152, "grad_norm": 0.2949900786324887, "learning_rate": 3.050955325968641e-05, "loss": 0.3211, "loss_nan_ranks": 0, "loss_rank_avg": 0.15778782963752747, "step": 1935, "valid_targets_mean": 5078.4, "valid_targets_min": 1196 }, { "epoch": 1.9640506329113925, "grad_norm": 0.3263199970381054, "learning_rate": 3.0449368802849553e-05, "loss": 0.3181, "loss_nan_ranks": 0, "loss_rank_avg": 0.14029563963413239, "step": 1940, "valid_targets_mean": 4289.6, "valid_targets_min": 1207 }, { "epoch": 1.969113924050633, "grad_norm": 0.3116697424009326, "learning_rate": 3.0389053912123755e-05, "loss": 0.3215, "loss_nan_ranks": 0, "loss_rank_avg": 0.1622355878353119, "step": 1945, "valid_targets_mean": 4043.3, "valid_targets_min": 1217 }, { "epoch": 1.9741772151898735, "grad_norm": 0.33957146598689614, "learning_rate": 3.0328609340387584e-05, "loss": 0.319, "loss_nan_ranks": 0, "loss_rank_avg": 0.1829889565706253, "step": 1950, "valid_targets_mean": 3790.2, "valid_targets_min": 768 }, { "epoch": 1.979240506329114, "grad_norm": 0.31004887940586384, "learning_rate": 3.026803584213834e-05, "loss": 0.3196, "loss_nan_ranks": 0, "loss_rank_avg": 0.1571284979581833, "step": 1955, "valid_targets_mean": 4538.4, "valid_targets_min": 956 }, { "epoch": 1.9843037974683544, "grad_norm": 0.2945095160712328, "learning_rate": 3.0207334173482635e-05, "loss": 0.3223, "loss_nan_ranks": 0, "loss_rank_avg": 0.14519169926643372, "step": 1960, "valid_targets_mean": 3616.2, "valid_targets_min": 1058 }, { "epoch": 1.989367088607595, "grad_norm": 0.29690655635239654, "learning_rate": 3.0146505092126987e-05, "loss": 0.3159, "loss_nan_ranks": 0, "loss_rank_avg": 0.14115923643112183, "step": 1965, "valid_targets_mean": 4046.1, "valid_targets_min": 1832 }, { "epoch": 1.9944303797468355, "grad_norm": 0.3836659337432429, "learning_rate": 3.0085549357368316e-05, "loss": 0.3245, "loss_nan_ranks": 0, "loss_rank_avg": 0.16044825315475464, "step": 1970, "valid_targets_mean": 4667.9, "valid_targets_min": 1443 }, { "epoch": 1.999493670886076, "grad_norm": 0.3322124150108135, "learning_rate": 3.0024467730084508e-05, "loss": 0.3169, "loss_nan_ranks": 0, "loss_rank_avg": 0.12640810012817383, "step": 1975, "valid_targets_mean": 3170.9, "valid_targets_min": 832 }, { "epoch": 2.0040506329113925, "grad_norm": 0.3291075554103832, "learning_rate": 2.996326097272487e-05, "loss": 0.2897, "loss_nan_ranks": 0, "loss_rank_avg": 0.16433456540107727, "step": 1980, "valid_targets_mean": 4258.9, "valid_targets_min": 1370 }, { "epoch": 2.009113924050633, "grad_norm": 0.28624539538450133, "learning_rate": 2.9901929849300676e-05, "loss": 0.3121, "loss_nan_ranks": 0, "loss_rank_avg": 0.156062513589859, "step": 1985, "valid_targets_mean": 5479.2, "valid_targets_min": 1383 }, { "epoch": 2.0141772151898736, "grad_norm": 0.31864237413570884, "learning_rate": 2.984047512537557e-05, "loss": 0.3086, "loss_nan_ranks": 0, "loss_rank_avg": 0.17700161039829254, "step": 1990, "valid_targets_mean": 4326.2, "valid_targets_min": 1491 }, { "epoch": 2.019240506329114, "grad_norm": 0.29138155253699194, "learning_rate": 2.977889756805604e-05, "loss": 0.2973, "loss_nan_ranks": 0, "loss_rank_avg": 0.19598735868930817, "step": 1995, "valid_targets_mean": 5823.9, "valid_targets_min": 1470 }, { "epoch": 2.0243037974683546, "grad_norm": 0.32618376749689376, "learning_rate": 2.9717197945981844e-05, "loss": 0.3078, "loss_nan_ranks": 0, "loss_rank_avg": 0.14639677107334137, "step": 2000, "valid_targets_mean": 3956.3, "valid_targets_min": 1251 }, { "epoch": 2.0293670886075947, "grad_norm": 0.3231822134904899, "learning_rate": 2.9655377029316415e-05, "loss": 0.3038, "loss_nan_ranks": 0, "loss_rank_avg": 0.1973341703414917, "step": 2005, "valid_targets_mean": 6070.5, "valid_targets_min": 1268 }, { "epoch": 2.0344303797468353, "grad_norm": 0.4445885950556669, "learning_rate": 2.9593435589737212e-05, "loss": 0.3081, "loss_nan_ranks": 0, "loss_rank_avg": 0.1424170434474945, "step": 2010, "valid_targets_mean": 3355.1, "valid_targets_min": 1257 }, { "epoch": 2.039493670886076, "grad_norm": 0.31012702805843667, "learning_rate": 2.9531374400426158e-05, "loss": 0.3029, "loss_nan_ranks": 0, "loss_rank_avg": 0.17267721891403198, "step": 2015, "valid_targets_mean": 5018.6, "valid_targets_min": 803 }, { "epoch": 2.0445569620253163, "grad_norm": 0.27456099255552485, "learning_rate": 2.9469194236059916e-05, "loss": 0.3109, "loss_nan_ranks": 0, "loss_rank_avg": 0.18913531303405762, "step": 2020, "valid_targets_mean": 6316.9, "valid_targets_min": 1565 }, { "epoch": 2.049620253164557, "grad_norm": 0.30759866121772944, "learning_rate": 2.940689587280027e-05, "loss": 0.3056, "loss_nan_ranks": 0, "loss_rank_avg": 0.17620842158794403, "step": 2025, "valid_targets_mean": 5025.1, "valid_targets_min": 1103 }, { "epoch": 2.0546835443037974, "grad_norm": 0.3107498769401775, "learning_rate": 2.9344480088284403e-05, "loss": 0.3108, "loss_nan_ranks": 0, "loss_rank_avg": 0.14356273412704468, "step": 2030, "valid_targets_mean": 3878.3, "valid_targets_min": 1435 }, { "epoch": 2.059746835443038, "grad_norm": 0.3272342894958522, "learning_rate": 2.9281947661615206e-05, "loss": 0.3141, "loss_nan_ranks": 0, "loss_rank_avg": 0.11045265197753906, "step": 2035, "valid_targets_mean": 2769.6, "valid_targets_min": 775 }, { "epoch": 2.0648101265822785, "grad_norm": 0.28376297804532025, "learning_rate": 2.921929937335157e-05, "loss": 0.3134, "loss_nan_ranks": 0, "loss_rank_avg": 0.18254786729812622, "step": 2040, "valid_targets_mean": 6384.8, "valid_targets_min": 726 }, { "epoch": 2.069873417721519, "grad_norm": 0.3494712370742931, "learning_rate": 2.9156536005498616e-05, "loss": 0.3226, "loss_nan_ranks": 0, "loss_rank_avg": 0.15539231896400452, "step": 2045, "valid_targets_mean": 3678.8, "valid_targets_min": 558 }, { "epoch": 2.0749367088607595, "grad_norm": 0.36306320132408093, "learning_rate": 2.909365834149792e-05, "loss": 0.3188, "loss_nan_ranks": 0, "loss_rank_avg": 0.16074064373970032, "step": 2050, "valid_targets_mean": 3803.6, "valid_targets_min": 992 }, { "epoch": 2.08, "grad_norm": 0.28771743850152404, "learning_rate": 2.903066716621779e-05, "loss": 0.3257, "loss_nan_ranks": 0, "loss_rank_avg": 0.17194947600364685, "step": 2055, "valid_targets_mean": 6007.1, "valid_targets_min": 788 }, { "epoch": 2.0850632911392406, "grad_norm": 0.3176958806269076, "learning_rate": 2.896756326594341e-05, "loss": 0.3174, "loss_nan_ranks": 0, "loss_rank_avg": 0.15832051634788513, "step": 2060, "valid_targets_mean": 4807.6, "valid_targets_min": 1533 }, { "epoch": 2.090126582278481, "grad_norm": 0.30643347389492315, "learning_rate": 2.890434742836706e-05, "loss": 0.3061, "loss_nan_ranks": 0, "loss_rank_avg": 0.17868554592132568, "step": 2065, "valid_targets_mean": 5870.9, "valid_targets_min": 1477 }, { "epoch": 2.0951898734177217, "grad_norm": 0.328300503212321, "learning_rate": 2.8841020442578274e-05, "loss": 0.3219, "loss_nan_ranks": 0, "loss_rank_avg": 0.15090826153755188, "step": 2070, "valid_targets_mean": 4159.4, "valid_targets_min": 767 }, { "epoch": 2.100253164556962, "grad_norm": 0.3116451598810816, "learning_rate": 2.8777583099053985e-05, "loss": 0.3096, "loss_nan_ranks": 0, "loss_rank_avg": 0.15223953127861023, "step": 2075, "valid_targets_mean": 4922.9, "valid_targets_min": 1236 }, { "epoch": 2.1053164556962027, "grad_norm": 0.32927381366700853, "learning_rate": 2.871403618964867e-05, "loss": 0.3177, "loss_nan_ranks": 0, "loss_rank_avg": 0.18153706192970276, "step": 2080, "valid_targets_mean": 4833.8, "valid_targets_min": 1513 }, { "epoch": 2.110379746835443, "grad_norm": 0.30099077420276216, "learning_rate": 2.8650380507584444e-05, "loss": 0.3185, "loss_nan_ranks": 0, "loss_rank_avg": 0.11155495047569275, "step": 2085, "valid_targets_mean": 3890.5, "valid_targets_min": 1469 }, { "epoch": 2.1154430379746834, "grad_norm": 0.304896658143913, "learning_rate": 2.8586616847441192e-05, "loss": 0.3203, "loss_nan_ranks": 0, "loss_rank_avg": 0.143421471118927, "step": 2090, "valid_targets_mean": 4747.4, "valid_targets_min": 849 }, { "epoch": 2.120506329113924, "grad_norm": 0.33627609235395134, "learning_rate": 2.852274600514662e-05, "loss": 0.3236, "loss_nan_ranks": 0, "loss_rank_avg": 0.17665691673755646, "step": 2095, "valid_targets_mean": 4558.9, "valid_targets_min": 1540 }, { "epoch": 2.1255696202531644, "grad_norm": 0.3025889533254811, "learning_rate": 2.8458768777966333e-05, "loss": 0.3151, "loss_nan_ranks": 0, "loss_rank_avg": 0.16682836413383484, "step": 2100, "valid_targets_mean": 5740.6, "valid_targets_min": 1809 }, { "epoch": 2.130632911392405, "grad_norm": 0.3039388867958498, "learning_rate": 2.8394685964493886e-05, "loss": 0.3029, "loss_nan_ranks": 0, "loss_rank_avg": 0.0811905711889267, "step": 2105, "valid_targets_mean": 3185.6, "valid_targets_min": 1428 }, { "epoch": 2.1356962025316455, "grad_norm": 0.34645798201468236, "learning_rate": 2.8330498364640803e-05, "loss": 0.3169, "loss_nan_ranks": 0, "loss_rank_avg": 0.20455661416053772, "step": 2110, "valid_targets_mean": 5101.9, "valid_targets_min": 1051 }, { "epoch": 2.140759493670886, "grad_norm": 0.2965620255799478, "learning_rate": 2.8266206779626604e-05, "loss": 0.2991, "loss_nan_ranks": 0, "loss_rank_avg": 0.15685412287712097, "step": 2115, "valid_targets_mean": 5286.0, "valid_targets_min": 1289 }, { "epoch": 2.1458227848101266, "grad_norm": 0.3555931137634147, "learning_rate": 2.8201812011968807e-05, "loss": 0.3027, "loss_nan_ranks": 0, "loss_rank_avg": 0.16602477431297302, "step": 2120, "valid_targets_mean": 4031.6, "valid_targets_min": 1147 }, { "epoch": 2.150886075949367, "grad_norm": 0.31549642905504277, "learning_rate": 2.8137314865472896e-05, "loss": 0.3115, "loss_nan_ranks": 0, "loss_rank_avg": 0.2147747278213501, "step": 2125, "valid_targets_mean": 5917.6, "valid_targets_min": 1516 }, { "epoch": 2.1559493670886076, "grad_norm": 0.3817360788487001, "learning_rate": 2.8072716145222295e-05, "loss": 0.3204, "loss_nan_ranks": 0, "loss_rank_avg": 0.1429363489151001, "step": 2130, "valid_targets_mean": 4846.5, "valid_targets_min": 1233 }, { "epoch": 2.161012658227848, "grad_norm": 0.29099253723913165, "learning_rate": 2.800801665756833e-05, "loss": 0.3076, "loss_nan_ranks": 0, "loss_rank_avg": 0.1667858213186264, "step": 2135, "valid_targets_mean": 5250.2, "valid_targets_min": 1352 }, { "epoch": 2.1660759493670887, "grad_norm": 0.31033307443976493, "learning_rate": 2.794321721012013e-05, "loss": 0.3174, "loss_nan_ranks": 0, "loss_rank_avg": 0.15342216193675995, "step": 2140, "valid_targets_mean": 4172.6, "valid_targets_min": 959 }, { "epoch": 2.1711392405063292, "grad_norm": 0.32002549909894445, "learning_rate": 2.78783186117346e-05, "loss": 0.3136, "loss_nan_ranks": 0, "loss_rank_avg": 0.1935744285583496, "step": 2145, "valid_targets_mean": 5775.0, "valid_targets_min": 1696 }, { "epoch": 2.1762025316455698, "grad_norm": 0.3337487659466844, "learning_rate": 2.7813321672506268e-05, "loss": 0.3176, "loss_nan_ranks": 0, "loss_rank_avg": 0.19408701360225677, "step": 2150, "valid_targets_mean": 5285.5, "valid_targets_min": 1837 }, { "epoch": 2.1812658227848103, "grad_norm": 0.30999599957531293, "learning_rate": 2.77482272037572e-05, "loss": 0.3085, "loss_nan_ranks": 0, "loss_rank_avg": 0.16555137932300568, "step": 2155, "valid_targets_mean": 4545.2, "valid_targets_min": 1035 }, { "epoch": 2.186329113924051, "grad_norm": 0.32893298945558314, "learning_rate": 2.768303601802689e-05, "loss": 0.3059, "loss_nan_ranks": 0, "loss_rank_avg": 0.15684665739536285, "step": 2160, "valid_targets_mean": 3914.8, "valid_targets_min": 1135 }, { "epoch": 2.191392405063291, "grad_norm": 0.32177861173163685, "learning_rate": 2.7617748929062084e-05, "loss": 0.3113, "loss_nan_ranks": 0, "loss_rank_avg": 0.13835042715072632, "step": 2165, "valid_targets_mean": 4624.2, "valid_targets_min": 911 }, { "epoch": 2.1964556962025314, "grad_norm": 0.2604316010544582, "learning_rate": 2.7552366751806624e-05, "loss": 0.296, "loss_nan_ranks": 0, "loss_rank_avg": 0.14997389912605286, "step": 2170, "valid_targets_mean": 6796.2, "valid_targets_min": 1292 }, { "epoch": 2.201518987341772, "grad_norm": 0.30476092949327993, "learning_rate": 2.7486890302391316e-05, "loss": 0.3064, "loss_nan_ranks": 0, "loss_rank_avg": 0.1621738076210022, "step": 2175, "valid_targets_mean": 5079.0, "valid_targets_min": 1369 }, { "epoch": 2.2065822784810125, "grad_norm": 0.3322580301103298, "learning_rate": 2.7421320398123702e-05, "loss": 0.3199, "loss_nan_ranks": 0, "loss_rank_avg": 0.1476869136095047, "step": 2180, "valid_targets_mean": 3784.2, "valid_targets_min": 1640 }, { "epoch": 2.211645569620253, "grad_norm": 0.2990722276821268, "learning_rate": 2.735565785747787e-05, "loss": 0.3077, "loss_nan_ranks": 0, "loss_rank_avg": 0.13568082451820374, "step": 2185, "valid_targets_mean": 4330.4, "valid_targets_min": 815 }, { "epoch": 2.2167088607594936, "grad_norm": 0.30616718547526817, "learning_rate": 2.728990350008423e-05, "loss": 0.3215, "loss_nan_ranks": 0, "loss_rank_avg": 0.17533037066459656, "step": 2190, "valid_targets_mean": 5132.6, "valid_targets_min": 949 }, { "epoch": 2.221772151898734, "grad_norm": 0.28127500881615763, "learning_rate": 2.722405814671931e-05, "loss": 0.2974, "loss_nan_ranks": 0, "loss_rank_avg": 0.134933739900589, "step": 2195, "valid_targets_mean": 5636.6, "valid_targets_min": 732 }, { "epoch": 2.2268354430379746, "grad_norm": 0.27748602615715384, "learning_rate": 2.715812261929548e-05, "loss": 0.3208, "loss_nan_ranks": 0, "loss_rank_avg": 0.1636897474527359, "step": 2200, "valid_targets_mean": 5998.6, "valid_targets_min": 1351 }, { "epoch": 2.231898734177215, "grad_norm": 0.3255757575300295, "learning_rate": 2.7092097740850712e-05, "loss": 0.3094, "loss_nan_ranks": 0, "loss_rank_avg": 0.1682029664516449, "step": 2205, "valid_targets_mean": 4255.6, "valid_targets_min": 1238 }, { "epoch": 2.2369620253164557, "grad_norm": 0.30015032841488015, "learning_rate": 2.7025984335538297e-05, "loss": 0.3163, "loss_nan_ranks": 0, "loss_rank_avg": 0.1712615191936493, "step": 2210, "valid_targets_mean": 5242.7, "valid_targets_min": 968 }, { "epoch": 2.2420253164556962, "grad_norm": 0.35257346632541897, "learning_rate": 2.6959783228616543e-05, "loss": 0.3258, "loss_nan_ranks": 0, "loss_rank_avg": 0.14988690614700317, "step": 2215, "valid_targets_mean": 3744.8, "valid_targets_min": 1368 }, { "epoch": 2.247088607594937, "grad_norm": 0.34270763531215714, "learning_rate": 2.6893495246438512e-05, "loss": 0.3099, "loss_nan_ranks": 0, "loss_rank_avg": 0.13658785820007324, "step": 2220, "valid_targets_mean": 3438.7, "valid_targets_min": 1173 }, { "epoch": 2.2521518987341773, "grad_norm": 0.3370660380071177, "learning_rate": 2.682712121644168e-05, "loss": 0.3137, "loss_nan_ranks": 0, "loss_rank_avg": 0.1949615478515625, "step": 2225, "valid_targets_mean": 4599.9, "valid_targets_min": 1016 }, { "epoch": 2.257215189873418, "grad_norm": 0.348355336462014, "learning_rate": 2.6760661967137597e-05, "loss": 0.3047, "loss_nan_ranks": 0, "loss_rank_avg": 0.16294927895069122, "step": 2230, "valid_targets_mean": 4107.5, "valid_targets_min": 1022 }, { "epoch": 2.2622784810126584, "grad_norm": 0.3249186301351007, "learning_rate": 2.6694118328101592e-05, "loss": 0.3144, "loss_nan_ranks": 0, "loss_rank_avg": 0.09672749042510986, "step": 2235, "valid_targets_mean": 2920.3, "valid_targets_min": 950 }, { "epoch": 2.267341772151899, "grad_norm": 0.30303571071751967, "learning_rate": 2.6627491129962343e-05, "loss": 0.2928, "loss_nan_ranks": 0, "loss_rank_avg": 0.1442355215549469, "step": 2240, "valid_targets_mean": 4454.2, "valid_targets_min": 1369 }, { "epoch": 2.2724050632911394, "grad_norm": 0.31715305103924707, "learning_rate": 2.6560781204391584e-05, "loss": 0.3084, "loss_nan_ranks": 0, "loss_rank_avg": 0.10361987352371216, "step": 2245, "valid_targets_mean": 3143.1, "valid_targets_min": 1447 }, { "epoch": 2.27746835443038, "grad_norm": 0.28484792889639327, "learning_rate": 2.6493989384093674e-05, "loss": 0.3142, "loss_nan_ranks": 0, "loss_rank_avg": 0.14160794019699097, "step": 2250, "valid_targets_mean": 4650.6, "valid_targets_min": 954 }, { "epoch": 2.28253164556962, "grad_norm": 0.2878082890562957, "learning_rate": 2.642711650279523e-05, "loss": 0.3094, "loss_nan_ranks": 0, "loss_rank_avg": 0.1957184076309204, "step": 2255, "valid_targets_mean": 5700.1, "valid_targets_min": 1450 }, { "epoch": 2.2875949367088606, "grad_norm": 0.28921634890872305, "learning_rate": 2.636016339523472e-05, "loss": 0.3086, "loss_nan_ranks": 0, "loss_rank_avg": 0.1497688591480255, "step": 2260, "valid_targets_mean": 5892.9, "valid_targets_min": 1182 }, { "epoch": 2.292658227848101, "grad_norm": 0.374304372121314, "learning_rate": 2.6293130897152005e-05, "loss": 0.3046, "loss_nan_ranks": 0, "loss_rank_avg": 0.10483106970787048, "step": 2265, "valid_targets_mean": 2732.1, "valid_targets_min": 909 }, { "epoch": 2.2977215189873417, "grad_norm": 0.360265224368032, "learning_rate": 2.6226019845277954e-05, "loss": 0.3026, "loss_nan_ranks": 0, "loss_rank_avg": 0.15251410007476807, "step": 2270, "valid_targets_mean": 3089.3, "valid_targets_min": 1121 }, { "epoch": 2.302784810126582, "grad_norm": 0.3076018448534471, "learning_rate": 2.615883107732398e-05, "loss": 0.2996, "loss_nan_ranks": 0, "loss_rank_avg": 0.10678346455097198, "step": 2275, "valid_targets_mean": 3471.9, "valid_targets_min": 1050 }, { "epoch": 2.3078481012658227, "grad_norm": 0.30671877576562406, "learning_rate": 2.609156543197158e-05, "loss": 0.3101, "loss_nan_ranks": 0, "loss_rank_avg": 0.18611571192741394, "step": 2280, "valid_targets_mean": 5213.1, "valid_targets_min": 1379 }, { "epoch": 2.3129113924050633, "grad_norm": 0.42457395280342314, "learning_rate": 2.6024223748861883e-05, "loss": 0.3039, "loss_nan_ranks": 0, "loss_rank_avg": 0.17773228883743286, "step": 2285, "valid_targets_mean": 5313.4, "valid_targets_min": 929 }, { "epoch": 2.317974683544304, "grad_norm": 0.343397113662205, "learning_rate": 2.5956806868585136e-05, "loss": 0.305, "loss_nan_ranks": 0, "loss_rank_avg": 0.1606595367193222, "step": 2290, "valid_targets_mean": 3827.6, "valid_targets_min": 1248 }, { "epoch": 2.3230379746835443, "grad_norm": 0.2808278753890521, "learning_rate": 2.5889315632670247e-05, "loss": 0.3132, "loss_nan_ranks": 0, "loss_rank_avg": 0.11440195143222809, "step": 2295, "valid_targets_mean": 3889.9, "valid_targets_min": 1216 }, { "epoch": 2.328101265822785, "grad_norm": 0.3112053561319972, "learning_rate": 2.582175088357426e-05, "loss": 0.3108, "loss_nan_ranks": 0, "loss_rank_avg": 0.14229443669319153, "step": 2300, "valid_targets_mean": 3906.9, "valid_targets_min": 1129 }, { "epoch": 2.3331645569620254, "grad_norm": 0.29738973838136984, "learning_rate": 2.575411346467185e-05, "loss": 0.304, "loss_nan_ranks": 0, "loss_rank_avg": 0.12370048463344574, "step": 2305, "valid_targets_mean": 4034.3, "valid_targets_min": 1620 }, { "epoch": 2.338227848101266, "grad_norm": 0.3012147807699108, "learning_rate": 2.568640422024478e-05, "loss": 0.3076, "loss_nan_ranks": 0, "loss_rank_avg": 0.2278967797756195, "step": 2310, "valid_targets_mean": 5961.9, "valid_targets_min": 1399 }, { "epoch": 2.3432911392405065, "grad_norm": 0.2922942701946769, "learning_rate": 2.5618623995471394e-05, "loss": 0.3133, "loss_nan_ranks": 0, "loss_rank_avg": 0.16622743010520935, "step": 2315, "valid_targets_mean": 5404.4, "valid_targets_min": 1235 }, { "epoch": 2.348354430379747, "grad_norm": 0.36432427585365534, "learning_rate": 2.5550773636416008e-05, "loss": 0.3196, "loss_nan_ranks": 0, "loss_rank_avg": 0.1854952722787857, "step": 2320, "valid_targets_mean": 3965.4, "valid_targets_min": 1201 }, { "epoch": 2.353417721518987, "grad_norm": 0.33468505049542446, "learning_rate": 2.548285399001843e-05, "loss": 0.3099, "loss_nan_ranks": 0, "loss_rank_avg": 0.15984870493412018, "step": 2325, "valid_targets_mean": 3767.3, "valid_targets_min": 900 }, { "epoch": 2.3584810126582276, "grad_norm": 0.30206170793614096, "learning_rate": 2.5414865904083314e-05, "loss": 0.3161, "loss_nan_ranks": 0, "loss_rank_avg": 0.18496757745742798, "step": 2330, "valid_targets_mean": 5605.0, "valid_targets_min": 1244 }, { "epoch": 2.363544303797468, "grad_norm": 0.3069574368019458, "learning_rate": 2.534681022726962e-05, "loss": 0.3143, "loss_nan_ranks": 0, "loss_rank_avg": 0.20892611145973206, "step": 2335, "valid_targets_mean": 5443.6, "valid_targets_min": 1904 }, { "epoch": 2.3686075949367087, "grad_norm": 0.324406187683953, "learning_rate": 2.5278687809080017e-05, "loss": 0.3157, "loss_nan_ranks": 0, "loss_rank_avg": 0.13418112695217133, "step": 2340, "valid_targets_mean": 3362.5, "valid_targets_min": 1043 }, { "epoch": 2.3736708860759492, "grad_norm": 0.32283224636579144, "learning_rate": 2.5210499499850252e-05, "loss": 0.3236, "loss_nan_ranks": 0, "loss_rank_avg": 0.14372019469738007, "step": 2345, "valid_targets_mean": 3757.2, "valid_targets_min": 1046 }, { "epoch": 2.3787341772151898, "grad_norm": 0.2954201993306155, "learning_rate": 2.5142246150738566e-05, "loss": 0.3132, "loss_nan_ranks": 0, "loss_rank_avg": 0.16226419806480408, "step": 2350, "valid_targets_mean": 5083.2, "valid_targets_min": 1909 }, { "epoch": 2.3837974683544303, "grad_norm": 0.278033728430402, "learning_rate": 2.5073928613715053e-05, "loss": 0.3122, "loss_nan_ranks": 0, "loss_rank_avg": 0.13732075691223145, "step": 2355, "valid_targets_mean": 5177.6, "valid_targets_min": 1378 }, { "epoch": 2.388860759493671, "grad_norm": 0.3406821151852307, "learning_rate": 2.5005547741551045e-05, "loss": 0.3207, "loss_nan_ranks": 0, "loss_rank_avg": 0.1702435463666916, "step": 2360, "valid_targets_mean": 3885.0, "valid_targets_min": 1146 }, { "epoch": 2.3939240506329114, "grad_norm": 0.2924901782943758, "learning_rate": 2.4937104387808434e-05, "loss": 0.3117, "loss_nan_ranks": 0, "loss_rank_avg": 0.17096886038780212, "step": 2365, "valid_targets_mean": 5283.7, "valid_targets_min": 1374 }, { "epoch": 2.398987341772152, "grad_norm": 0.30986779863862535, "learning_rate": 2.4868599406829045e-05, "loss": 0.308, "loss_nan_ranks": 0, "loss_rank_avg": 0.17868509888648987, "step": 2370, "valid_targets_mean": 4610.5, "valid_targets_min": 824 }, { "epoch": 2.4040506329113924, "grad_norm": 0.2951664773380052, "learning_rate": 2.4800033653723962e-05, "loss": 0.3137, "loss_nan_ranks": 0, "loss_rank_avg": 0.14138385653495789, "step": 2375, "valid_targets_mean": 4383.0, "valid_targets_min": 1267 }, { "epoch": 2.409113924050633, "grad_norm": 0.3206066119244924, "learning_rate": 2.473140798436285e-05, "loss": 0.3221, "loss_nan_ranks": 0, "loss_rank_avg": 0.150266632437706, "step": 2380, "valid_targets_mean": 3835.7, "valid_targets_min": 1476 }, { "epoch": 2.4141772151898735, "grad_norm": 0.30473370037176944, "learning_rate": 2.466272325536329e-05, "loss": 0.3015, "loss_nan_ranks": 0, "loss_rank_avg": 0.19058401882648468, "step": 2385, "valid_targets_mean": 6384.8, "valid_targets_min": 935 }, { "epoch": 2.419240506329114, "grad_norm": 0.31479938811797176, "learning_rate": 2.4593980324080054e-05, "loss": 0.3267, "loss_nan_ranks": 0, "loss_rank_avg": 0.11872898042201996, "step": 2390, "valid_targets_mean": 3557.1, "valid_targets_min": 1099 }, { "epoch": 2.4243037974683546, "grad_norm": 0.3392666541666469, "learning_rate": 2.4525180048594452e-05, "loss": 0.3163, "loss_nan_ranks": 0, "loss_rank_avg": 0.15524475276470184, "step": 2395, "valid_targets_mean": 4042.5, "valid_targets_min": 1334 }, { "epoch": 2.429367088607595, "grad_norm": 0.3116160865837986, "learning_rate": 2.445632328770354e-05, "loss": 0.3079, "loss_nan_ranks": 0, "loss_rank_avg": 0.14736303687095642, "step": 2400, "valid_targets_mean": 4778.8, "valid_targets_min": 1194 }, { "epoch": 2.4344303797468356, "grad_norm": 0.3248761370284341, "learning_rate": 2.438741090090951e-05, "loss": 0.3148, "loss_nan_ranks": 0, "loss_rank_avg": 0.1985064595937729, "step": 2405, "valid_targets_mean": 6140.9, "valid_targets_min": 1429 }, { "epoch": 2.439493670886076, "grad_norm": 0.2819598660386808, "learning_rate": 2.431844374840886e-05, "loss": 0.3066, "loss_nan_ranks": 0, "loss_rank_avg": 0.13578057289123535, "step": 2410, "valid_targets_mean": 4853.0, "valid_targets_min": 1602 }, { "epoch": 2.4445569620253167, "grad_norm": 0.31885986982040326, "learning_rate": 2.4249422691081722e-05, "loss": 0.3057, "loss_nan_ranks": 0, "loss_rank_avg": 0.15936186909675598, "step": 2415, "valid_targets_mean": 4181.2, "valid_targets_min": 1349 }, { "epoch": 2.449620253164557, "grad_norm": 0.30296726343845826, "learning_rate": 2.4180348590481075e-05, "loss": 0.3026, "loss_nan_ranks": 0, "loss_rank_avg": 0.12165558338165283, "step": 2420, "valid_targets_mean": 3419.1, "valid_targets_min": 883 }, { "epoch": 2.4546835443037973, "grad_norm": 0.309483869681844, "learning_rate": 2.411122230882203e-05, "loss": 0.3102, "loss_nan_ranks": 0, "loss_rank_avg": 0.1562597155570984, "step": 2425, "valid_targets_mean": 4920.2, "valid_targets_min": 983 }, { "epoch": 2.459746835443038, "grad_norm": 1.2885193054997446, "learning_rate": 2.4042044708971027e-05, "loss": 0.3045, "loss_nan_ranks": 0, "loss_rank_avg": 0.1394486129283905, "step": 2430, "valid_targets_mean": 4328.4, "valid_targets_min": 1162 }, { "epoch": 2.4648101265822784, "grad_norm": 0.27206002510649857, "learning_rate": 2.3972816654435103e-05, "loss": 0.3161, "loss_nan_ranks": 0, "loss_rank_avg": 0.16065040230751038, "step": 2435, "valid_targets_mean": 6525.3, "valid_targets_min": 1098 }, { "epoch": 2.469873417721519, "grad_norm": 0.3427940884240252, "learning_rate": 2.390353900935107e-05, "loss": 0.3198, "loss_nan_ranks": 0, "loss_rank_avg": 0.19091764092445374, "step": 2440, "valid_targets_mean": 4360.0, "valid_targets_min": 1133 }, { "epoch": 2.4749367088607594, "grad_norm": 0.42327373841330385, "learning_rate": 2.3834212638474773e-05, "loss": 0.306, "loss_nan_ranks": 0, "loss_rank_avg": 0.12319037318229675, "step": 2445, "valid_targets_mean": 3837.3, "valid_targets_min": 873 }, { "epoch": 2.48, "grad_norm": 0.49287136211086113, "learning_rate": 2.376483840717026e-05, "loss": 0.3236, "loss_nan_ranks": 0, "loss_rank_avg": 0.15457025170326233, "step": 2450, "valid_targets_mean": 3929.6, "valid_targets_min": 1205 }, { "epoch": 2.4850632911392405, "grad_norm": 0.32265608836896076, "learning_rate": 2.3695417181399004e-05, "loss": 0.3138, "loss_nan_ranks": 0, "loss_rank_avg": 0.13117042183876038, "step": 2455, "valid_targets_mean": 3683.8, "valid_targets_min": 1015 }, { "epoch": 2.490126582278481, "grad_norm": 0.28497626230687617, "learning_rate": 2.362594982770909e-05, "loss": 0.3071, "loss_nan_ranks": 0, "loss_rank_avg": 0.13846123218536377, "step": 2460, "valid_targets_mean": 4725.8, "valid_targets_min": 1651 }, { "epoch": 2.4951898734177216, "grad_norm": 0.30556606202877784, "learning_rate": 2.3556437213224378e-05, "loss": 0.3149, "loss_nan_ranks": 0, "loss_rank_avg": 0.1903924196958542, "step": 2465, "valid_targets_mean": 5195.9, "valid_targets_min": 1317 }, { "epoch": 2.500253164556962, "grad_norm": 0.2957801020557521, "learning_rate": 2.348688020563371e-05, "loss": 0.3202, "loss_nan_ranks": 0, "loss_rank_avg": 0.15225407481193542, "step": 2470, "valid_targets_mean": 4614.5, "valid_targets_min": 892 }, { "epoch": 2.5053164556962026, "grad_norm": 0.29068264222113155, "learning_rate": 2.3417279673180048e-05, "loss": 0.312, "loss_nan_ranks": 0, "loss_rank_avg": 0.15005727112293243, "step": 2475, "valid_targets_mean": 5253.2, "valid_targets_min": 1364 }, { "epoch": 2.510379746835443, "grad_norm": 0.34824655792906656, "learning_rate": 2.3347636484649662e-05, "loss": 0.3107, "loss_nan_ranks": 0, "loss_rank_avg": 0.11774547398090363, "step": 2480, "valid_targets_mean": 3077.8, "valid_targets_min": 1062 }, { "epoch": 2.5154430379746833, "grad_norm": 0.3255931573908884, "learning_rate": 2.3277951509361273e-05, "loss": 0.3317, "loss_nan_ranks": 0, "loss_rank_avg": 0.20479710400104523, "step": 2485, "valid_targets_mean": 5133.7, "valid_targets_min": 1091 }, { "epoch": 2.520506329113924, "grad_norm": 0.30263280385351665, "learning_rate": 2.3208225617155206e-05, "loss": 0.3121, "loss_nan_ranks": 0, "loss_rank_avg": 0.14676184952259064, "step": 2490, "valid_targets_mean": 4788.9, "valid_targets_min": 1004 }, { "epoch": 2.5255696202531643, "grad_norm": 0.34344447055299104, "learning_rate": 2.3138459678382524e-05, "loss": 0.3156, "loss_nan_ranks": 0, "loss_rank_avg": 0.18363483250141144, "step": 2495, "valid_targets_mean": 4170.4, "valid_targets_min": 1007 }, { "epoch": 2.530632911392405, "grad_norm": 0.2844384480121892, "learning_rate": 2.3068654563894183e-05, "loss": 0.3172, "loss_nan_ranks": 0, "loss_rank_avg": 0.12592104077339172, "step": 2500, "valid_targets_mean": 4493.2, "valid_targets_min": 1334 }, { "epoch": 2.5356962025316454, "grad_norm": 0.32631729959150463, "learning_rate": 2.2998811145030117e-05, "loss": 0.3101, "loss_nan_ranks": 0, "loss_rank_avg": 0.15357106924057007, "step": 2505, "valid_targets_mean": 4361.8, "valid_targets_min": 1071 }, { "epoch": 2.540759493670886, "grad_norm": 0.2650853449197667, "learning_rate": 2.2928930293608435e-05, "loss": 0.307, "loss_nan_ranks": 0, "loss_rank_avg": 0.13759788870811462, "step": 2510, "valid_targets_mean": 5130.8, "valid_targets_min": 1080 }, { "epoch": 2.5458227848101265, "grad_norm": 0.3267807848788021, "learning_rate": 2.2859012881914464e-05, "loss": 0.3037, "loss_nan_ranks": 0, "loss_rank_avg": 0.16794613003730774, "step": 2515, "valid_targets_mean": 4673.6, "valid_targets_min": 1083 }, { "epoch": 2.550886075949367, "grad_norm": 0.278879282582265, "learning_rate": 2.278905978268992e-05, "loss": 0.2928, "loss_nan_ranks": 0, "loss_rank_avg": 0.11442182958126068, "step": 2520, "valid_targets_mean": 4874.6, "valid_targets_min": 1101 }, { "epoch": 2.5559493670886075, "grad_norm": 0.32085560175743244, "learning_rate": 2.271907186912196e-05, "loss": 0.3119, "loss_nan_ranks": 0, "loss_rank_avg": 0.12187394499778748, "step": 2525, "valid_targets_mean": 3503.1, "valid_targets_min": 882 }, { "epoch": 2.561012658227848, "grad_norm": 0.3284259732307929, "learning_rate": 2.2649050014832326e-05, "loss": 0.3112, "loss_nan_ranks": 0, "loss_rank_avg": 0.16201844811439514, "step": 2530, "valid_targets_mean": 4727.4, "valid_targets_min": 1505 }, { "epoch": 2.5660759493670886, "grad_norm": 0.2991569094124765, "learning_rate": 2.2578995093866424e-05, "loss": 0.3126, "loss_nan_ranks": 0, "loss_rank_avg": 0.1367436945438385, "step": 2535, "valid_targets_mean": 5286.4, "valid_targets_min": 1301 }, { "epoch": 2.571139240506329, "grad_norm": 0.2923839601296598, "learning_rate": 2.2508907980682406e-05, "loss": 0.3066, "loss_nan_ranks": 0, "loss_rank_avg": 0.15937817096710205, "step": 2540, "valid_targets_mean": 5033.3, "valid_targets_min": 1409 }, { "epoch": 2.5762025316455697, "grad_norm": 0.29834149017437644, "learning_rate": 2.2438789550140272e-05, "loss": 0.3208, "loss_nan_ranks": 0, "loss_rank_avg": 0.1662355363368988, "step": 2545, "valid_targets_mean": 4474.9, "valid_targets_min": 1458 }, { "epoch": 2.58126582278481, "grad_norm": 0.31248285204558157, "learning_rate": 2.2368640677490935e-05, "loss": 0.3111, "loss_nan_ranks": 0, "loss_rank_avg": 0.12987586855888367, "step": 2550, "valid_targets_mean": 4253.7, "valid_targets_min": 1334 }, { "epoch": 2.5863291139240507, "grad_norm": 0.2913592791130016, "learning_rate": 2.2298462238365293e-05, "loss": 0.3037, "loss_nan_ranks": 0, "loss_rank_avg": 0.20642492175102234, "step": 2555, "valid_targets_mean": 6304.3, "valid_targets_min": 1349 }, { "epoch": 2.5913924050632913, "grad_norm": 0.35349413261981677, "learning_rate": 2.222825510876332e-05, "loss": 0.3202, "loss_nan_ranks": 0, "loss_rank_avg": 0.17145583033561707, "step": 2560, "valid_targets_mean": 4713.6, "valid_targets_min": 1409 }, { "epoch": 2.596455696202532, "grad_norm": 0.3451688511848506, "learning_rate": 2.2158020165043114e-05, "loss": 0.3105, "loss_nan_ranks": 0, "loss_rank_avg": 0.16764461994171143, "step": 2565, "valid_targets_mean": 3924.4, "valid_targets_min": 1285 }, { "epoch": 2.6015189873417723, "grad_norm": 0.2797909726976478, "learning_rate": 2.2087758283909954e-05, "loss": 0.3196, "loss_nan_ranks": 0, "loss_rank_avg": 0.1547449380159378, "step": 2570, "valid_targets_mean": 5481.8, "valid_targets_min": 1376 }, { "epoch": 2.606582278481013, "grad_norm": 0.3101010476898593, "learning_rate": 2.201747034240537e-05, "loss": 0.3135, "loss_nan_ranks": 0, "loss_rank_avg": 0.1627534031867981, "step": 2575, "valid_targets_mean": 4466.9, "valid_targets_min": 987 }, { "epoch": 2.6116455696202534, "grad_norm": 1.1618173704395123, "learning_rate": 2.1947157217896188e-05, "loss": 0.3095, "loss_nan_ranks": 0, "loss_rank_avg": 0.165956050157547, "step": 2580, "valid_targets_mean": 4300.5, "valid_targets_min": 778 }, { "epoch": 2.616708860759494, "grad_norm": 0.31858634458407287, "learning_rate": 2.1876819788063586e-05, "loss": 0.3115, "loss_nan_ranks": 0, "loss_rank_avg": 0.15230509638786316, "step": 2585, "valid_targets_mean": 3920.5, "valid_targets_min": 1479 }, { "epoch": 2.621772151898734, "grad_norm": 0.30557996470586596, "learning_rate": 2.1806458930892127e-05, "loss": 0.3005, "loss_nan_ranks": 0, "loss_rank_avg": 0.18883772194385529, "step": 2590, "valid_targets_mean": 6008.9, "valid_targets_min": 1408 }, { "epoch": 2.6268354430379746, "grad_norm": 0.2883450262202285, "learning_rate": 2.173607552465881e-05, "loss": 0.3166, "loss_nan_ranks": 0, "loss_rank_avg": 0.17338699102401733, "step": 2595, "valid_targets_mean": 5570.2, "valid_targets_min": 1526 }, { "epoch": 2.631898734177215, "grad_norm": 0.33234113394369846, "learning_rate": 2.1665670447922084e-05, "loss": 0.3129, "loss_nan_ranks": 0, "loss_rank_avg": 0.12816452980041504, "step": 2600, "valid_targets_mean": 4282.2, "valid_targets_min": 812 }, { "epoch": 2.6369620253164556, "grad_norm": 0.31643919888427663, "learning_rate": 2.1595244579510933e-05, "loss": 0.3073, "loss_nan_ranks": 0, "loss_rank_avg": 0.17621192336082458, "step": 2605, "valid_targets_mean": 5060.8, "valid_targets_min": 1369 }, { "epoch": 2.642025316455696, "grad_norm": 0.30039427757871706, "learning_rate": 2.1524798798513835e-05, "loss": 0.3023, "loss_nan_ranks": 0, "loss_rank_avg": 0.16294711828231812, "step": 2610, "valid_targets_mean": 4472.4, "valid_targets_min": 1304 }, { "epoch": 2.6470886075949367, "grad_norm": 0.3231328181820057, "learning_rate": 2.1454333984267852e-05, "loss": 0.322, "loss_nan_ranks": 0, "loss_rank_avg": 0.16857695579528809, "step": 2615, "valid_targets_mean": 5128.5, "valid_targets_min": 1215 }, { "epoch": 2.6521518987341772, "grad_norm": 0.331376941255876, "learning_rate": 2.1383851016347614e-05, "loss": 0.3105, "loss_nan_ranks": 0, "loss_rank_avg": 0.1293996274471283, "step": 2620, "valid_targets_mean": 3696.2, "valid_targets_min": 781 }, { "epoch": 2.6572151898734178, "grad_norm": 0.2898986778677013, "learning_rate": 2.1313350774554366e-05, "loss": 0.308, "loss_nan_ranks": 0, "loss_rank_avg": 0.14066889882087708, "step": 2625, "valid_targets_mean": 4409.5, "valid_targets_min": 1181 }, { "epoch": 2.6622784810126583, "grad_norm": 0.3792545064079998, "learning_rate": 2.1242834138904962e-05, "loss": 0.3034, "loss_nan_ranks": 0, "loss_rank_avg": 0.14408881962299347, "step": 2630, "valid_targets_mean": 3892.1, "valid_targets_min": 1313 }, { "epoch": 2.667341772151899, "grad_norm": 0.34582044479522395, "learning_rate": 2.1172301989620898e-05, "loss": 0.3087, "loss_nan_ranks": 0, "loss_rank_avg": 0.15445685386657715, "step": 2635, "valid_targets_mean": 4015.2, "valid_targets_min": 743 }, { "epoch": 2.6724050632911394, "grad_norm": 0.31734348855671907, "learning_rate": 2.110175520711731e-05, "loss": 0.3182, "loss_nan_ranks": 0, "loss_rank_avg": 0.14247769117355347, "step": 2640, "valid_targets_mean": 4152.1, "valid_targets_min": 1532 }, { "epoch": 2.67746835443038, "grad_norm": 0.3108375470698165, "learning_rate": 2.1031194671992013e-05, "loss": 0.3145, "loss_nan_ranks": 0, "loss_rank_avg": 0.13973818719387054, "step": 2645, "valid_targets_mean": 4321.8, "valid_targets_min": 1096 }, { "epoch": 2.68253164556962, "grad_norm": 0.3378134291776038, "learning_rate": 2.0960621265014462e-05, "loss": 0.3105, "loss_nan_ranks": 0, "loss_rank_avg": 0.17127710580825806, "step": 2650, "valid_targets_mean": 4009.1, "valid_targets_min": 1241 }, { "epoch": 2.6875949367088605, "grad_norm": 0.29939660412855834, "learning_rate": 2.0890035867114808e-05, "loss": 0.3131, "loss_nan_ranks": 0, "loss_rank_avg": 0.15695559978485107, "step": 2655, "valid_targets_mean": 5238.8, "valid_targets_min": 1128 }, { "epoch": 2.692658227848101, "grad_norm": 0.3230482978021318, "learning_rate": 2.081943935937286e-05, "loss": 0.3075, "loss_nan_ranks": 0, "loss_rank_avg": 0.1587713658809662, "step": 2660, "valid_targets_mean": 4748.3, "valid_targets_min": 1323 }, { "epoch": 2.6977215189873416, "grad_norm": 0.29402248645547446, "learning_rate": 2.0748832623007117e-05, "loss": 0.3217, "loss_nan_ranks": 0, "loss_rank_avg": 0.10896088182926178, "step": 2665, "valid_targets_mean": 3750.2, "valid_targets_min": 1426 }, { "epoch": 2.702784810126582, "grad_norm": 0.27936531158953143, "learning_rate": 2.067821653936375e-05, "loss": 0.3005, "loss_nan_ranks": 0, "loss_rank_avg": 0.1711559295654297, "step": 2670, "valid_targets_mean": 6852.6, "valid_targets_min": 1209 }, { "epoch": 2.7078481012658226, "grad_norm": 0.28924656402783777, "learning_rate": 2.060759198990561e-05, "loss": 0.3086, "loss_nan_ranks": 0, "loss_rank_avg": 0.14176371693611145, "step": 2675, "valid_targets_mean": 5084.8, "valid_targets_min": 1430 }, { "epoch": 2.712911392405063, "grad_norm": 0.3123266627731589, "learning_rate": 2.053695985620123e-05, "loss": 0.3074, "loss_nan_ranks": 0, "loss_rank_avg": 0.15624725818634033, "step": 2680, "valid_targets_mean": 4276.9, "valid_targets_min": 1150 }, { "epoch": 2.7179746835443037, "grad_norm": 0.30428837341523135, "learning_rate": 2.0466321019913787e-05, "loss": 0.3083, "loss_nan_ranks": 0, "loss_rank_avg": 0.12444409728050232, "step": 2685, "valid_targets_mean": 5104.2, "valid_targets_min": 1036 }, { "epoch": 2.7230379746835442, "grad_norm": 0.2899541063761625, "learning_rate": 2.0395676362790157e-05, "loss": 0.3139, "loss_nan_ranks": 0, "loss_rank_avg": 0.18925632536411285, "step": 2690, "valid_targets_mean": 6929.8, "valid_targets_min": 1156 }, { "epoch": 2.728101265822785, "grad_norm": 0.3000387772557557, "learning_rate": 2.032502676664985e-05, "loss": 0.3256, "loss_nan_ranks": 0, "loss_rank_avg": 0.15346036851406097, "step": 2695, "valid_targets_mean": 4285.7, "valid_targets_min": 1379 }, { "epoch": 2.7331645569620253, "grad_norm": 0.3021057118413619, "learning_rate": 2.025437311337404e-05, "loss": 0.3162, "loss_nan_ranks": 0, "loss_rank_avg": 0.14610332250595093, "step": 2700, "valid_targets_mean": 4591.1, "valid_targets_min": 1675 }, { "epoch": 2.738227848101266, "grad_norm": 0.32691877516784146, "learning_rate": 2.0183716284894533e-05, "loss": 0.3225, "loss_nan_ranks": 0, "loss_rank_avg": 0.14551448822021484, "step": 2705, "valid_targets_mean": 3989.2, "valid_targets_min": 919 }, { "epoch": 2.7432911392405064, "grad_norm": 0.3657473594680315, "learning_rate": 2.011305716318278e-05, "loss": 0.3074, "loss_nan_ranks": 0, "loss_rank_avg": 0.22241473197937012, "step": 2710, "valid_targets_mean": 6030.1, "valid_targets_min": 1316 }, { "epoch": 2.748354430379747, "grad_norm": 0.3038961961226564, "learning_rate": 2.004239663023885e-05, "loss": 0.3028, "loss_nan_ranks": 0, "loss_rank_avg": 0.16947516798973083, "step": 2715, "valid_targets_mean": 5248.6, "valid_targets_min": 1555 }, { "epoch": 2.7534177215189874, "grad_norm": 0.3050248442776484, "learning_rate": 1.997173556808043e-05, "loss": 0.294, "loss_nan_ranks": 0, "loss_rank_avg": 0.1630948781967163, "step": 2720, "valid_targets_mean": 5884.7, "valid_targets_min": 895 }, { "epoch": 2.758481012658228, "grad_norm": 0.35402206211471576, "learning_rate": 1.9901074858731825e-05, "loss": 0.2996, "loss_nan_ranks": 0, "loss_rank_avg": 0.1823733150959015, "step": 2725, "valid_targets_mean": 4029.6, "valid_targets_min": 1404 }, { "epoch": 2.7635443037974685, "grad_norm": 0.2902629337004639, "learning_rate": 1.98304153842129e-05, "loss": 0.313, "loss_nan_ranks": 0, "loss_rank_avg": 0.1647607535123825, "step": 2730, "valid_targets_mean": 5231.3, "valid_targets_min": 1100 }, { "epoch": 2.768607594936709, "grad_norm": 0.2844550099011252, "learning_rate": 1.9759758026528162e-05, "loss": 0.3181, "loss_nan_ranks": 0, "loss_rank_avg": 0.20809857547283173, "step": 2735, "valid_targets_mean": 6735.6, "valid_targets_min": 1644 }, { "epoch": 2.7736708860759496, "grad_norm": 0.3348579330081765, "learning_rate": 1.9689103667655634e-05, "loss": 0.3088, "loss_nan_ranks": 0, "loss_rank_avg": 0.1527232825756073, "step": 2740, "valid_targets_mean": 3877.4, "valid_targets_min": 1491 }, { "epoch": 2.77873417721519, "grad_norm": 0.33857120124730805, "learning_rate": 1.9618453189535958e-05, "loss": 0.3168, "loss_nan_ranks": 0, "loss_rank_avg": 0.20601877570152283, "step": 2745, "valid_targets_mean": 4548.2, "valid_targets_min": 1232 }, { "epoch": 2.7837974683544306, "grad_norm": 0.3346701582946249, "learning_rate": 1.9547807474061303e-05, "loss": 0.2983, "loss_nan_ranks": 0, "loss_rank_avg": 0.13511428236961365, "step": 2750, "valid_targets_mean": 3345.6, "valid_targets_min": 1298 }, { "epoch": 2.7888607594936707, "grad_norm": 0.3375591584241796, "learning_rate": 1.947716740306439e-05, "loss": 0.3089, "loss_nan_ranks": 0, "loss_rank_avg": 0.16758695244789124, "step": 2755, "valid_targets_mean": 3964.9, "valid_targets_min": 1047 }, { "epoch": 2.7939240506329113, "grad_norm": 0.340384343325027, "learning_rate": 1.9406533858307503e-05, "loss": 0.3178, "loss_nan_ranks": 0, "loss_rank_avg": 0.1304406374692917, "step": 2760, "valid_targets_mean": 3351.9, "valid_targets_min": 1109 }, { "epoch": 2.798987341772152, "grad_norm": 0.29188887212643894, "learning_rate": 1.9335907721471438e-05, "loss": 0.3042, "loss_nan_ranks": 0, "loss_rank_avg": 0.15948455035686493, "step": 2765, "valid_targets_mean": 4508.9, "valid_targets_min": 970 }, { "epoch": 2.8040506329113923, "grad_norm": 0.2914363526376243, "learning_rate": 1.9265289874144554e-05, "loss": 0.3112, "loss_nan_ranks": 0, "loss_rank_avg": 0.18582302331924438, "step": 2770, "valid_targets_mean": 6648.4, "valid_targets_min": 2048 }, { "epoch": 2.809113924050633, "grad_norm": 0.3447263204953251, "learning_rate": 1.9194681197811703e-05, "loss": 0.3154, "loss_nan_ranks": 0, "loss_rank_avg": 0.11537902057170868, "step": 2775, "valid_targets_mean": 3061.1, "valid_targets_min": 1261 }, { "epoch": 2.8141772151898734, "grad_norm": 0.28824906654455074, "learning_rate": 1.912408257384327e-05, "loss": 0.3173, "loss_nan_ranks": 0, "loss_rank_avg": 0.18753370642662048, "step": 2780, "valid_targets_mean": 6277.4, "valid_targets_min": 1561 }, { "epoch": 2.819240506329114, "grad_norm": 0.31551057795248955, "learning_rate": 1.9053494883484177e-05, "loss": 0.3012, "loss_nan_ranks": 0, "loss_rank_avg": 0.1113462746143341, "step": 2785, "valid_targets_mean": 3603.0, "valid_targets_min": 966 }, { "epoch": 2.8243037974683545, "grad_norm": 0.3130169957194376, "learning_rate": 1.898291900784284e-05, "loss": 0.3045, "loss_nan_ranks": 0, "loss_rank_avg": 0.17591753602027893, "step": 2790, "valid_targets_mean": 4849.0, "valid_targets_min": 1241 }, { "epoch": 2.829367088607595, "grad_norm": 0.36153291519489483, "learning_rate": 1.8912355827880237e-05, "loss": 0.3166, "loss_nan_ranks": 0, "loss_rank_avg": 0.13046428561210632, "step": 2795, "valid_targets_mean": 3138.6, "valid_targets_min": 1174 }, { "epoch": 2.8344303797468355, "grad_norm": 0.35818567026601295, "learning_rate": 1.884180622439884e-05, "loss": 0.3105, "loss_nan_ranks": 0, "loss_rank_avg": 0.15154902637004852, "step": 2800, "valid_targets_mean": 3774.6, "valid_targets_min": 731 }, { "epoch": 2.839493670886076, "grad_norm": 0.33153674409005546, "learning_rate": 1.8771271078031648e-05, "loss": 0.3064, "loss_nan_ranks": 0, "loss_rank_avg": 0.17227354645729065, "step": 2805, "valid_targets_mean": 5559.2, "valid_targets_min": 981 }, { "epoch": 2.8445569620253166, "grad_norm": 0.30646195273462673, "learning_rate": 1.8700751269231243e-05, "loss": 0.3028, "loss_nan_ranks": 0, "loss_rank_avg": 0.17971369624137878, "step": 2810, "valid_targets_mean": 5315.5, "valid_targets_min": 1235 }, { "epoch": 2.8496202531645567, "grad_norm": 0.3147470597121468, "learning_rate": 1.86302476782587e-05, "loss": 0.3005, "loss_nan_ranks": 0, "loss_rank_avg": 0.1408463716506958, "step": 2815, "valid_targets_mean": 3962.4, "valid_targets_min": 820 }, { "epoch": 2.8546835443037972, "grad_norm": 0.35549269402291417, "learning_rate": 1.855976118517271e-05, "loss": 0.3075, "loss_nan_ranks": 0, "loss_rank_avg": 0.19130544364452362, "step": 2820, "valid_targets_mean": 4855.5, "valid_targets_min": 959 }, { "epoch": 2.8597468354430378, "grad_norm": 0.2823602428424915, "learning_rate": 1.8489292669818494e-05, "loss": 0.3066, "loss_nan_ranks": 0, "loss_rank_avg": 0.1796441674232483, "step": 2825, "valid_targets_mean": 5933.9, "valid_targets_min": 1652 }, { "epoch": 2.8648101265822783, "grad_norm": 0.3086469012489834, "learning_rate": 1.8418843011816894e-05, "loss": 0.3113, "loss_nan_ranks": 0, "loss_rank_avg": 0.14876966178417206, "step": 2830, "valid_targets_mean": 4459.1, "valid_targets_min": 1431 }, { "epoch": 2.869873417721519, "grad_norm": 0.33219619271405165, "learning_rate": 1.8348413090553356e-05, "loss": 0.3147, "loss_nan_ranks": 0, "loss_rank_avg": 0.1837439239025116, "step": 2835, "valid_targets_mean": 5042.5, "valid_targets_min": 1015 }, { "epoch": 2.8749367088607594, "grad_norm": 0.28160060670414677, "learning_rate": 1.8278003785166967e-05, "loss": 0.2942, "loss_nan_ranks": 0, "loss_rank_avg": 0.13023114204406738, "step": 2840, "valid_targets_mean": 4408.2, "valid_targets_min": 1093 }, { "epoch": 2.88, "grad_norm": 0.2701611603230975, "learning_rate": 1.8207615974539476e-05, "loss": 0.3064, "loss_nan_ranks": 0, "loss_rank_avg": 0.12874723970890045, "step": 2845, "valid_targets_mean": 4858.8, "valid_targets_min": 863 }, { "epoch": 2.8850632911392404, "grad_norm": 0.33079935847646824, "learning_rate": 1.8137250537284325e-05, "loss": 0.3093, "loss_nan_ranks": 0, "loss_rank_avg": 0.17800703644752502, "step": 2850, "valid_targets_mean": 4857.1, "valid_targets_min": 1713 }, { "epoch": 2.890126582278481, "grad_norm": 0.23595757958591787, "learning_rate": 1.8066908351735666e-05, "loss": 0.3019, "loss_nan_ranks": 0, "loss_rank_avg": 0.1269092708826065, "step": 2855, "valid_targets_mean": 5766.2, "valid_targets_min": 1183 }, { "epoch": 2.8951898734177215, "grad_norm": 0.33538165041242207, "learning_rate": 1.7996590295937448e-05, "loss": 0.3038, "loss_nan_ranks": 0, "loss_rank_avg": 0.1899298131465912, "step": 2860, "valid_targets_mean": 5260.9, "valid_targets_min": 1500 }, { "epoch": 2.900253164556962, "grad_norm": 0.3124645131733068, "learning_rate": 1.7926297247632383e-05, "loss": 0.3207, "loss_nan_ranks": 0, "loss_rank_avg": 0.1435328722000122, "step": 2865, "valid_targets_mean": 3785.1, "valid_targets_min": 1048 }, { "epoch": 2.9053164556962026, "grad_norm": 0.3305614452127962, "learning_rate": 1.7856030084251045e-05, "loss": 0.3098, "loss_nan_ranks": 0, "loss_rank_avg": 0.1552894562482834, "step": 2870, "valid_targets_mean": 4255.3, "valid_targets_min": 844 }, { "epoch": 2.910379746835443, "grad_norm": 0.34874837954634086, "learning_rate": 1.7785789682900908e-05, "loss": 0.3082, "loss_nan_ranks": 0, "loss_rank_avg": 0.14497388899326324, "step": 2875, "valid_targets_mean": 3286.0, "valid_targets_min": 1279 }, { "epoch": 2.9154430379746836, "grad_norm": 0.3321474887097409, "learning_rate": 1.771557692035537e-05, "loss": 0.3062, "loss_nan_ranks": 0, "loss_rank_avg": 0.14671984314918518, "step": 2880, "valid_targets_mean": 4362.1, "valid_targets_min": 897 }, { "epoch": 2.920506329113924, "grad_norm": 0.36664765144869893, "learning_rate": 1.7645392673042853e-05, "loss": 0.3298, "loss_nan_ranks": 0, "loss_rank_avg": 0.20450638234615326, "step": 2885, "valid_targets_mean": 3744.9, "valid_targets_min": 536 }, { "epoch": 2.9255696202531647, "grad_norm": 0.30800064070091415, "learning_rate": 1.757523781703581e-05, "loss": 0.3135, "loss_nan_ranks": 0, "loss_rank_avg": 0.13620543479919434, "step": 2890, "valid_targets_mean": 4010.2, "valid_targets_min": 739 }, { "epoch": 2.9306329113924052, "grad_norm": 0.39874064817665694, "learning_rate": 1.7505113228039848e-05, "loss": 0.3146, "loss_nan_ranks": 0, "loss_rank_avg": 0.17097340524196625, "step": 2895, "valid_targets_mean": 4104.1, "valid_targets_min": 1037 }, { "epoch": 2.9356962025316458, "grad_norm": 0.30804629166037306, "learning_rate": 1.7435019781382737e-05, "loss": 0.297, "loss_nan_ranks": 0, "loss_rank_avg": 0.14079098403453827, "step": 2900, "valid_targets_mean": 4534.0, "valid_targets_min": 887 }, { "epoch": 2.9407594936708863, "grad_norm": 0.306220364172818, "learning_rate": 1.7364958352003548e-05, "loss": 0.3174, "loss_nan_ranks": 0, "loss_rank_avg": 0.17645467817783356, "step": 2905, "valid_targets_mean": 4994.2, "valid_targets_min": 1148 }, { "epoch": 2.945822784810127, "grad_norm": 0.3179633647838338, "learning_rate": 1.7294929814441666e-05, "loss": 0.3231, "loss_nan_ranks": 0, "loss_rank_avg": 0.16111071407794952, "step": 2910, "valid_targets_mean": 4938.6, "valid_targets_min": 1387 }, { "epoch": 2.9508860759493674, "grad_norm": 0.31641771807614866, "learning_rate": 1.7224935042825912e-05, "loss": 0.3152, "loss_nan_ranks": 0, "loss_rank_avg": 0.16131725907325745, "step": 2915, "valid_targets_mean": 4423.9, "valid_targets_min": 810 }, { "epoch": 2.9559493670886074, "grad_norm": 0.2900729323232742, "learning_rate": 1.7154974910863646e-05, "loss": 0.3077, "loss_nan_ranks": 0, "loss_rank_avg": 0.10794432461261749, "step": 2920, "valid_targets_mean": 3454.4, "valid_targets_min": 1456 }, { "epoch": 2.961012658227848, "grad_norm": 0.3432477720018123, "learning_rate": 1.7085050291829813e-05, "loss": 0.3036, "loss_nan_ranks": 0, "loss_rank_avg": 0.15215110778808594, "step": 2925, "valid_targets_mean": 4236.8, "valid_targets_min": 1238 }, { "epoch": 2.9660759493670885, "grad_norm": 0.31507659068073507, "learning_rate": 1.7015162058556088e-05, "loss": 0.3208, "loss_nan_ranks": 0, "loss_rank_avg": 0.16133321821689606, "step": 2930, "valid_targets_mean": 4263.9, "valid_targets_min": 795 }, { "epoch": 2.971139240506329, "grad_norm": 0.29285158348676216, "learning_rate": 1.6945311083419947e-05, "loss": 0.2976, "loss_nan_ranks": 0, "loss_rank_avg": 0.1742202341556549, "step": 2935, "valid_targets_mean": 5417.0, "valid_targets_min": 1360 }, { "epoch": 2.9762025316455696, "grad_norm": 0.2918602342182722, "learning_rate": 1.68754982383338e-05, "loss": 0.3007, "loss_nan_ranks": 0, "loss_rank_avg": 0.1684986650943756, "step": 2940, "valid_targets_mean": 5456.4, "valid_targets_min": 1200 }, { "epoch": 2.98126582278481, "grad_norm": 0.30561630865463585, "learning_rate": 1.6805724394734107e-05, "loss": 0.3008, "loss_nan_ranks": 0, "loss_rank_avg": 0.10106837749481201, "step": 2945, "valid_targets_mean": 3017.5, "valid_targets_min": 1279 }, { "epoch": 2.9863291139240506, "grad_norm": 0.29442534234659645, "learning_rate": 1.6735990423570477e-05, "loss": 0.3234, "loss_nan_ranks": 0, "loss_rank_avg": 0.13497650623321533, "step": 2950, "valid_targets_mean": 3993.2, "valid_targets_min": 1015 }, { "epoch": 2.991392405063291, "grad_norm": 0.2700507094407274, "learning_rate": 1.666629719529483e-05, "loss": 0.3185, "loss_nan_ranks": 0, "loss_rank_avg": 0.15681613981723785, "step": 2955, "valid_targets_mean": 4630.2, "valid_targets_min": 1176 }, { "epoch": 2.9964556962025317, "grad_norm": 0.3447693878105072, "learning_rate": 1.6596645579850505e-05, "loss": 0.3107, "loss_nan_ranks": 0, "loss_rank_avg": 0.1600763201713562, "step": 2960, "valid_targets_mean": 3677.3, "valid_targets_min": 1107 }, { "epoch": 3.001012658227848, "grad_norm": 0.29622484390463744, "learning_rate": 1.6527036446661396e-05, "loss": 0.3123, "loss_nan_ranks": 0, "loss_rank_avg": 0.14927029609680176, "step": 2965, "valid_targets_mean": 4862.4, "valid_targets_min": 1322 }, { "epoch": 3.0060759493670886, "grad_norm": 0.29785828676100873, "learning_rate": 1.645747066462115e-05, "loss": 0.3021, "loss_nan_ranks": 0, "loss_rank_avg": 0.19526249170303345, "step": 2970, "valid_targets_mean": 5885.6, "valid_targets_min": 1447 }, { "epoch": 3.011139240506329, "grad_norm": 0.35112230405979555, "learning_rate": 1.638794910208225e-05, "loss": 0.2898, "loss_nan_ranks": 0, "loss_rank_avg": 0.10469535738229752, "step": 2975, "valid_targets_mean": 2940.2, "valid_targets_min": 1159 }, { "epoch": 3.0162025316455696, "grad_norm": 0.3772315133305102, "learning_rate": 1.631847262684523e-05, "loss": 0.3108, "loss_nan_ranks": 0, "loss_rank_avg": 0.16602087020874023, "step": 2980, "valid_targets_mean": 4357.8, "valid_targets_min": 1389 }, { "epoch": 3.02126582278481, "grad_norm": 0.30911220110322923, "learning_rate": 1.624904210614782e-05, "loss": 0.3033, "loss_nan_ranks": 0, "loss_rank_avg": 0.1612570881843567, "step": 2985, "valid_targets_mean": 4494.7, "valid_targets_min": 1244 }, { "epoch": 3.0263291139240507, "grad_norm": 0.3517033326754291, "learning_rate": 1.6179658406654113e-05, "loss": 0.2958, "loss_nan_ranks": 0, "loss_rank_avg": 0.17958399653434753, "step": 2990, "valid_targets_mean": 4044.6, "valid_targets_min": 1324 }, { "epoch": 3.031392405063291, "grad_norm": 0.28226563989162823, "learning_rate": 1.6110322394443773e-05, "loss": 0.2853, "loss_nan_ranks": 0, "loss_rank_avg": 0.11023816466331482, "step": 2995, "valid_targets_mean": 4105.8, "valid_targets_min": 1267 }, { "epoch": 3.0364556962025318, "grad_norm": 0.3395674314450887, "learning_rate": 1.60410349350012e-05, "loss": 0.3034, "loss_nan_ranks": 0, "loss_rank_avg": 0.17015889286994934, "step": 3000, "valid_targets_mean": 5613.8, "valid_targets_min": 1423 }, { "epoch": 3.0415189873417723, "grad_norm": 0.3328019254619737, "learning_rate": 1.597179689320474e-05, "loss": 0.3068, "loss_nan_ranks": 0, "loss_rank_avg": 0.16885250806808472, "step": 3005, "valid_targets_mean": 4626.2, "valid_targets_min": 1034 }, { "epoch": 3.046582278481013, "grad_norm": 0.30137258092800007, "learning_rate": 1.5902609133315888e-05, "loss": 0.3026, "loss_nan_ranks": 0, "loss_rank_avg": 0.14555740356445312, "step": 3010, "valid_targets_mean": 5118.1, "valid_targets_min": 1378 }, { "epoch": 3.0516455696202534, "grad_norm": 0.32251822208809916, "learning_rate": 1.5833472518968478e-05, "loss": 0.3049, "loss_nan_ranks": 0, "loss_rank_avg": 0.13226641714572906, "step": 3015, "valid_targets_mean": 4081.9, "valid_targets_min": 1428 }, { "epoch": 3.056708860759494, "grad_norm": 0.3211101552341726, "learning_rate": 1.5764387913157952e-05, "loss": 0.3185, "loss_nan_ranks": 0, "loss_rank_avg": 0.0971713736653328, "step": 3020, "valid_targets_mean": 3146.8, "valid_targets_min": 1380 }, { "epoch": 3.061772151898734, "grad_norm": 0.3360390373855527, "learning_rate": 1.5695356178230527e-05, "loss": 0.3062, "loss_nan_ranks": 0, "loss_rank_avg": 0.12469463050365448, "step": 3025, "valid_targets_mean": 3152.8, "valid_targets_min": 1004 }, { "epoch": 3.0668354430379745, "grad_norm": 0.29385960506365055, "learning_rate": 1.5626378175872486e-05, "loss": 0.2921, "loss_nan_ranks": 0, "loss_rank_avg": 0.16584698855876923, "step": 3030, "valid_targets_mean": 5578.9, "valid_targets_min": 1238 }, { "epoch": 3.071898734177215, "grad_norm": 0.32789137808560437, "learning_rate": 1.5557454767099382e-05, "loss": 0.2935, "loss_nan_ranks": 0, "loss_rank_avg": 0.17390216886997223, "step": 3035, "valid_targets_mean": 4741.9, "valid_targets_min": 1219 }, { "epoch": 3.0769620253164556, "grad_norm": 0.3234941533877886, "learning_rate": 1.5488586812245302e-05, "loss": 0.3027, "loss_nan_ranks": 0, "loss_rank_avg": 0.17046749591827393, "step": 3040, "valid_targets_mean": 4481.4, "valid_targets_min": 1174 }, { "epoch": 3.082025316455696, "grad_norm": 0.28075430375987626, "learning_rate": 1.541977517095215e-05, "loss": 0.3003, "loss_nan_ranks": 0, "loss_rank_avg": 0.14547553658485413, "step": 3045, "valid_targets_mean": 5410.0, "valid_targets_min": 1228 }, { "epoch": 3.0870886075949366, "grad_norm": 0.28635813947594835, "learning_rate": 1.5351020702158875e-05, "loss": 0.3099, "loss_nan_ranks": 0, "loss_rank_avg": 0.13441359996795654, "step": 3050, "valid_targets_mean": 5051.8, "valid_targets_min": 960 }, { "epoch": 3.092151898734177, "grad_norm": 0.34800039286889395, "learning_rate": 1.52823242640908e-05, "loss": 0.3096, "loss_nan_ranks": 0, "loss_rank_avg": 0.15158754587173462, "step": 3055, "valid_targets_mean": 3697.4, "valid_targets_min": 1086 }, { "epoch": 3.0972151898734177, "grad_norm": 0.32310977392742785, "learning_rate": 1.5213686714248852e-05, "loss": 0.3082, "loss_nan_ranks": 0, "loss_rank_avg": 0.16765525937080383, "step": 3060, "valid_targets_mean": 4845.2, "valid_targets_min": 1334 }, { "epoch": 3.1022784810126582, "grad_norm": 0.296724917732042, "learning_rate": 1.5145108909398896e-05, "loss": 0.3042, "loss_nan_ranks": 0, "loss_rank_avg": 0.14354108273983002, "step": 3065, "valid_targets_mean": 4783.9, "valid_targets_min": 1333 }, { "epoch": 3.1073417721518988, "grad_norm": 0.42288485229336514, "learning_rate": 1.5076591705561056e-05, "loss": 0.3054, "loss_nan_ranks": 0, "loss_rank_avg": 0.16323769092559814, "step": 3070, "valid_targets_mean": 3961.5, "valid_targets_min": 1451 }, { "epoch": 3.1124050632911393, "grad_norm": 0.29888536735808585, "learning_rate": 1.5008135957998968e-05, "loss": 0.3097, "loss_nan_ranks": 0, "loss_rank_avg": 0.16281160712242126, "step": 3075, "valid_targets_mean": 5095.7, "valid_targets_min": 989 }, { "epoch": 3.11746835443038, "grad_norm": 0.32246738234879885, "learning_rate": 1.4939742521209178e-05, "loss": 0.3136, "loss_nan_ranks": 0, "loss_rank_avg": 0.142366424202919, "step": 3080, "valid_targets_mean": 3786.1, "valid_targets_min": 776 }, { "epoch": 3.1225316455696204, "grad_norm": 0.2885458143447489, "learning_rate": 1.4871412248910416e-05, "loss": 0.3112, "loss_nan_ranks": 0, "loss_rank_avg": 0.1399984061717987, "step": 3085, "valid_targets_mean": 5652.7, "valid_targets_min": 1058 }, { "epoch": 3.127594936708861, "grad_norm": 0.3436698843544968, "learning_rate": 1.480314599403296e-05, "loss": 0.3051, "loss_nan_ranks": 0, "loss_rank_avg": 0.12947720289230347, "step": 3090, "valid_targets_mean": 3113.7, "valid_targets_min": 1129 }, { "epoch": 3.1326582278481014, "grad_norm": 0.3034361762747695, "learning_rate": 1.4734944608708022e-05, "loss": 0.2819, "loss_nan_ranks": 0, "loss_rank_avg": 0.1270906925201416, "step": 3095, "valid_targets_mean": 4283.6, "valid_targets_min": 1371 }, { "epoch": 3.137721518987342, "grad_norm": 0.2910061490791564, "learning_rate": 1.4666808944257044e-05, "loss": 0.3011, "loss_nan_ranks": 0, "loss_rank_avg": 0.1065504252910614, "step": 3100, "valid_targets_mean": 4013.8, "valid_targets_min": 1748 }, { "epoch": 3.1427848101265825, "grad_norm": 0.29375562777524983, "learning_rate": 1.459873985118115e-05, "loss": 0.2913, "loss_nan_ranks": 0, "loss_rank_avg": 0.20948265492916107, "step": 3105, "valid_targets_mean": 6254.6, "valid_targets_min": 855 }, { "epoch": 3.1478481012658226, "grad_norm": 0.32610939195307226, "learning_rate": 1.4530738179150445e-05, "loss": 0.3091, "loss_nan_ranks": 0, "loss_rank_avg": 0.16477391123771667, "step": 3110, "valid_targets_mean": 4672.6, "valid_targets_min": 1423 }, { "epoch": 3.152911392405063, "grad_norm": 0.34376610077811187, "learning_rate": 1.44628047769935e-05, "loss": 0.2952, "loss_nan_ranks": 0, "loss_rank_avg": 0.12125621736049652, "step": 3115, "valid_targets_mean": 3024.9, "valid_targets_min": 1154 }, { "epoch": 3.1579746835443037, "grad_norm": 0.24961470242170858, "learning_rate": 1.4394940492686666e-05, "loss": 0.3028, "loss_nan_ranks": 0, "loss_rank_avg": 0.18956081569194794, "step": 3120, "valid_targets_mean": 8850.2, "valid_targets_min": 1106 }, { "epoch": 3.163037974683544, "grad_norm": 0.3213177133533683, "learning_rate": 1.4327146173343561e-05, "loss": 0.3098, "loss_nan_ranks": 0, "loss_rank_avg": 0.16393819451332092, "step": 3125, "valid_targets_mean": 4351.1, "valid_targets_min": 1322 }, { "epoch": 3.1681012658227847, "grad_norm": 0.3207864682050949, "learning_rate": 1.4259422665204458e-05, "loss": 0.3097, "loss_nan_ranks": 0, "loss_rank_avg": 0.19772255420684814, "step": 3130, "valid_targets_mean": 5234.6, "valid_targets_min": 1247 }, { "epoch": 3.1731645569620253, "grad_norm": 0.3306680712851493, "learning_rate": 1.4191770813625732e-05, "loss": 0.3019, "loss_nan_ranks": 0, "loss_rank_avg": 0.1288958340883255, "step": 3135, "valid_targets_mean": 3816.3, "valid_targets_min": 1339 }, { "epoch": 3.178227848101266, "grad_norm": 0.33226796696180216, "learning_rate": 1.4124191463069305e-05, "loss": 0.2918, "loss_nan_ranks": 0, "loss_rank_avg": 0.1820456087589264, "step": 3140, "valid_targets_mean": 4462.9, "valid_targets_min": 1300 }, { "epoch": 3.1832911392405063, "grad_norm": 0.25066525871506057, "learning_rate": 1.4056685457092122e-05, "loss": 0.2981, "loss_nan_ranks": 0, "loss_rank_avg": 0.108408123254776, "step": 3145, "valid_targets_mean": 4348.1, "valid_targets_min": 954 }, { "epoch": 3.188354430379747, "grad_norm": 0.2799683914898738, "learning_rate": 1.3989253638335577e-05, "loss": 0.3048, "loss_nan_ranks": 0, "loss_rank_avg": 0.140926331281662, "step": 3150, "valid_targets_mean": 5334.3, "valid_targets_min": 686 }, { "epoch": 3.1934177215189874, "grad_norm": 0.364904271269176, "learning_rate": 1.3921896848515064e-05, "loss": 0.3009, "loss_nan_ranks": 0, "loss_rank_avg": 0.1611071527004242, "step": 3155, "valid_targets_mean": 3846.9, "valid_targets_min": 1050 }, { "epoch": 3.198481012658228, "grad_norm": 0.31469570152651777, "learning_rate": 1.385461592840939e-05, "loss": 0.2914, "loss_nan_ranks": 0, "loss_rank_avg": 0.16711470484733582, "step": 3160, "valid_targets_mean": 4945.6, "valid_targets_min": 1265 }, { "epoch": 3.2035443037974685, "grad_norm": 0.40871004437684494, "learning_rate": 1.3787411717850358e-05, "loss": 0.2874, "loss_nan_ranks": 0, "loss_rank_avg": 0.14797160029411316, "step": 3165, "valid_targets_mean": 3367.9, "valid_targets_min": 1380 }, { "epoch": 3.208607594936709, "grad_norm": 0.3063676754341602, "learning_rate": 1.3720285055712222e-05, "loss": 0.3, "loss_nan_ranks": 0, "loss_rank_avg": 0.12202514708042145, "step": 3170, "valid_targets_mean": 3846.6, "valid_targets_min": 1062 }, { "epoch": 3.2136708860759495, "grad_norm": 0.33920699542879207, "learning_rate": 1.3653236779901236e-05, "loss": 0.3022, "loss_nan_ranks": 0, "loss_rank_avg": 0.08881708979606628, "step": 3175, "valid_targets_mean": 2589.6, "valid_targets_min": 1310 }, { "epoch": 3.21873417721519, "grad_norm": 0.3118478710909973, "learning_rate": 1.3586267727345232e-05, "loss": 0.3031, "loss_nan_ranks": 0, "loss_rank_avg": 0.13673335313796997, "step": 3180, "valid_targets_mean": 4171.1, "valid_targets_min": 1119 }, { "epoch": 3.22379746835443, "grad_norm": 0.3657648017370462, "learning_rate": 1.35193787339831e-05, "loss": 0.2944, "loss_nan_ranks": 0, "loss_rank_avg": 0.13656803965568542, "step": 3185, "valid_targets_mean": 4186.0, "valid_targets_min": 1616 }, { "epoch": 3.2288607594936707, "grad_norm": 0.29575714520451474, "learning_rate": 1.3452570634754434e-05, "loss": 0.2919, "loss_nan_ranks": 0, "loss_rank_avg": 0.14770013093948364, "step": 3190, "valid_targets_mean": 5272.9, "valid_targets_min": 1046 }, { "epoch": 3.233924050632911, "grad_norm": 0.29496009702650783, "learning_rate": 1.3385844263589033e-05, "loss": 0.2984, "loss_nan_ranks": 0, "loss_rank_avg": 0.17479810118675232, "step": 3195, "valid_targets_mean": 5597.1, "valid_targets_min": 1196 }, { "epoch": 3.2389873417721518, "grad_norm": 0.35581177858551544, "learning_rate": 1.3319200453396548e-05, "loss": 0.294, "loss_nan_ranks": 0, "loss_rank_avg": 0.15500982105731964, "step": 3200, "valid_targets_mean": 4076.4, "valid_targets_min": 1070 }, { "epoch": 3.2440506329113923, "grad_norm": 0.292951167708079, "learning_rate": 1.3252640036056068e-05, "loss": 0.3027, "loss_nan_ranks": 0, "loss_rank_avg": 0.1567637026309967, "step": 3205, "valid_targets_mean": 5367.4, "valid_targets_min": 1424 }, { "epoch": 3.249113924050633, "grad_norm": 0.3182836504556952, "learning_rate": 1.318616384240572e-05, "loss": 0.3043, "loss_nan_ranks": 0, "loss_rank_avg": 0.1862029880285263, "step": 3210, "valid_targets_mean": 5235.2, "valid_targets_min": 1150 }, { "epoch": 3.2541772151898734, "grad_norm": 0.5962356962936214, "learning_rate": 1.3119772702232325e-05, "loss": 0.3019, "loss_nan_ranks": 0, "loss_rank_avg": 0.15173543989658356, "step": 3215, "valid_targets_mean": 3896.9, "valid_targets_min": 1293 }, { "epoch": 3.259240506329114, "grad_norm": 0.30446119131111943, "learning_rate": 1.3053467444261021e-05, "loss": 0.3035, "loss_nan_ranks": 0, "loss_rank_avg": 0.16218072175979614, "step": 3220, "valid_targets_mean": 5058.7, "valid_targets_min": 1443 }, { "epoch": 3.2643037974683544, "grad_norm": 0.30100968288795926, "learning_rate": 1.2987248896144915e-05, "loss": 0.3025, "loss_nan_ranks": 0, "loss_rank_avg": 0.1766858994960785, "step": 3225, "valid_targets_mean": 5638.7, "valid_targets_min": 1494 }, { "epoch": 3.269367088607595, "grad_norm": 0.3043172862585619, "learning_rate": 1.2921117884454784e-05, "loss": 0.3111, "loss_nan_ranks": 0, "loss_rank_avg": 0.13346105813980103, "step": 3230, "valid_targets_mean": 4191.2, "valid_targets_min": 886 }, { "epoch": 3.2744303797468355, "grad_norm": 0.30601688850305675, "learning_rate": 1.2855075234668708e-05, "loss": 0.2969, "loss_nan_ranks": 0, "loss_rank_avg": 0.17442500591278076, "step": 3235, "valid_targets_mean": 5185.5, "valid_targets_min": 1463 }, { "epoch": 3.279493670886076, "grad_norm": 0.32710194023512384, "learning_rate": 1.278912177116182e-05, "loss": 0.2987, "loss_nan_ranks": 0, "loss_rank_avg": 0.18517401814460754, "step": 3240, "valid_targets_mean": 4748.3, "valid_targets_min": 1001 }, { "epoch": 3.2845569620253166, "grad_norm": 0.2832311914633299, "learning_rate": 1.2723258317195965e-05, "loss": 0.3118, "loss_nan_ranks": 0, "loss_rank_avg": 0.1336306631565094, "step": 3245, "valid_targets_mean": 4846.2, "valid_targets_min": 1184 }, { "epoch": 3.289620253164557, "grad_norm": 0.2859981419544709, "learning_rate": 1.2657485694909451e-05, "loss": 0.3031, "loss_nan_ranks": 0, "loss_rank_avg": 0.12190467119216919, "step": 3250, "valid_targets_mean": 4372.2, "valid_targets_min": 1012 }, { "epoch": 3.2946835443037976, "grad_norm": 0.3133461443068576, "learning_rate": 1.2591804725306802e-05, "loss": 0.3056, "loss_nan_ranks": 0, "loss_rank_avg": 0.09984530508518219, "step": 3255, "valid_targets_mean": 3387.1, "valid_targets_min": 1020 }, { "epoch": 3.299746835443038, "grad_norm": 0.3066068642940143, "learning_rate": 1.252621622824846e-05, "loss": 0.3049, "loss_nan_ranks": 0, "loss_rank_avg": 0.10505147278308868, "step": 3260, "valid_targets_mean": 3119.9, "valid_targets_min": 1415 }, { "epoch": 3.3048101265822787, "grad_norm": 0.30638690017522713, "learning_rate": 1.2460721022440617e-05, "loss": 0.3023, "loss_nan_ranks": 0, "loss_rank_avg": 0.1329905241727829, "step": 3265, "valid_targets_mean": 3749.8, "valid_targets_min": 1247 }, { "epoch": 3.309873417721519, "grad_norm": 0.3893581538313894, "learning_rate": 1.2395319925424922e-05, "loss": 0.301, "loss_nan_ranks": 0, "loss_rank_avg": 0.12106384336948395, "step": 3270, "valid_targets_mean": 3750.2, "valid_targets_min": 1170 }, { "epoch": 3.3149367088607593, "grad_norm": 0.2915580190067732, "learning_rate": 1.2330013753568345e-05, "loss": 0.3046, "loss_nan_ranks": 0, "loss_rank_avg": 0.15587478876113892, "step": 3275, "valid_targets_mean": 5153.9, "valid_targets_min": 884 }, { "epoch": 3.32, "grad_norm": 0.32454051814127005, "learning_rate": 1.2264803322052938e-05, "loss": 0.2902, "loss_nan_ranks": 0, "loss_rank_avg": 0.14347532391548157, "step": 3280, "valid_targets_mean": 3715.8, "valid_targets_min": 1109 }, { "epoch": 3.3250632911392404, "grad_norm": 0.3014718100183408, "learning_rate": 1.2199689444865688e-05, "loss": 0.2952, "loss_nan_ranks": 0, "loss_rank_avg": 0.11024832725524902, "step": 3285, "valid_targets_mean": 3356.6, "valid_targets_min": 1346 }, { "epoch": 3.330126582278481, "grad_norm": 0.3180605843827969, "learning_rate": 1.2134672934788338e-05, "loss": 0.2996, "loss_nan_ranks": 0, "loss_rank_avg": 0.1348501592874527, "step": 3290, "valid_targets_mean": 4180.2, "valid_targets_min": 1405 }, { "epoch": 3.3351898734177214, "grad_norm": 0.31070898369108957, "learning_rate": 1.206975460338726e-05, "loss": 0.2962, "loss_nan_ranks": 0, "loss_rank_avg": 0.14836883544921875, "step": 3295, "valid_targets_mean": 4112.2, "valid_targets_min": 1401 }, { "epoch": 3.340253164556962, "grad_norm": 0.28528395978629406, "learning_rate": 1.2004935261003292e-05, "loss": 0.3012, "loss_nan_ranks": 0, "loss_rank_avg": 0.11711958050727844, "step": 3300, "valid_targets_mean": 5100.1, "valid_targets_min": 1029 }, { "epoch": 3.3453164556962025, "grad_norm": 0.3708665183674031, "learning_rate": 1.194021571674168e-05, "loss": 0.2891, "loss_nan_ranks": 0, "loss_rank_avg": 0.13884302973747253, "step": 3305, "valid_targets_mean": 4049.6, "valid_targets_min": 974 }, { "epoch": 3.350379746835443, "grad_norm": 0.3298858637588618, "learning_rate": 1.1875596778461903e-05, "loss": 0.2893, "loss_nan_ranks": 0, "loss_rank_avg": 0.1451665610074997, "step": 3310, "valid_targets_mean": 4987.6, "valid_targets_min": 1624 }, { "epoch": 3.3554430379746836, "grad_norm": 0.30292570807469854, "learning_rate": 1.1811079252767663e-05, "loss": 0.2858, "loss_nan_ranks": 0, "loss_rank_avg": 0.12376505136489868, "step": 3315, "valid_targets_mean": 3583.1, "valid_targets_min": 1257 }, { "epoch": 3.360506329113924, "grad_norm": 0.32294869729997133, "learning_rate": 1.174666394499677e-05, "loss": 0.2914, "loss_nan_ranks": 0, "loss_rank_avg": 0.11844268441200256, "step": 3320, "valid_targets_mean": 3262.4, "valid_targets_min": 1554 }, { "epoch": 3.3655696202531646, "grad_norm": 0.3438389100269291, "learning_rate": 1.1682351659211088e-05, "loss": 0.2965, "loss_nan_ranks": 0, "loss_rank_avg": 0.1457480937242508, "step": 3325, "valid_targets_mean": 3745.7, "valid_targets_min": 1190 }, { "epoch": 3.370632911392405, "grad_norm": 0.33249792748827744, "learning_rate": 1.1618143198186544e-05, "loss": 0.2956, "loss_nan_ranks": 0, "loss_rank_avg": 0.15856462717056274, "step": 3330, "valid_targets_mean": 4305.5, "valid_targets_min": 910 }, { "epoch": 3.3756962025316457, "grad_norm": 0.3173034049275177, "learning_rate": 1.155403936340304e-05, "loss": 0.2947, "loss_nan_ranks": 0, "loss_rank_avg": 0.18826264142990112, "step": 3335, "valid_targets_mean": 5404.1, "valid_targets_min": 1023 }, { "epoch": 3.3807594936708862, "grad_norm": 0.3178276101310362, "learning_rate": 1.149004095503452e-05, "loss": 0.297, "loss_nan_ranks": 0, "loss_rank_avg": 0.15395784378051758, "step": 3340, "valid_targets_mean": 5008.1, "valid_targets_min": 1032 }, { "epoch": 3.3858227848101268, "grad_norm": 0.3025604254884791, "learning_rate": 1.1426148771938915e-05, "loss": 0.3065, "loss_nan_ranks": 0, "loss_rank_avg": 0.1488351970911026, "step": 3345, "valid_targets_mean": 4703.1, "valid_targets_min": 1506 }, { "epoch": 3.390886075949367, "grad_norm": 0.3037731465395097, "learning_rate": 1.1362363611648228e-05, "loss": 0.3069, "loss_nan_ranks": 0, "loss_rank_avg": 0.11465154588222504, "step": 3350, "valid_targets_mean": 3727.4, "valid_targets_min": 921 }, { "epoch": 3.3959493670886074, "grad_norm": 0.3441348411116797, "learning_rate": 1.1298686270358542e-05, "loss": 0.301, "loss_nan_ranks": 0, "loss_rank_avg": 0.17264041304588318, "step": 3355, "valid_targets_mean": 3737.4, "valid_targets_min": 1599 }, { "epoch": 3.401012658227848, "grad_norm": 0.2922925569041438, "learning_rate": 1.1235117542920077e-05, "loss": 0.2984, "loss_nan_ranks": 0, "loss_rank_avg": 0.11297699809074402, "step": 3360, "valid_targets_mean": 4023.7, "valid_targets_min": 1052 }, { "epoch": 3.4060759493670885, "grad_norm": 0.3304527382358981, "learning_rate": 1.1171658222827321e-05, "loss": 0.308, "loss_nan_ranks": 0, "loss_rank_avg": 0.21652498841285706, "step": 3365, "valid_targets_mean": 5499.5, "valid_targets_min": 949 }, { "epoch": 3.411139240506329, "grad_norm": 0.34098724945316766, "learning_rate": 1.110830910220905e-05, "loss": 0.3065, "loss_nan_ranks": 0, "loss_rank_avg": 0.17756357789039612, "step": 3370, "valid_targets_mean": 3859.3, "valid_targets_min": 961 }, { "epoch": 3.4162025316455695, "grad_norm": 0.29556792434414897, "learning_rate": 1.1045070971818515e-05, "loss": 0.2959, "loss_nan_ranks": 0, "loss_rank_avg": 0.130351722240448, "step": 3375, "valid_targets_mean": 3860.4, "valid_targets_min": 1126 }, { "epoch": 3.42126582278481, "grad_norm": 0.2817393837564735, "learning_rate": 1.0981944621023508e-05, "loss": 0.2989, "loss_nan_ranks": 0, "loss_rank_avg": 0.172260582447052, "step": 3380, "valid_targets_mean": 6195.1, "valid_targets_min": 1065 }, { "epoch": 3.4263291139240506, "grad_norm": 0.3019678707113778, "learning_rate": 1.0918930837796538e-05, "loss": 0.2909, "loss_nan_ranks": 0, "loss_rank_avg": 0.14187800884246826, "step": 3385, "valid_targets_mean": 4729.5, "valid_targets_min": 1024 }, { "epoch": 3.431392405063291, "grad_norm": 0.32014190449807, "learning_rate": 1.0856030408705016e-05, "loss": 0.3174, "loss_nan_ranks": 0, "loss_rank_avg": 0.15517304837703705, "step": 3390, "valid_targets_mean": 4351.6, "valid_targets_min": 1381 }, { "epoch": 3.4364556962025317, "grad_norm": 0.28577315150998106, "learning_rate": 1.0793244118901383e-05, "loss": 0.3001, "loss_nan_ranks": 0, "loss_rank_avg": 0.16560965776443481, "step": 3395, "valid_targets_mean": 5708.4, "valid_targets_min": 1323 }, { "epoch": 3.441518987341772, "grad_norm": 0.2895330117490245, "learning_rate": 1.0730572752113368e-05, "loss": 0.3004, "loss_nan_ranks": 0, "loss_rank_avg": 0.16116517782211304, "step": 3400, "valid_targets_mean": 6122.2, "valid_targets_min": 1191 }, { "epoch": 3.4465822784810127, "grad_norm": 0.3276147158732667, "learning_rate": 1.0668017090634164e-05, "loss": 0.2912, "loss_nan_ranks": 0, "loss_rank_avg": 0.1463163197040558, "step": 3405, "valid_targets_mean": 3868.4, "valid_targets_min": 1560 }, { "epoch": 3.4516455696202533, "grad_norm": 0.27522935687650096, "learning_rate": 1.0605577915312662e-05, "loss": 0.2973, "loss_nan_ranks": 0, "loss_rank_avg": 0.14057275652885437, "step": 3410, "valid_targets_mean": 5501.4, "valid_targets_min": 1198 }, { "epoch": 3.456708860759494, "grad_norm": 0.2546793488548092, "learning_rate": 1.0543256005543752e-05, "loss": 0.2931, "loss_nan_ranks": 0, "loss_rank_avg": 0.17178791761398315, "step": 3415, "valid_targets_mean": 6257.9, "valid_targets_min": 1159 }, { "epoch": 3.4617721518987343, "grad_norm": 0.2887049078859965, "learning_rate": 1.048105213925853e-05, "loss": 0.3008, "loss_nan_ranks": 0, "loss_rank_avg": 0.15336082875728607, "step": 3420, "valid_targets_mean": 5676.3, "valid_targets_min": 1581 }, { "epoch": 3.466835443037975, "grad_norm": 0.3248981947583244, "learning_rate": 1.0418967092914643e-05, "loss": 0.296, "loss_nan_ranks": 0, "loss_rank_avg": 0.12593376636505127, "step": 3425, "valid_targets_mean": 3572.3, "valid_targets_min": 1200 }, { "epoch": 3.4718987341772154, "grad_norm": 0.33097897236242024, "learning_rate": 1.0357001641486556e-05, "loss": 0.2969, "loss_nan_ranks": 0, "loss_rank_avg": 0.16061154007911682, "step": 3430, "valid_targets_mean": 6276.2, "valid_targets_min": 1499 }, { "epoch": 3.476962025316456, "grad_norm": 0.29614677485829893, "learning_rate": 1.0295156558455885e-05, "loss": 0.3058, "loss_nan_ranks": 0, "loss_rank_avg": 0.1872052550315857, "step": 3435, "valid_targets_mean": 6640.8, "valid_targets_min": 1160 }, { "epoch": 3.482025316455696, "grad_norm": 0.27705637796463173, "learning_rate": 1.0233432615801786e-05, "loss": 0.2938, "loss_nan_ranks": 0, "loss_rank_avg": 0.14229699969291687, "step": 3440, "valid_targets_mean": 5945.9, "valid_targets_min": 1284 }, { "epoch": 3.4870886075949366, "grad_norm": 0.26237225876364956, "learning_rate": 1.0171830583991245e-05, "loss": 0.3011, "loss_nan_ranks": 0, "loss_rank_avg": 0.17002148926258087, "step": 3445, "valid_targets_mean": 6348.2, "valid_targets_min": 1431 }, { "epoch": 3.492151898734177, "grad_norm": 0.33818695188520737, "learning_rate": 1.0110351231969532e-05, "loss": 0.2999, "loss_nan_ranks": 0, "loss_rank_avg": 0.19817857444286346, "step": 3450, "valid_targets_mean": 4845.8, "valid_targets_min": 1227 }, { "epoch": 3.4972151898734176, "grad_norm": 0.27766136414994197, "learning_rate": 1.0048995327150556e-05, "loss": 0.2994, "loss_nan_ranks": 0, "loss_rank_avg": 0.17715927958488464, "step": 3455, "valid_targets_mean": 6080.2, "valid_targets_min": 1024 }, { "epoch": 3.502278481012658, "grad_norm": 0.3385690737736752, "learning_rate": 9.987763635407293e-06, "loss": 0.2976, "loss_nan_ranks": 0, "loss_rank_avg": 0.18266132473945618, "step": 3460, "valid_targets_mean": 4562.4, "valid_targets_min": 1570 }, { "epoch": 3.5073417721518987, "grad_norm": 0.35240157099060987, "learning_rate": 9.926656921062254e-06, "loss": 0.3082, "loss_nan_ranks": 0, "loss_rank_avg": 0.18275323510169983, "step": 3465, "valid_targets_mean": 4161.0, "valid_targets_min": 1086 }, { "epoch": 3.512405063291139, "grad_norm": 0.37082127798975295, "learning_rate": 9.865675946877897e-06, "loss": 0.2964, "loss_nan_ranks": 0, "loss_rank_avg": 0.137416809797287, "step": 3470, "valid_targets_mean": 3108.2, "valid_targets_min": 1222 }, { "epoch": 3.5174683544303798, "grad_norm": 0.32990352870182205, "learning_rate": 9.804821474047166e-06, "loss": 0.3071, "loss_nan_ranks": 0, "loss_rank_avg": 0.13373905420303345, "step": 3475, "valid_targets_mean": 3385.4, "valid_targets_min": 1094 }, { "epoch": 3.5225316455696203, "grad_norm": 0.3159470821550788, "learning_rate": 9.744094262183922e-06, "loss": 0.2957, "loss_nan_ranks": 0, "loss_rank_avg": 0.1414027214050293, "step": 3480, "valid_targets_mean": 3928.0, "valid_targets_min": 1133 }, { "epoch": 3.527594936708861, "grad_norm": 0.2903957000330617, "learning_rate": 9.683495069313527e-06, "loss": 0.3091, "loss_nan_ranks": 0, "loss_rank_avg": 0.1404920518398285, "step": 3485, "valid_targets_mean": 4963.7, "valid_targets_min": 1699 }, { "epoch": 3.5326582278481014, "grad_norm": 0.28971614608089746, "learning_rate": 9.623024651863317e-06, "loss": 0.2979, "loss_nan_ranks": 0, "loss_rank_avg": 0.12896308302879333, "step": 3490, "valid_targets_mean": 4057.2, "valid_targets_min": 1028 }, { "epoch": 3.537721518987342, "grad_norm": 0.32570265544900434, "learning_rate": 9.56268376465323e-06, "loss": 0.2962, "loss_nan_ranks": 0, "loss_rank_avg": 0.14747750759124756, "step": 3495, "valid_targets_mean": 3836.9, "valid_targets_min": 858 }, { "epoch": 3.5427848101265824, "grad_norm": 0.3186509490983858, "learning_rate": 9.502473160886309e-06, "loss": 0.3055, "loss_nan_ranks": 0, "loss_rank_avg": 0.13043725490570068, "step": 3500, "valid_targets_mean": 3738.1, "valid_targets_min": 908 }, { "epoch": 3.547848101265823, "grad_norm": 0.2738590358023834, "learning_rate": 9.442393592139378e-06, "loss": 0.31, "loss_nan_ranks": 0, "loss_rank_avg": 0.14587613940238953, "step": 3505, "valid_targets_mean": 4865.2, "valid_targets_min": 1410 }, { "epoch": 3.552911392405063, "grad_norm": 0.3247037129452682, "learning_rate": 9.382445808353582e-06, "loss": 0.2935, "loss_nan_ranks": 0, "loss_rank_avg": 0.1686377227306366, "step": 3510, "valid_targets_mean": 4436.3, "valid_targets_min": 1010 }, { "epoch": 3.5579746835443036, "grad_norm": 0.3180620836755935, "learning_rate": 9.322630557825099e-06, "loss": 0.2905, "loss_nan_ranks": 0, "loss_rank_avg": 0.181858628988266, "step": 3515, "valid_targets_mean": 5233.6, "valid_targets_min": 1452 }, { "epoch": 3.563037974683544, "grad_norm": 0.389889167724953, "learning_rate": 9.262948587195733e-06, "loss": 0.3152, "loss_nan_ranks": 0, "loss_rank_avg": 0.15717878937721252, "step": 3520, "valid_targets_mean": 3013.9, "valid_targets_min": 1243 }, { "epoch": 3.5681012658227846, "grad_norm": 0.29747778586225904, "learning_rate": 9.203400641443659e-06, "loss": 0.2996, "loss_nan_ranks": 0, "loss_rank_avg": 0.1657101958990097, "step": 3525, "valid_targets_mean": 5011.9, "valid_targets_min": 1171 }, { "epoch": 3.573164556962025, "grad_norm": 0.32589494828857773, "learning_rate": 9.143987463874067e-06, "loss": 0.3156, "loss_nan_ranks": 0, "loss_rank_avg": 0.1313675493001938, "step": 3530, "valid_targets_mean": 3697.8, "valid_targets_min": 1024 }, { "epoch": 3.5782278481012657, "grad_norm": 0.3014059728019354, "learning_rate": 9.084709796109907e-06, "loss": 0.2868, "loss_nan_ranks": 0, "loss_rank_avg": 0.1120418906211853, "step": 3535, "valid_targets_mean": 3755.7, "valid_targets_min": 1198 }, { "epoch": 3.5832911392405062, "grad_norm": 0.2948674668221632, "learning_rate": 9.025568378082656e-06, "loss": 0.3131, "loss_nan_ranks": 0, "loss_rank_avg": 0.2535429894924164, "step": 3540, "valid_targets_mean": 5356.3, "valid_targets_min": 1015 }, { "epoch": 3.5883544303797468, "grad_norm": 0.33956864916271323, "learning_rate": 8.96656394802303e-06, "loss": 0.3003, "loss_nan_ranks": 0, "loss_rank_avg": 0.18608632683753967, "step": 3545, "valid_targets_mean": 4867.1, "valid_targets_min": 1215 }, { "epoch": 3.5934177215189873, "grad_norm": 0.2894977962731721, "learning_rate": 8.907697242451825e-06, "loss": 0.3074, "loss_nan_ranks": 0, "loss_rank_avg": 0.1488334834575653, "step": 3550, "valid_targets_mean": 4891.0, "valid_targets_min": 1716 }, { "epoch": 3.598481012658228, "grad_norm": 0.3343791939565901, "learning_rate": 8.84896899617067e-06, "loss": 0.2944, "loss_nan_ranks": 0, "loss_rank_avg": 0.141134113073349, "step": 3555, "valid_targets_mean": 3341.7, "valid_targets_min": 890 }, { "epoch": 3.6035443037974684, "grad_norm": 0.33452158631970796, "learning_rate": 8.790379942252888e-06, "loss": 0.3019, "loss_nan_ranks": 0, "loss_rank_avg": 0.10691896080970764, "step": 3560, "valid_targets_mean": 2877.1, "valid_targets_min": 1216 }, { "epoch": 3.608607594936709, "grad_norm": 0.36142037308609365, "learning_rate": 8.73193081203436e-06, "loss": 0.2975, "loss_nan_ranks": 0, "loss_rank_avg": 0.11998053640127182, "step": 3565, "valid_targets_mean": 2745.8, "valid_targets_min": 1146 }, { "epoch": 3.6136708860759494, "grad_norm": 0.29136587900708333, "learning_rate": 8.673622335104335e-06, "loss": 0.3143, "loss_nan_ranks": 0, "loss_rank_avg": 0.1345549076795578, "step": 3570, "valid_targets_mean": 4353.7, "valid_targets_min": 1408 }, { "epoch": 3.61873417721519, "grad_norm": 0.3065976409246481, "learning_rate": 8.6154552392964e-06, "loss": 0.3027, "loss_nan_ranks": 0, "loss_rank_avg": 0.10774962604045868, "step": 3575, "valid_targets_mean": 3904.3, "valid_targets_min": 1176 }, { "epoch": 3.6237974683544305, "grad_norm": 0.31612983755964325, "learning_rate": 8.557430250679329e-06, "loss": 0.302, "loss_nan_ranks": 0, "loss_rank_avg": 0.13469217717647552, "step": 3580, "valid_targets_mean": 3963.2, "valid_targets_min": 1302 }, { "epoch": 3.628860759493671, "grad_norm": 0.355565500659515, "learning_rate": 8.499548093548069e-06, "loss": 0.2915, "loss_nan_ranks": 0, "loss_rank_avg": 0.1492483913898468, "step": 3585, "valid_targets_mean": 3815.0, "valid_targets_min": 998 }, { "epoch": 3.6339240506329116, "grad_norm": 0.3209640823808966, "learning_rate": 8.441809490414664e-06, "loss": 0.2943, "loss_nan_ranks": 0, "loss_rank_avg": 0.10731847584247589, "step": 3590, "valid_targets_mean": 3390.2, "valid_targets_min": 1205 }, { "epoch": 3.638987341772152, "grad_norm": 0.3111850353285487, "learning_rate": 8.384215161999245e-06, "loss": 0.2928, "loss_nan_ranks": 0, "loss_rank_avg": 0.12559540569782257, "step": 3595, "valid_targets_mean": 3864.8, "valid_targets_min": 1279 }, { "epoch": 3.6440506329113926, "grad_norm": 0.3021980554963678, "learning_rate": 8.326765827221066e-06, "loss": 0.3006, "loss_nan_ranks": 0, "loss_rank_avg": 0.16643747687339783, "step": 3600, "valid_targets_mean": 4737.3, "valid_targets_min": 980 }, { "epoch": 3.649113924050633, "grad_norm": 0.3299126612802994, "learning_rate": 8.269462203189467e-06, "loss": 0.3031, "loss_nan_ranks": 0, "loss_rank_avg": 0.1495143473148346, "step": 3605, "valid_targets_mean": 4373.2, "valid_targets_min": 1652 }, { "epoch": 3.6541772151898733, "grad_norm": 0.3046029741964782, "learning_rate": 8.212305005194992e-06, "loss": 0.2926, "loss_nan_ranks": 0, "loss_rank_avg": 0.12610015273094177, "step": 3610, "valid_targets_mean": 4068.0, "valid_targets_min": 990 }, { "epoch": 3.659240506329114, "grad_norm": 0.2889811661916004, "learning_rate": 8.155294946700402e-06, "loss": 0.2938, "loss_nan_ranks": 0, "loss_rank_avg": 0.14253506064414978, "step": 3615, "valid_targets_mean": 4970.4, "valid_targets_min": 1268 }, { "epoch": 3.6643037974683543, "grad_norm": 0.3058585932521842, "learning_rate": 8.098432739331803e-06, "loss": 0.2822, "loss_nan_ranks": 0, "loss_rank_avg": 0.14140847325325012, "step": 3620, "valid_targets_mean": 4990.8, "valid_targets_min": 1162 }, { "epoch": 3.669367088607595, "grad_norm": 0.3078512961350209, "learning_rate": 8.041719092869761e-06, "loss": 0.3031, "loss_nan_ranks": 0, "loss_rank_avg": 0.13041014969348907, "step": 3625, "valid_targets_mean": 4127.6, "valid_targets_min": 1226 }, { "epoch": 3.6744303797468354, "grad_norm": 0.2557971332829355, "learning_rate": 7.98515471524042e-06, "loss": 0.3067, "loss_nan_ranks": 0, "loss_rank_avg": 0.13294486701488495, "step": 3630, "valid_targets_mean": 5826.9, "valid_targets_min": 1621 }, { "epoch": 3.679493670886076, "grad_norm": 0.3421960754823531, "learning_rate": 7.928740312506704e-06, "loss": 0.3055, "loss_nan_ranks": 0, "loss_rank_avg": 0.11804340779781342, "step": 3635, "valid_targets_mean": 3220.9, "valid_targets_min": 1529 }, { "epoch": 3.6845569620253165, "grad_norm": 0.30370702242210657, "learning_rate": 7.87247658885946e-06, "loss": 0.2923, "loss_nan_ranks": 0, "loss_rank_avg": 0.1813192367553711, "step": 3640, "valid_targets_mean": 5260.7, "valid_targets_min": 1428 }, { "epoch": 3.689620253164557, "grad_norm": 0.3275936364034654, "learning_rate": 7.816364246608688e-06, "loss": 0.303, "loss_nan_ranks": 0, "loss_rank_avg": 0.16349400579929352, "step": 3645, "valid_targets_mean": 4485.0, "valid_targets_min": 891 }, { "epoch": 3.6946835443037975, "grad_norm": 0.36264702848645247, "learning_rate": 7.760403986174796e-06, "loss": 0.3064, "loss_nan_ranks": 0, "loss_rank_avg": 0.13801871240139008, "step": 3650, "valid_targets_mean": 3051.1, "valid_targets_min": 1057 }, { "epoch": 3.699746835443038, "grad_norm": 0.2776099144093922, "learning_rate": 7.70459650607981e-06, "loss": 0.3086, "loss_nan_ranks": 0, "loss_rank_avg": 0.1680225133895874, "step": 3655, "valid_targets_mean": 6631.8, "valid_targets_min": 1456 }, { "epoch": 3.7048101265822786, "grad_norm": 0.34172337758905963, "learning_rate": 7.648942502938705e-06, "loss": 0.3048, "loss_nan_ranks": 0, "loss_rank_avg": 0.16763363778591156, "step": 3660, "valid_targets_mean": 4061.8, "valid_targets_min": 1209 }, { "epoch": 3.709873417721519, "grad_norm": 0.31939393718066644, "learning_rate": 7.593442671450666e-06, "loss": 0.2965, "loss_nan_ranks": 0, "loss_rank_avg": 0.17321282625198364, "step": 3665, "valid_targets_mean": 4894.1, "valid_targets_min": 1043 }, { "epoch": 3.714936708860759, "grad_norm": 0.32132553979600637, "learning_rate": 7.5380977043904365e-06, "loss": 0.2952, "loss_nan_ranks": 0, "loss_rank_avg": 0.16710880398750305, "step": 3670, "valid_targets_mean": 4925.1, "valid_targets_min": 1393 }, { "epoch": 3.7199999999999998, "grad_norm": 0.32445408393836617, "learning_rate": 7.482908292599689e-06, "loss": 0.3039, "loss_nan_ranks": 0, "loss_rank_avg": 0.12341426312923431, "step": 3675, "valid_targets_mean": 3606.6, "valid_targets_min": 1214 }, { "epoch": 3.7250632911392403, "grad_norm": 0.3064797642539383, "learning_rate": 7.427875124978359e-06, "loss": 0.2968, "loss_nan_ranks": 0, "loss_rank_avg": 0.1298845112323761, "step": 3680, "valid_targets_mean": 4494.2, "valid_targets_min": 1211 }, { "epoch": 3.730126582278481, "grad_norm": 0.2891043975748266, "learning_rate": 7.372998888476091e-06, "loss": 0.307, "loss_nan_ranks": 0, "loss_rank_avg": 0.14520198106765747, "step": 3685, "valid_targets_mean": 4642.1, "valid_targets_min": 1350 }, { "epoch": 3.7351898734177214, "grad_norm": 0.2986519000501888, "learning_rate": 7.318280268083624e-06, "loss": 0.3026, "loss_nan_ranks": 0, "loss_rank_avg": 0.19568581879138947, "step": 3690, "valid_targets_mean": 5491.8, "valid_targets_min": 1141 }, { "epoch": 3.740253164556962, "grad_norm": 0.32054148131031535, "learning_rate": 7.263719946824264e-06, "loss": 0.3001, "loss_nan_ranks": 0, "loss_rank_avg": 0.12194908410310745, "step": 3695, "valid_targets_mean": 3993.2, "valid_targets_min": 1248 }, { "epoch": 3.7453164556962024, "grad_norm": 0.29536657640379355, "learning_rate": 7.209318605745368e-06, "loss": 0.2952, "loss_nan_ranks": 0, "loss_rank_avg": 0.14819620549678802, "step": 3700, "valid_targets_mean": 4433.9, "valid_targets_min": 1426 }, { "epoch": 3.750379746835443, "grad_norm": 0.28146869288224746, "learning_rate": 7.1550769239098e-06, "loss": 0.2973, "loss_nan_ranks": 0, "loss_rank_avg": 0.18099471926689148, "step": 3705, "valid_targets_mean": 7152.2, "valid_targets_min": 1449 }, { "epoch": 3.7554430379746835, "grad_norm": 0.31596675118829165, "learning_rate": 7.100995578387519e-06, "loss": 0.2938, "loss_nan_ranks": 0, "loss_rank_avg": 0.13141889870166779, "step": 3710, "valid_targets_mean": 3884.0, "valid_targets_min": 1459 }, { "epoch": 3.760506329113924, "grad_norm": 0.31422332389376245, "learning_rate": 7.047075244247061e-06, "loss": 0.3058, "loss_nan_ranks": 0, "loss_rank_avg": 0.1718595027923584, "step": 3715, "valid_targets_mean": 4909.5, "valid_targets_min": 1774 }, { "epoch": 3.7655696202531646, "grad_norm": 0.3058451914869696, "learning_rate": 6.993316594547148e-06, "loss": 0.3043, "loss_nan_ranks": 0, "loss_rank_avg": 0.12041142582893372, "step": 3720, "valid_targets_mean": 3857.4, "valid_targets_min": 1341 }, { "epoch": 3.770632911392405, "grad_norm": 0.3285101705687896, "learning_rate": 6.939720300328303e-06, "loss": 0.3109, "loss_nan_ranks": 0, "loss_rank_avg": 0.15424466133117676, "step": 3725, "valid_targets_mean": 4029.8, "valid_targets_min": 1388 }, { "epoch": 3.7756962025316456, "grad_norm": 0.2852711508998474, "learning_rate": 6.886287030604422e-06, "loss": 0.2974, "loss_nan_ranks": 0, "loss_rank_avg": 0.15062718093395233, "step": 3730, "valid_targets_mean": 5311.7, "valid_targets_min": 1383 }, { "epoch": 3.780759493670886, "grad_norm": 0.32830150851392953, "learning_rate": 6.83301745235448e-06, "loss": 0.3073, "loss_nan_ranks": 0, "loss_rank_avg": 0.1865895390510559, "step": 3735, "valid_targets_mean": 4781.8, "valid_targets_min": 1034 }, { "epoch": 3.7858227848101267, "grad_norm": 0.33756549066729197, "learning_rate": 6.779912230514161e-06, "loss": 0.2807, "loss_nan_ranks": 0, "loss_rank_avg": 0.12055318802595139, "step": 3740, "valid_targets_mean": 3463.3, "valid_targets_min": 1599 }, { "epoch": 3.790886075949367, "grad_norm": 0.3152172059583756, "learning_rate": 6.7269720279675755e-06, "loss": 0.3027, "loss_nan_ranks": 0, "loss_rank_avg": 0.17137764394283295, "step": 3745, "valid_targets_mean": 4888.2, "valid_targets_min": 1432 }, { "epoch": 3.7959493670886078, "grad_norm": 0.3239318373383687, "learning_rate": 6.674197505539006e-06, "loss": 0.3045, "loss_nan_ranks": 0, "loss_rank_avg": 0.14893168210983276, "step": 3750, "valid_targets_mean": 4158.4, "valid_targets_min": 1285 }, { "epoch": 3.8010126582278483, "grad_norm": 0.2919220688770005, "learning_rate": 6.621589321984611e-06, "loss": 0.2953, "loss_nan_ranks": 0, "loss_rank_avg": 0.14690950512886047, "step": 3755, "valid_targets_mean": 4748.6, "valid_targets_min": 1607 }, { "epoch": 3.806075949367089, "grad_norm": 0.3025582373018823, "learning_rate": 6.569148133984258e-06, "loss": 0.2936, "loss_nan_ranks": 0, "loss_rank_avg": 0.17515698075294495, "step": 3760, "valid_targets_mean": 5047.3, "valid_targets_min": 1082 }, { "epoch": 3.8111392405063294, "grad_norm": 0.2952019372668243, "learning_rate": 6.516874596133269e-06, "loss": 0.2869, "loss_nan_ranks": 0, "loss_rank_avg": 0.15086880326271057, "step": 3765, "valid_targets_mean": 5131.5, "valid_targets_min": 1253 }, { "epoch": 3.81620253164557, "grad_norm": 0.29724809214492576, "learning_rate": 6.464769360934306e-06, "loss": 0.2927, "loss_nan_ranks": 0, "loss_rank_avg": 0.19773977994918823, "step": 3770, "valid_targets_mean": 6146.5, "valid_targets_min": 1366 }, { "epoch": 3.82126582278481, "grad_norm": 0.33270725662814826, "learning_rate": 6.412833078789178e-06, "loss": 0.3024, "loss_nan_ranks": 0, "loss_rank_avg": 0.15699324011802673, "step": 3775, "valid_targets_mean": 4472.4, "valid_targets_min": 1350 }, { "epoch": 3.8263291139240505, "grad_norm": 0.2963372278675901, "learning_rate": 6.361066397990758e-06, "loss": 0.2956, "loss_nan_ranks": 0, "loss_rank_avg": 0.1388930231332779, "step": 3780, "valid_targets_mean": 4676.4, "valid_targets_min": 971 }, { "epoch": 3.831392405063291, "grad_norm": 0.2786191474125972, "learning_rate": 6.309469964714863e-06, "loss": 0.298, "loss_nan_ranks": 0, "loss_rank_avg": 0.14243824779987335, "step": 3785, "valid_targets_mean": 4964.9, "valid_targets_min": 1391 }, { "epoch": 3.8364556962025316, "grad_norm": 0.3057769621782611, "learning_rate": 6.2580444230122175e-06, "loss": 0.2824, "loss_nan_ranks": 0, "loss_rank_avg": 0.1198386549949646, "step": 3790, "valid_targets_mean": 3840.2, "valid_targets_min": 745 }, { "epoch": 3.841518987341772, "grad_norm": 0.31205008704708975, "learning_rate": 6.2067904148003764e-06, "loss": 0.3096, "loss_nan_ranks": 0, "loss_rank_avg": 0.17915937304496765, "step": 3795, "valid_targets_mean": 5550.8, "valid_targets_min": 1392 }, { "epoch": 3.8465822784810126, "grad_norm": 0.3072712018089592, "learning_rate": 6.155708579855759e-06, "loss": 0.3163, "loss_nan_ranks": 0, "loss_rank_avg": 0.15422801673412323, "step": 3800, "valid_targets_mean": 4714.1, "valid_targets_min": 970 }, { "epoch": 3.851645569620253, "grad_norm": 0.3056625890719376, "learning_rate": 6.104799555805607e-06, "loss": 0.2963, "loss_nan_ranks": 0, "loss_rank_avg": 0.10852354019880295, "step": 3805, "valid_targets_mean": 3481.8, "valid_targets_min": 1001 }, { "epoch": 3.8567088607594937, "grad_norm": 0.33415927615785906, "learning_rate": 6.054063978120093e-06, "loss": 0.3035, "loss_nan_ranks": 0, "loss_rank_avg": 0.16793662309646606, "step": 3810, "valid_targets_mean": 3962.6, "valid_targets_min": 1458 }, { "epoch": 3.8617721518987342, "grad_norm": 0.2859437483451691, "learning_rate": 6.00350248010431e-06, "loss": 0.2964, "loss_nan_ranks": 0, "loss_rank_avg": 0.11396883428096771, "step": 3815, "valid_targets_mean": 4421.5, "valid_targets_min": 1527 }, { "epoch": 3.8668354430379748, "grad_norm": 0.32446773366076725, "learning_rate": 5.95311569289045e-06, "loss": 0.2976, "loss_nan_ranks": 0, "loss_rank_avg": 0.14191418886184692, "step": 3820, "valid_targets_mean": 3904.6, "valid_targets_min": 1346 }, { "epoch": 3.8718987341772153, "grad_norm": 0.33241644171629736, "learning_rate": 5.902904245429852e-06, "loss": 0.3066, "loss_nan_ranks": 0, "loss_rank_avg": 0.15994411706924438, "step": 3825, "valid_targets_mean": 4205.2, "valid_targets_min": 1211 }, { "epoch": 3.876962025316456, "grad_norm": 0.33295558620330956, "learning_rate": 5.852868764485185e-06, "loss": 0.2951, "loss_nan_ranks": 0, "loss_rank_avg": 0.11764267832040787, "step": 3830, "valid_targets_mean": 3148.9, "valid_targets_min": 992 }, { "epoch": 3.882025316455696, "grad_norm": 0.3094377142586556, "learning_rate": 5.803009874622645e-06, "loss": 0.3014, "loss_nan_ranks": 0, "loss_rank_avg": 0.13288931548595428, "step": 3835, "valid_targets_mean": 3723.9, "valid_targets_min": 1009 }, { "epoch": 3.8870886075949365, "grad_norm": 0.28966742570043214, "learning_rate": 5.753328198204107e-06, "loss": 0.2827, "loss_nan_ranks": 0, "loss_rank_avg": 0.14470314979553223, "step": 3840, "valid_targets_mean": 5011.6, "valid_targets_min": 1536 }, { "epoch": 3.892151898734177, "grad_norm": 0.3556764011843303, "learning_rate": 5.7038243553794105e-06, "loss": 0.3098, "loss_nan_ranks": 0, "loss_rank_avg": 0.15663528442382812, "step": 3845, "valid_targets_mean": 3704.3, "valid_targets_min": 938 }, { "epoch": 3.8972151898734175, "grad_norm": 0.4434641609697601, "learning_rate": 5.654498964078578e-06, "loss": 0.3071, "loss_nan_ranks": 0, "loss_rank_avg": 0.15775218605995178, "step": 3850, "valid_targets_mean": 5224.2, "valid_targets_min": 1008 }, { "epoch": 3.902278481012658, "grad_norm": 0.28354591909624743, "learning_rate": 5.605352640004111e-06, "loss": 0.2998, "loss_nan_ranks": 0, "loss_rank_avg": 0.20830413699150085, "step": 3855, "valid_targets_mean": 6659.2, "valid_targets_min": 1634 }, { "epoch": 3.9073417721518986, "grad_norm": 0.31278015955485905, "learning_rate": 5.556385996623334e-06, "loss": 0.3024, "loss_nan_ranks": 0, "loss_rank_avg": 0.1927700638771057, "step": 3860, "valid_targets_mean": 6460.9, "valid_targets_min": 1493 }, { "epoch": 3.912405063291139, "grad_norm": 0.3183546633710576, "learning_rate": 5.507599645160688e-06, "loss": 0.2956, "loss_nan_ranks": 0, "loss_rank_avg": 0.14958074688911438, "step": 3865, "valid_targets_mean": 4336.2, "valid_targets_min": 1153 }, { "epoch": 3.9174683544303797, "grad_norm": 0.2926146837393363, "learning_rate": 5.45899419459015e-06, "loss": 0.317, "loss_nan_ranks": 0, "loss_rank_avg": 0.11325857788324356, "step": 3870, "valid_targets_mean": 3313.8, "valid_targets_min": 775 }, { "epoch": 3.92253164556962, "grad_norm": 0.2947057963950262, "learning_rate": 5.410570251627587e-06, "loss": 0.2958, "loss_nan_ranks": 0, "loss_rank_avg": 0.1467699259519577, "step": 3875, "valid_targets_mean": 5764.1, "valid_targets_min": 1283 }, { "epoch": 3.9275949367088607, "grad_norm": 0.29570913844534924, "learning_rate": 5.362328420723208e-06, "loss": 0.2956, "loss_nan_ranks": 0, "loss_rank_avg": 0.14309361577033997, "step": 3880, "valid_targets_mean": 4847.8, "valid_targets_min": 927 }, { "epoch": 3.9326582278481013, "grad_norm": 0.3026281684204848, "learning_rate": 5.314269304054029e-06, "loss": 0.29, "loss_nan_ranks": 0, "loss_rank_avg": 0.19492954015731812, "step": 3885, "valid_targets_mean": 5634.2, "valid_targets_min": 1361 }, { "epoch": 3.937721518987342, "grad_norm": 0.30964406158183067, "learning_rate": 5.26639350151632e-06, "loss": 0.3055, "loss_nan_ranks": 0, "loss_rank_avg": 0.13411834836006165, "step": 3890, "valid_targets_mean": 4035.8, "valid_targets_min": 1199 }, { "epoch": 3.9427848101265823, "grad_norm": 0.3111439221332038, "learning_rate": 5.218701610718162e-06, "loss": 0.3044, "loss_nan_ranks": 0, "loss_rank_avg": 0.1787598729133606, "step": 3895, "valid_targets_mean": 5102.0, "valid_targets_min": 1779 }, { "epoch": 3.947848101265823, "grad_norm": 0.256548917813654, "learning_rate": 5.171194226971947e-06, "loss": 0.3164, "loss_nan_ranks": 0, "loss_rank_avg": 0.15520493686199188, "step": 3900, "valid_targets_mean": 5819.2, "valid_targets_min": 913 }, { "epoch": 3.9529113924050634, "grad_norm": 0.35240271321787325, "learning_rate": 5.12387194328696e-06, "loss": 0.2864, "loss_nan_ranks": 0, "loss_rank_avg": 0.100287064909935, "step": 3905, "valid_targets_mean": 2803.6, "valid_targets_min": 1229 }, { "epoch": 3.957974683544304, "grad_norm": 0.28051305016909855, "learning_rate": 5.0767353503620055e-06, "loss": 0.3012, "loss_nan_ranks": 0, "loss_rank_avg": 0.11824625730514526, "step": 3910, "valid_targets_mean": 4403.1, "valid_targets_min": 1454 }, { "epoch": 3.9630379746835445, "grad_norm": 0.33648253442313436, "learning_rate": 5.029785036577976e-06, "loss": 0.3047, "loss_nan_ranks": 0, "loss_rank_avg": 0.12415116280317307, "step": 3915, "valid_targets_mean": 3484.4, "valid_targets_min": 1290 }, { "epoch": 3.968101265822785, "grad_norm": 0.3051655834868841, "learning_rate": 4.983021587990577e-06, "loss": 0.2999, "loss_nan_ranks": 0, "loss_rank_avg": 0.16038689017295837, "step": 3920, "valid_targets_mean": 4039.8, "valid_targets_min": 1423 }, { "epoch": 3.9731645569620255, "grad_norm": 0.3149366075705648, "learning_rate": 4.936445588322947e-06, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.17041844129562378, "step": 3925, "valid_targets_mean": 4645.1, "valid_targets_min": 1388 }, { "epoch": 3.978227848101266, "grad_norm": 0.3104948744129676, "learning_rate": 4.890057618958406e-06, "loss": 0.3008, "loss_nan_ranks": 0, "loss_rank_avg": 0.13706716895103455, "step": 3930, "valid_targets_mean": 4148.2, "valid_targets_min": 918 }, { "epoch": 3.9832911392405066, "grad_norm": 0.4596385567964535, "learning_rate": 4.843858258933207e-06, "loss": 0.306, "loss_nan_ranks": 0, "loss_rank_avg": 0.12977036833763123, "step": 3935, "valid_targets_mean": 4589.1, "valid_targets_min": 1135 }, { "epoch": 3.9883544303797467, "grad_norm": 0.35205194291692793, "learning_rate": 4.797848084929271e-06, "loss": 0.2963, "loss_nan_ranks": 0, "loss_rank_avg": 0.16180771589279175, "step": 3940, "valid_targets_mean": 4005.4, "valid_targets_min": 1682 }, { "epoch": 3.993417721518987, "grad_norm": 0.3115344869207087, "learning_rate": 4.7520276712670344e-06, "loss": 0.3138, "loss_nan_ranks": 0, "loss_rank_avg": 0.1245289221405983, "step": 3945, "valid_targets_mean": 3869.5, "valid_targets_min": 1814 }, { "epoch": 3.9984810126582278, "grad_norm": 0.3447482808883552, "learning_rate": 4.706397589898237e-06, "loss": 0.2992, "loss_nan_ranks": 0, "loss_rank_avg": 0.21260038018226624, "step": 3950, "valid_targets_mean": 4663.9, "valid_targets_min": 1153 }, { "epoch": 4.0030379746835445, "grad_norm": 0.31704002367241657, "learning_rate": 4.660958410398808e-06, "loss": 0.2938, "loss_nan_ranks": 0, "loss_rank_avg": 0.11520913243293762, "step": 3955, "valid_targets_mean": 3230.5, "valid_targets_min": 1024 }, { "epoch": 4.008101265822785, "grad_norm": 0.3107759512067684, "learning_rate": 4.61571069996176e-06, "loss": 0.3067, "loss_nan_ranks": 0, "loss_rank_avg": 0.15815721452236176, "step": 3960, "valid_targets_mean": 4538.7, "valid_targets_min": 763 }, { "epoch": 4.013164556962026, "grad_norm": 0.3240449542122713, "learning_rate": 4.5706550233900825e-06, "loss": 0.2895, "loss_nan_ranks": 0, "loss_rank_avg": 0.1527724266052246, "step": 3965, "valid_targets_mean": 4152.1, "valid_targets_min": 1278 }, { "epoch": 4.018227848101266, "grad_norm": 0.3371371879535488, "learning_rate": 4.5257919430897305e-06, "loss": 0.2919, "loss_nan_ranks": 0, "loss_rank_avg": 0.14754730463027954, "step": 3970, "valid_targets_mean": 3785.3, "valid_targets_min": 1269 }, { "epoch": 4.023291139240507, "grad_norm": 0.28767581366652223, "learning_rate": 4.481122019062562e-06, "loss": 0.2976, "loss_nan_ranks": 0, "loss_rank_avg": 0.14282898604869843, "step": 3975, "valid_targets_mean": 4653.0, "valid_targets_min": 1265 }, { "epoch": 4.028354430379747, "grad_norm": 0.29732809453534903, "learning_rate": 4.436645808899374e-06, "loss": 0.3062, "loss_nan_ranks": 0, "loss_rank_avg": 0.18286307156085968, "step": 3980, "valid_targets_mean": 5864.7, "valid_targets_min": 1531 }, { "epoch": 4.033417721518988, "grad_norm": 0.29104777332578374, "learning_rate": 4.3923638677729506e-06, "loss": 0.292, "loss_nan_ranks": 0, "loss_rank_avg": 0.15134663879871368, "step": 3985, "valid_targets_mean": 5712.8, "valid_targets_min": 923 }, { "epoch": 4.038481012658228, "grad_norm": 0.34370328700294156, "learning_rate": 4.348276748431095e-06, "loss": 0.2889, "loss_nan_ranks": 0, "loss_rank_avg": 0.16227614879608154, "step": 3990, "valid_targets_mean": 4682.2, "valid_targets_min": 1365 }, { "epoch": 4.043544303797469, "grad_norm": 0.2853726249793705, "learning_rate": 4.304385001189781e-06, "loss": 0.292, "loss_nan_ranks": 0, "loss_rank_avg": 0.15851733088493347, "step": 3995, "valid_targets_mean": 5396.8, "valid_targets_min": 1278 }, { "epoch": 4.048607594936709, "grad_norm": 0.2664334385740433, "learning_rate": 4.260689173926238e-06, "loss": 0.3008, "loss_nan_ranks": 0, "loss_rank_avg": 0.1690644472837448, "step": 4000, "valid_targets_mean": 6774.5, "valid_targets_min": 1292 }, { "epoch": 4.053670886075949, "grad_norm": 0.27904233780454435, "learning_rate": 4.217189812072131e-06, "loss": 0.2918, "loss_nan_ranks": 0, "loss_rank_avg": 0.13511596620082855, "step": 4005, "valid_targets_mean": 4486.5, "valid_targets_min": 1562 }, { "epoch": 4.0587341772151895, "grad_norm": 0.3231775999779525, "learning_rate": 4.173887458606767e-06, "loss": 0.3074, "loss_nan_ranks": 0, "loss_rank_avg": 0.11682070791721344, "step": 4010, "valid_targets_mean": 3668.7, "valid_targets_min": 1126 }, { "epoch": 4.06379746835443, "grad_norm": 0.2770166025598625, "learning_rate": 4.130782654050283e-06, "loss": 0.3007, "loss_nan_ranks": 0, "loss_rank_avg": 0.15404465794563293, "step": 4015, "valid_targets_mean": 5586.6, "valid_targets_min": 1272 }, { "epoch": 4.0688607594936705, "grad_norm": 0.27479033637998745, "learning_rate": 4.087875936456937e-06, "loss": 0.2758, "loss_nan_ranks": 0, "loss_rank_avg": 0.12938356399536133, "step": 4020, "valid_targets_mean": 5243.8, "valid_targets_min": 1267 }, { "epoch": 4.073924050632911, "grad_norm": 0.31378983164450186, "learning_rate": 4.045167841408359e-06, "loss": 0.3017, "loss_nan_ranks": 0, "loss_rank_avg": 0.15723198652267456, "step": 4025, "valid_targets_mean": 4392.6, "valid_targets_min": 1232 }, { "epoch": 4.078987341772152, "grad_norm": 0.29002739575691505, "learning_rate": 4.002658902006893e-06, "loss": 0.2859, "loss_nan_ranks": 0, "loss_rank_avg": 0.15544429421424866, "step": 4030, "valid_targets_mean": 5350.4, "valid_targets_min": 909 }, { "epoch": 4.084050632911392, "grad_norm": 0.3087847959185058, "learning_rate": 3.9603496488689174e-06, "loss": 0.2968, "loss_nan_ranks": 0, "loss_rank_avg": 0.16527938842773438, "step": 4035, "valid_targets_mean": 5526.1, "valid_targets_min": 1129 }, { "epoch": 4.089113924050633, "grad_norm": 0.3085791674780826, "learning_rate": 3.918240610118234e-06, "loss": 0.2936, "loss_nan_ranks": 0, "loss_rank_avg": 0.1917693018913269, "step": 4040, "valid_targets_mean": 6275.9, "valid_targets_min": 1748 }, { "epoch": 4.094177215189873, "grad_norm": 0.286080067957159, "learning_rate": 3.876332311379489e-06, "loss": 0.2979, "loss_nan_ranks": 0, "loss_rank_avg": 0.1519317775964737, "step": 4045, "valid_targets_mean": 5526.4, "valid_targets_min": 1127 }, { "epoch": 4.099240506329114, "grad_norm": 0.2837484355272842, "learning_rate": 3.834625275771582e-06, "loss": 0.2926, "loss_nan_ranks": 0, "loss_rank_avg": 0.123206228017807, "step": 4050, "valid_targets_mean": 4113.7, "valid_targets_min": 1252 }, { "epoch": 4.104303797468354, "grad_norm": 0.2999251731420047, "learning_rate": 3.7931200239011643e-06, "loss": 0.2945, "loss_nan_ranks": 0, "loss_rank_avg": 0.13318127393722534, "step": 4055, "valid_targets_mean": 4568.8, "valid_targets_min": 1236 }, { "epoch": 4.109367088607595, "grad_norm": 0.2816382941308749, "learning_rate": 3.7518170738561168e-06, "loss": 0.2923, "loss_nan_ranks": 0, "loss_rank_avg": 0.14610666036605835, "step": 4060, "valid_targets_mean": 4928.9, "valid_targets_min": 826 }, { "epoch": 4.114430379746835, "grad_norm": 0.32554297974189644, "learning_rate": 3.7107169411991127e-06, "loss": 0.3074, "loss_nan_ranks": 0, "loss_rank_avg": 0.12090884894132614, "step": 4065, "valid_targets_mean": 3398.6, "valid_targets_min": 1385 }, { "epoch": 4.119493670886076, "grad_norm": 0.3170024428197897, "learning_rate": 3.6698201389611423e-06, "loss": 0.2839, "loss_nan_ranks": 0, "loss_rank_avg": 0.13328410685062408, "step": 4070, "valid_targets_mean": 4025.0, "valid_targets_min": 901 }, { "epoch": 4.124556962025316, "grad_norm": 0.3205485924763668, "learning_rate": 3.62912717763515e-06, "loss": 0.3124, "loss_nan_ranks": 0, "loss_rank_avg": 0.21576707065105438, "step": 4075, "valid_targets_mean": 6120.9, "valid_targets_min": 1421 }, { "epoch": 4.129620253164557, "grad_norm": 0.38654381765739637, "learning_rate": 3.5886385651696267e-06, "loss": 0.287, "loss_nan_ranks": 0, "loss_rank_avg": 0.14297889173030853, "step": 4080, "valid_targets_mean": 4917.6, "valid_targets_min": 1098 }, { "epoch": 4.1346835443037975, "grad_norm": 0.3524477589713149, "learning_rate": 3.5483548069623043e-06, "loss": 0.3032, "loss_nan_ranks": 0, "loss_rank_avg": 0.14278902113437653, "step": 4085, "valid_targets_mean": 3844.8, "valid_targets_min": 1260 }, { "epoch": 4.139746835443038, "grad_norm": 0.3197809913122213, "learning_rate": 3.5082764058538056e-06, "loss": 0.2891, "loss_nan_ranks": 0, "loss_rank_avg": 0.12523522973060608, "step": 4090, "valid_targets_mean": 3690.5, "valid_targets_min": 885 }, { "epoch": 4.1448101265822785, "grad_norm": 0.30886469526940097, "learning_rate": 3.4684038621214124e-06, "loss": 0.2829, "loss_nan_ranks": 0, "loss_rank_avg": 0.16583015024662018, "step": 4095, "valid_targets_mean": 5001.4, "valid_targets_min": 1243 }, { "epoch": 4.149873417721519, "grad_norm": 0.28226754473975985, "learning_rate": 3.4287376734727817e-06, "loss": 0.2931, "loss_nan_ranks": 0, "loss_rank_avg": 0.16582466661930084, "step": 4100, "valid_targets_mean": 5544.1, "valid_targets_min": 1022 }, { "epoch": 4.15493670886076, "grad_norm": 0.3051843817153008, "learning_rate": 3.3892783350397675e-06, "loss": 0.2876, "loss_nan_ranks": 0, "loss_rank_avg": 0.11235642433166504, "step": 4105, "valid_targets_mean": 3728.7, "valid_targets_min": 1019 }, { "epoch": 4.16, "grad_norm": 0.28561421446674784, "learning_rate": 3.3500263393722033e-06, "loss": 0.2821, "loss_nan_ranks": 0, "loss_rank_avg": 0.14730824530124664, "step": 4110, "valid_targets_mean": 5325.3, "valid_targets_min": 1247 }, { "epoch": 4.165063291139241, "grad_norm": 0.3396963845435047, "learning_rate": 3.310982176431785e-06, "loss": 0.285, "loss_nan_ranks": 0, "loss_rank_avg": 0.1362554281949997, "step": 4115, "valid_targets_mean": 4046.4, "valid_targets_min": 974 }, { "epoch": 4.170126582278481, "grad_norm": 0.3604026125994517, "learning_rate": 3.2721463335859484e-06, "loss": 0.2991, "loss_nan_ranks": 0, "loss_rank_avg": 0.12034134566783905, "step": 4120, "valid_targets_mean": 2845.9, "valid_targets_min": 1453 }, { "epoch": 4.175189873417722, "grad_norm": 0.3047812123169994, "learning_rate": 3.2335192956017634e-06, "loss": 0.2972, "loss_nan_ranks": 0, "loss_rank_avg": 0.1503809243440628, "step": 4125, "valid_targets_mean": 4877.8, "valid_targets_min": 1783 }, { "epoch": 4.180253164556962, "grad_norm": 0.36835014889244666, "learning_rate": 3.1951015446399247e-06, "loss": 0.2942, "loss_nan_ranks": 0, "loss_rank_avg": 0.11517144739627838, "step": 4130, "valid_targets_mean": 2904.6, "valid_targets_min": 909 }, { "epoch": 4.185316455696203, "grad_norm": 0.32918669737266704, "learning_rate": 3.156893560248688e-06, "loss": 0.3031, "loss_nan_ranks": 0, "loss_rank_avg": 0.140342578291893, "step": 4135, "valid_targets_mean": 4083.8, "valid_targets_min": 1081 }, { "epoch": 4.190379746835443, "grad_norm": 0.33957836205604514, "learning_rate": 3.118895819357908e-06, "loss": 0.2808, "loss_nan_ranks": 0, "loss_rank_avg": 0.1507326364517212, "step": 4140, "valid_targets_mean": 4652.1, "valid_targets_min": 1298 }, { "epoch": 4.195443037974684, "grad_norm": 0.285494983139607, "learning_rate": 3.081108796273098e-06, "loss": 0.301, "loss_nan_ranks": 0, "loss_rank_avg": 0.12487950921058655, "step": 4145, "valid_targets_mean": 4737.4, "valid_targets_min": 1243 }, { "epoch": 4.200506329113924, "grad_norm": 0.32355832904009185, "learning_rate": 3.0435329626694733e-06, "loss": 0.3044, "loss_nan_ranks": 0, "loss_rank_avg": 0.18284101784229279, "step": 4150, "valid_targets_mean": 4946.2, "valid_targets_min": 1066 }, { "epoch": 4.205569620253165, "grad_norm": 0.2901811873935047, "learning_rate": 3.006168787586097e-06, "loss": 0.2793, "loss_nan_ranks": 0, "loss_rank_avg": 0.13859279453754425, "step": 4155, "valid_targets_mean": 5316.1, "valid_targets_min": 1099 }, { "epoch": 4.2106329113924055, "grad_norm": 0.5190123284320625, "learning_rate": 2.9690167374200075e-06, "loss": 0.2972, "loss_nan_ranks": 0, "loss_rank_avg": 0.1444871723651886, "step": 4160, "valid_targets_mean": 4388.6, "valid_targets_min": 1162 }, { "epoch": 4.215696202531646, "grad_norm": 0.31722642981901594, "learning_rate": 2.9320772759203975e-06, "loss": 0.2988, "loss_nan_ranks": 0, "loss_rank_avg": 0.13206876814365387, "step": 4165, "valid_targets_mean": 4130.3, "valid_targets_min": 1281 }, { "epoch": 4.220759493670886, "grad_norm": 0.30916942149206356, "learning_rate": 2.8953508641828375e-06, "loss": 0.3024, "loss_nan_ranks": 0, "loss_rank_avg": 0.1427369862794876, "step": 4170, "valid_targets_mean": 4538.5, "valid_targets_min": 1313 }, { "epoch": 4.225822784810126, "grad_norm": 0.3075492109138346, "learning_rate": 2.858837960643499e-06, "loss": 0.3005, "loss_nan_ranks": 0, "loss_rank_avg": 0.17169958353042603, "step": 4175, "valid_targets_mean": 4840.8, "valid_targets_min": 1296 }, { "epoch": 4.230886075949367, "grad_norm": 0.29933826061321767, "learning_rate": 2.822539021073463e-06, "loss": 0.3067, "loss_nan_ranks": 0, "loss_rank_avg": 0.16137537360191345, "step": 4180, "valid_targets_mean": 5634.3, "valid_targets_min": 1130 }, { "epoch": 4.235949367088607, "grad_norm": 0.29690888264127147, "learning_rate": 2.786454498572997e-06, "loss": 0.2857, "loss_nan_ranks": 0, "loss_rank_avg": 0.135961651802063, "step": 4185, "valid_targets_mean": 4399.6, "valid_targets_min": 732 }, { "epoch": 4.241012658227848, "grad_norm": 0.3246955608047686, "learning_rate": 2.7505848435659156e-06, "loss": 0.3044, "loss_nan_ranks": 0, "loss_rank_avg": 0.1551479548215866, "step": 4190, "valid_targets_mean": 4534.1, "valid_targets_min": 1082 }, { "epoch": 4.246075949367088, "grad_norm": 0.29829478040788515, "learning_rate": 2.7149305037939687e-06, "loss": 0.2932, "loss_nan_ranks": 0, "loss_rank_avg": 0.18227550387382507, "step": 4195, "valid_targets_mean": 5650.3, "valid_targets_min": 1359 }, { "epoch": 4.251139240506329, "grad_norm": 0.3491396172417171, "learning_rate": 2.679491924311226e-06, "loss": 0.2841, "loss_nan_ranks": 0, "loss_rank_avg": 0.13989317417144775, "step": 4200, "valid_targets_mean": 3527.8, "valid_targets_min": 1094 }, { "epoch": 4.256202531645569, "grad_norm": 0.3062465471975927, "learning_rate": 2.644269547478555e-06, "loss": 0.304, "loss_nan_ranks": 0, "loss_rank_avg": 0.16212749481201172, "step": 4205, "valid_targets_mean": 4856.2, "valid_targets_min": 850 }, { "epoch": 4.26126582278481, "grad_norm": 0.31154484975672075, "learning_rate": 2.609263812958065e-06, "loss": 0.2934, "loss_nan_ranks": 0, "loss_rank_avg": 0.10032152384519577, "step": 4210, "valid_targets_mean": 3391.6, "valid_targets_min": 1245 }, { "epoch": 4.2663291139240505, "grad_norm": 0.3276187265653155, "learning_rate": 2.5744751577076343e-06, "loss": 0.2924, "loss_nan_ranks": 0, "loss_rank_avg": 0.16798563301563263, "step": 4215, "valid_targets_mean": 4301.5, "valid_targets_min": 828 }, { "epoch": 4.271392405063291, "grad_norm": 0.31771678562930245, "learning_rate": 2.539904015975476e-06, "loss": 0.2932, "loss_nan_ranks": 0, "loss_rank_avg": 0.14239826798439026, "step": 4220, "valid_targets_mean": 4702.1, "valid_targets_min": 1064 }, { "epoch": 4.2764556962025315, "grad_norm": 0.2979983224769533, "learning_rate": 2.5055508192946732e-06, "loss": 0.3026, "loss_nan_ranks": 0, "loss_rank_avg": 0.15499252080917358, "step": 4225, "valid_targets_mean": 4931.4, "valid_targets_min": 1420 }, { "epoch": 4.281518987341772, "grad_norm": 0.3378145372579719, "learning_rate": 2.4714159964778394e-06, "loss": 0.2766, "loss_nan_ranks": 0, "loss_rank_avg": 0.15219071507453918, "step": 4230, "valid_targets_mean": 4131.9, "valid_targets_min": 1088 }, { "epoch": 4.286582278481013, "grad_norm": 0.3132928788106069, "learning_rate": 2.437499973611728e-06, "loss": 0.2861, "loss_nan_ranks": 0, "loss_rank_avg": 0.17868193984031677, "step": 4235, "valid_targets_mean": 5772.8, "valid_targets_min": 1773 }, { "epoch": 4.291645569620253, "grad_norm": 0.3049108704834252, "learning_rate": 2.403803174051933e-06, "loss": 0.2997, "loss_nan_ranks": 0, "loss_rank_avg": 0.17676058411598206, "step": 4240, "valid_targets_mean": 5360.8, "valid_targets_min": 1400 }, { "epoch": 4.296708860759494, "grad_norm": 0.2674881690807918, "learning_rate": 2.3703260184176103e-06, "loss": 0.2849, "loss_nan_ranks": 0, "loss_rank_avg": 0.11438636481761932, "step": 4245, "valid_targets_mean": 4663.1, "valid_targets_min": 991 }, { "epoch": 4.301772151898734, "grad_norm": 0.3381875004506121, "learning_rate": 2.337068924586203e-06, "loss": 0.3034, "loss_nan_ranks": 0, "loss_rank_avg": 0.14016669988632202, "step": 4250, "valid_targets_mean": 3257.6, "valid_targets_min": 973 }, { "epoch": 4.306835443037975, "grad_norm": 0.33566799216440724, "learning_rate": 2.3040323076882578e-06, "loss": 0.2852, "loss_nan_ranks": 0, "loss_rank_avg": 0.1721951961517334, "step": 4255, "valid_targets_mean": 4602.8, "valid_targets_min": 1312 }, { "epoch": 4.311898734177215, "grad_norm": 0.39194447138918637, "learning_rate": 2.2712165801022046e-06, "loss": 0.2997, "loss_nan_ranks": 0, "loss_rank_avg": 0.1366182416677475, "step": 4260, "valid_targets_mean": 2721.6, "valid_targets_min": 913 }, { "epoch": 4.316962025316456, "grad_norm": 0.3637100172839474, "learning_rate": 2.2386221514492502e-06, "loss": 0.2911, "loss_nan_ranks": 0, "loss_rank_avg": 0.11843443661928177, "step": 4265, "valid_targets_mean": 3167.0, "valid_targets_min": 1022 }, { "epoch": 4.322025316455696, "grad_norm": 0.32727869850436964, "learning_rate": 2.2062494285882363e-06, "loss": 0.3013, "loss_nan_ranks": 0, "loss_rank_avg": 0.1746322512626648, "step": 4270, "valid_targets_mean": 4557.8, "valid_targets_min": 939 }, { "epoch": 4.327088607594937, "grad_norm": 0.35219909889872136, "learning_rate": 2.1740988156105593e-06, "loss": 0.2937, "loss_nan_ranks": 0, "loss_rank_avg": 0.08915197849273682, "step": 4275, "valid_targets_mean": 2497.8, "valid_targets_min": 1172 }, { "epoch": 4.332151898734177, "grad_norm": 0.3312024847124787, "learning_rate": 2.142170713835161e-06, "loss": 0.2925, "loss_nan_ranks": 0, "loss_rank_avg": 0.16628465056419373, "step": 4280, "valid_targets_mean": 4481.7, "valid_targets_min": 1417 }, { "epoch": 4.337215189873418, "grad_norm": 0.26123810507474954, "learning_rate": 2.1104655218034685e-06, "loss": 0.2875, "loss_nan_ranks": 0, "loss_rank_avg": 0.136556938290596, "step": 4285, "valid_targets_mean": 5086.1, "valid_targets_min": 1214 }, { "epoch": 4.3422784810126585, "grad_norm": 0.28913080019288895, "learning_rate": 2.0789836352744653e-06, "loss": 0.3025, "loss_nan_ranks": 0, "loss_rank_avg": 0.1929275244474411, "step": 4290, "valid_targets_mean": 6718.0, "valid_targets_min": 666 }, { "epoch": 4.347341772151899, "grad_norm": 0.2856092567973034, "learning_rate": 2.0477254472197237e-06, "loss": 0.2857, "loss_nan_ranks": 0, "loss_rank_avg": 0.12290873378515244, "step": 4295, "valid_targets_mean": 4296.3, "valid_targets_min": 828 }, { "epoch": 4.3524050632911395, "grad_norm": 0.376756316497093, "learning_rate": 2.0166913478185004e-06, "loss": 0.2969, "loss_nan_ranks": 0, "loss_rank_avg": 0.1333305984735489, "step": 4300, "valid_targets_mean": 4643.4, "valid_targets_min": 1007 }, { "epoch": 4.35746835443038, "grad_norm": 0.37269967571373286, "learning_rate": 1.9858817244528896e-06, "loss": 0.2771, "loss_nan_ranks": 0, "loss_rank_avg": 0.16167780756950378, "step": 4305, "valid_targets_mean": 3327.0, "valid_targets_min": 1248 }, { "epoch": 4.362531645569621, "grad_norm": 0.36507367284654024, "learning_rate": 1.955296961702955e-06, "loss": 0.2891, "loss_nan_ranks": 0, "loss_rank_avg": 0.1149420514702797, "step": 4310, "valid_targets_mean": 3484.9, "valid_targets_min": 1218 }, { "epoch": 4.367594936708861, "grad_norm": 0.3549138995526032, "learning_rate": 1.9249374413419584e-06, "loss": 0.3209, "loss_nan_ranks": 0, "loss_rank_avg": 0.16552500426769257, "step": 4315, "valid_targets_mean": 4319.2, "valid_targets_min": 1166 }, { "epoch": 4.372658227848102, "grad_norm": 0.30961509363434114, "learning_rate": 1.894803542331567e-06, "loss": 0.2936, "loss_nan_ranks": 0, "loss_rank_avg": 0.12911680340766907, "step": 4320, "valid_targets_mean": 3623.0, "valid_targets_min": 1170 }, { "epoch": 4.377721518987342, "grad_norm": 0.30219606387390835, "learning_rate": 1.8648956408171547e-06, "loss": 0.2973, "loss_nan_ranks": 0, "loss_rank_avg": 0.1574065387248993, "step": 4325, "valid_targets_mean": 4955.6, "valid_targets_min": 1679 }, { "epoch": 4.382784810126582, "grad_norm": 0.3279169523694041, "learning_rate": 1.8352141101230758e-06, "loss": 0.2983, "loss_nan_ranks": 0, "loss_rank_avg": 0.1483180820941925, "step": 4330, "valid_targets_mean": 3969.1, "valid_targets_min": 1428 }, { "epoch": 4.387848101265822, "grad_norm": 0.3105228186529775, "learning_rate": 1.8057593207480194e-06, "loss": 0.2979, "loss_nan_ranks": 0, "loss_rank_avg": 0.11923258006572723, "step": 4335, "valid_targets_mean": 3387.1, "valid_targets_min": 1009 }, { "epoch": 4.392911392405063, "grad_norm": 0.33881080054396395, "learning_rate": 1.7765316403603927e-06, "loss": 0.2916, "loss_nan_ranks": 0, "loss_rank_avg": 0.13051745295524597, "step": 4340, "valid_targets_mean": 3938.3, "valid_targets_min": 1204 }, { "epoch": 4.397974683544303, "grad_norm": 0.2859920210081916, "learning_rate": 1.7475314337937099e-06, "loss": 0.2971, "loss_nan_ranks": 0, "loss_rank_avg": 0.14054298400878906, "step": 4345, "valid_targets_mean": 4863.8, "valid_targets_min": 1288 }, { "epoch": 4.403037974683544, "grad_norm": 0.3222088763676915, "learning_rate": 1.7187590630420681e-06, "loss": 0.2911, "loss_nan_ranks": 0, "loss_rank_avg": 0.15554268658161163, "step": 4350, "valid_targets_mean": 3944.6, "valid_targets_min": 1256 }, { "epoch": 4.4081012658227845, "grad_norm": 0.32147293328088156, "learning_rate": 1.6902148872555924e-06, "loss": 0.2983, "loss_nan_ranks": 0, "loss_rank_avg": 0.13429546356201172, "step": 4355, "valid_targets_mean": 3537.0, "valid_targets_min": 1501 }, { "epoch": 4.413164556962025, "grad_norm": 0.2873112295172894, "learning_rate": 1.661899262735991e-06, "loss": 0.2809, "loss_nan_ranks": 0, "loss_rank_avg": 0.11225029826164246, "step": 4360, "valid_targets_mean": 3726.2, "valid_targets_min": 1432 }, { "epoch": 4.418227848101266, "grad_norm": 0.3137420905534193, "learning_rate": 1.6338125429320694e-06, "loss": 0.3025, "loss_nan_ranks": 0, "loss_rank_avg": 0.1628667116165161, "step": 4365, "valid_targets_mean": 4489.4, "valid_targets_min": 1251 }, { "epoch": 4.423291139240506, "grad_norm": 0.2980697010922971, "learning_rate": 1.605955078435355e-06, "loss": 0.2861, "loss_nan_ranks": 0, "loss_rank_avg": 0.1740245670080185, "step": 4370, "valid_targets_mean": 5941.4, "valid_targets_min": 949 }, { "epoch": 4.428354430379747, "grad_norm": 0.29655956780164205, "learning_rate": 1.5783272169756903e-06, "loss": 0.2888, "loss_nan_ranks": 0, "loss_rank_avg": 0.12947620451450348, "step": 4375, "valid_targets_mean": 4607.8, "valid_targets_min": 1670 }, { "epoch": 4.433417721518987, "grad_norm": 0.28159919536576594, "learning_rate": 1.550929303416917e-06, "loss": 0.2891, "loss_nan_ranks": 0, "loss_rank_avg": 0.11871195584535599, "step": 4380, "valid_targets_mean": 4622.2, "valid_targets_min": 1319 }, { "epoch": 4.438481012658228, "grad_norm": 0.3159849176088272, "learning_rate": 1.5237616797525512e-06, "loss": 0.2964, "loss_nan_ranks": 0, "loss_rank_avg": 0.13893471658229828, "step": 4385, "valid_targets_mean": 4139.4, "valid_targets_min": 1377 }, { "epoch": 4.443544303797468, "grad_norm": 0.3103371076544768, "learning_rate": 1.49682468510153e-06, "loss": 0.292, "loss_nan_ranks": 0, "loss_rank_avg": 0.17314529418945312, "step": 4390, "valid_targets_mean": 5825.6, "valid_targets_min": 1000 }, { "epoch": 4.448607594936709, "grad_norm": 0.28729653443614084, "learning_rate": 1.4701186557039648e-06, "loss": 0.2844, "loss_nan_ranks": 0, "loss_rank_avg": 0.13900840282440186, "step": 4395, "valid_targets_mean": 4918.3, "valid_targets_min": 1337 }, { "epoch": 4.453670886075949, "grad_norm": 0.3411738428471954, "learning_rate": 1.4436439249169554e-06, "loss": 0.3038, "loss_nan_ranks": 0, "loss_rank_avg": 0.13948732614517212, "step": 4400, "valid_targets_mean": 5576.6, "valid_targets_min": 1142 }, { "epoch": 4.45873417721519, "grad_norm": 0.3118105881962252, "learning_rate": 1.4174008232104285e-06, "loss": 0.2997, "loss_nan_ranks": 0, "loss_rank_avg": 0.13870777189731598, "step": 4405, "valid_targets_mean": 4355.1, "valid_targets_min": 1522 }, { "epoch": 4.46379746835443, "grad_norm": 0.32978343142383926, "learning_rate": 1.3913896781629954e-06, "loss": 0.2975, "loss_nan_ranks": 0, "loss_rank_avg": 0.13087686896324158, "step": 4410, "valid_targets_mean": 3731.3, "valid_targets_min": 540 }, { "epoch": 4.468860759493671, "grad_norm": 0.2618923931315447, "learning_rate": 1.3656108144578962e-06, "loss": 0.2879, "loss_nan_ranks": 0, "loss_rank_avg": 0.13182973861694336, "step": 4415, "valid_targets_mean": 4776.1, "valid_targets_min": 889 }, { "epoch": 4.473924050632911, "grad_norm": 0.27864898068700833, "learning_rate": 1.340064553878908e-06, "loss": 0.2865, "loss_nan_ranks": 0, "loss_rank_avg": 0.14037862420082092, "step": 4420, "valid_targets_mean": 5322.2, "valid_targets_min": 1116 }, { "epoch": 4.478987341772152, "grad_norm": 0.2935646123466447, "learning_rate": 1.3147512153063558e-06, "loss": 0.2848, "loss_nan_ranks": 0, "loss_rank_avg": 0.18074341118335724, "step": 4425, "valid_targets_mean": 6079.2, "valid_targets_min": 1329 }, { "epoch": 4.4840506329113925, "grad_norm": 0.34486016144946086, "learning_rate": 1.289671114713129e-06, "loss": 0.2996, "loss_nan_ranks": 0, "loss_rank_avg": 0.1330321580171585, "step": 4430, "valid_targets_mean": 3942.1, "valid_targets_min": 906 }, { "epoch": 4.489113924050633, "grad_norm": 0.3344555372523651, "learning_rate": 1.264824565160716e-06, "loss": 0.2802, "loss_nan_ranks": 0, "loss_rank_avg": 0.1601177453994751, "step": 4435, "valid_targets_mean": 5832.6, "valid_targets_min": 1133 }, { "epoch": 4.494177215189874, "grad_norm": 0.31338693723543865, "learning_rate": 1.2402118767953342e-06, "loss": 0.2851, "loss_nan_ranks": 0, "loss_rank_avg": 0.11089809238910675, "step": 4440, "valid_targets_mean": 3433.5, "valid_targets_min": 1255 }, { "epoch": 4.499240506329114, "grad_norm": 0.32257737557743127, "learning_rate": 1.2158333568440183e-06, "loss": 0.2943, "loss_nan_ranks": 0, "loss_rank_avg": 0.19272515177726746, "step": 4445, "valid_targets_mean": 5173.0, "valid_targets_min": 1505 }, { "epoch": 4.504303797468355, "grad_norm": 0.31362483355013254, "learning_rate": 1.1916893096108063e-06, "loss": 0.2946, "loss_nan_ranks": 0, "loss_rank_avg": 0.1500798463821411, "step": 4450, "valid_targets_mean": 4663.4, "valid_targets_min": 1370 }, { "epoch": 4.509367088607595, "grad_norm": 0.3261715632472016, "learning_rate": 1.167780036472952e-06, "loss": 0.2959, "loss_nan_ranks": 0, "loss_rank_avg": 0.13341718912124634, "step": 4455, "valid_targets_mean": 3426.2, "valid_targets_min": 1364 }, { "epoch": 4.514430379746836, "grad_norm": 0.30597584635072983, "learning_rate": 1.1441058358771317e-06, "loss": 0.2888, "loss_nan_ranks": 0, "loss_rank_avg": 0.16293524205684662, "step": 4460, "valid_targets_mean": 4787.8, "valid_targets_min": 1378 }, { "epoch": 4.519493670886076, "grad_norm": 0.2817037355554941, "learning_rate": 1.1206670033357537e-06, "loss": 0.2906, "loss_nan_ranks": 0, "loss_rank_avg": 0.15130957961082458, "step": 4465, "valid_targets_mean": 5285.4, "valid_targets_min": 1543 }, { "epoch": 4.524556962025317, "grad_norm": 0.31694092622996994, "learning_rate": 1.0974638314232355e-06, "loss": 0.2894, "loss_nan_ranks": 0, "loss_rank_avg": 0.15193693339824677, "step": 4470, "valid_targets_mean": 4457.0, "valid_targets_min": 1065 }, { "epoch": 4.529620253164557, "grad_norm": 0.3521199068866329, "learning_rate": 1.074496609772384e-06, "loss": 0.2957, "loss_nan_ranks": 0, "loss_rank_avg": 0.12703898549079895, "step": 4475, "valid_targets_mean": 3699.0, "valid_targets_min": 1328 }, { "epoch": 4.534683544303798, "grad_norm": 0.33021283919153493, "learning_rate": 1.0517656250707575e-06, "loss": 0.2989, "loss_nan_ranks": 0, "loss_rank_avg": 0.17758193612098694, "step": 4480, "valid_targets_mean": 5269.1, "valid_targets_min": 1336 }, { "epoch": 4.539746835443038, "grad_norm": 0.29305233423571464, "learning_rate": 1.0292711610570904e-06, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.17428819835186005, "step": 4485, "valid_targets_mean": 6173.5, "valid_targets_min": 1377 }, { "epoch": 4.544810126582279, "grad_norm": 0.28819969743794543, "learning_rate": 1.007013498517766e-06, "loss": 0.2909, "loss_nan_ranks": 0, "loss_rank_avg": 0.11772993206977844, "step": 4490, "valid_targets_mean": 4622.6, "valid_targets_min": 1404 }, { "epoch": 4.549873417721519, "grad_norm": 0.28436809731542273, "learning_rate": 9.849929152832937e-07, "loss": 0.2917, "loss_nan_ranks": 0, "loss_rank_avg": 0.1377575397491455, "step": 4495, "valid_targets_mean": 4425.2, "valid_targets_min": 1292 }, { "epoch": 4.55493670886076, "grad_norm": 0.3150381879092353, "learning_rate": 9.63209686224853e-07, "loss": 0.293, "loss_nan_ranks": 0, "loss_rank_avg": 0.13312697410583496, "step": 4500, "valid_targets_mean": 3467.1, "valid_targets_min": 826 }, { "epoch": 4.5600000000000005, "grad_norm": 0.2911980506543601, "learning_rate": 9.416640832508572e-07, "loss": 0.2899, "loss_nan_ranks": 0, "loss_rank_avg": 0.16458618640899658, "step": 4505, "valid_targets_mean": 5330.3, "valid_targets_min": 980 }, { "epoch": 4.56506329113924, "grad_norm": 0.32761330476726724, "learning_rate": 9.203563753035527e-07, "loss": 0.3005, "loss_nan_ranks": 0, "loss_rank_avg": 0.15134479105472565, "step": 4510, "valid_targets_mean": 4789.5, "valid_targets_min": 1240 }, { "epoch": 4.570126582278481, "grad_norm": 0.27610230646497064, "learning_rate": 8.992868283556833e-07, "loss": 0.3023, "loss_nan_ranks": 0, "loss_rank_avg": 0.14713215827941895, "step": 4515, "valid_targets_mean": 5446.5, "valid_targets_min": 810 }, { "epoch": 4.575189873417721, "grad_norm": 0.33737396503280603, "learning_rate": 8.78455705407144e-07, "loss": 0.2892, "loss_nan_ranks": 0, "loss_rank_avg": 0.15195101499557495, "step": 4520, "valid_targets_mean": 4126.9, "valid_targets_min": 866 }, { "epoch": 4.580253164556962, "grad_norm": 0.421939799277528, "learning_rate": 8.578632664817177e-07, "loss": 0.2998, "loss_nan_ranks": 0, "loss_rank_avg": 0.15855969488620758, "step": 4525, "valid_targets_mean": 4059.2, "valid_targets_min": 1162 }, { "epoch": 4.585316455696202, "grad_norm": 0.30679616072425525, "learning_rate": 8.375097686238187e-07, "loss": 0.3003, "loss_nan_ranks": 0, "loss_rank_avg": 0.15983693301677704, "step": 4530, "valid_targets_mean": 4688.2, "valid_targets_min": 844 }, { "epoch": 4.590379746835443, "grad_norm": 0.33783626379593873, "learning_rate": 8.173954658952854e-07, "loss": 0.2979, "loss_nan_ranks": 0, "loss_rank_avg": 0.13029304146766663, "step": 4535, "valid_targets_mean": 3584.9, "valid_targets_min": 1132 }, { "epoch": 4.595443037974683, "grad_norm": 0.409725960177412, "learning_rate": 7.975206093722176e-07, "loss": 0.3019, "loss_nan_ranks": 0, "loss_rank_avg": 0.1639317274093628, "step": 4540, "valid_targets_mean": 4393.8, "valid_targets_min": 981 }, { "epoch": 4.600506329113924, "grad_norm": 0.34883872064169896, "learning_rate": 7.778854471418306e-07, "loss": 0.2912, "loss_nan_ranks": 0, "loss_rank_avg": 0.1438419073820114, "step": 4545, "valid_targets_mean": 3598.3, "valid_targets_min": 1015 }, { "epoch": 4.605569620253164, "grad_norm": 0.3163445155831429, "learning_rate": 7.584902242993708e-07, "loss": 0.2991, "loss_nan_ranks": 0, "loss_rank_avg": 0.19004172086715698, "step": 4550, "valid_targets_mean": 5218.9, "valid_targets_min": 1337 }, { "epoch": 4.610632911392405, "grad_norm": 0.28908020066387696, "learning_rate": 7.393351829450379e-07, "loss": 0.3023, "loss_nan_ranks": 0, "loss_rank_avg": 0.12715786695480347, "step": 4555, "valid_targets_mean": 4291.9, "valid_targets_min": 1068 }, { "epoch": 4.6156962025316455, "grad_norm": 0.3390758182489428, "learning_rate": 7.204205621809813e-07, "loss": 0.3018, "loss_nan_ranks": 0, "loss_rank_avg": 0.16513592004776, "step": 4560, "valid_targets_mean": 4141.6, "valid_targets_min": 1241 }, { "epoch": 4.620759493670886, "grad_norm": 0.3707332505274512, "learning_rate": 7.017465981083127e-07, "loss": 0.3019, "loss_nan_ranks": 0, "loss_rank_avg": 0.18795087933540344, "step": 4565, "valid_targets_mean": 6154.2, "valid_targets_min": 1174 }, { "epoch": 4.6258227848101265, "grad_norm": 0.3431279755640469, "learning_rate": 6.833135238241473e-07, "loss": 0.2955, "loss_nan_ranks": 0, "loss_rank_avg": 0.1402522623538971, "step": 4570, "valid_targets_mean": 3705.2, "valid_targets_min": 1346 }, { "epoch": 4.630886075949367, "grad_norm": 0.3201150073208208, "learning_rate": 6.651215694187074e-07, "loss": 0.2956, "loss_nan_ranks": 0, "loss_rank_avg": 0.13963478803634644, "step": 4575, "valid_targets_mean": 4570.6, "valid_targets_min": 1027 }, { "epoch": 4.635949367088608, "grad_norm": 0.32083737479519586, "learning_rate": 6.471709619724386e-07, "loss": 0.2811, "loss_nan_ranks": 0, "loss_rank_avg": 0.1721346378326416, "step": 4580, "valid_targets_mean": 4410.9, "valid_targets_min": 1268 }, { "epoch": 4.641012658227848, "grad_norm": 0.3413968428656355, "learning_rate": 6.294619255531853e-07, "loss": 0.2984, "loss_nan_ranks": 0, "loss_rank_avg": 0.1746809184551239, "step": 4585, "valid_targets_mean": 4543.4, "valid_targets_min": 1503 }, { "epoch": 4.646075949367089, "grad_norm": 0.2984905883347286, "learning_rate": 6.119946812133926e-07, "loss": 0.2957, "loss_nan_ranks": 0, "loss_rank_avg": 0.2020062506198883, "step": 4590, "valid_targets_mean": 7061.8, "valid_targets_min": 1615 }, { "epoch": 4.651139240506329, "grad_norm": 0.2957015403668056, "learning_rate": 5.947694469873377e-07, "loss": 0.3024, "loss_nan_ranks": 0, "loss_rank_avg": 0.1912672221660614, "step": 4595, "valid_targets_mean": 6352.6, "valid_targets_min": 1115 }, { "epoch": 4.65620253164557, "grad_norm": 0.3177142897029759, "learning_rate": 5.777864378884212e-07, "loss": 0.2905, "loss_nan_ranks": 0, "loss_rank_avg": 0.1385997235774994, "step": 4600, "valid_targets_mean": 4380.5, "valid_targets_min": 1184 }, { "epoch": 4.66126582278481, "grad_norm": 0.30671392692985, "learning_rate": 5.610458659064688e-07, "loss": 0.3067, "loss_nan_ranks": 0, "loss_rank_avg": 0.17495407164096832, "step": 4605, "valid_targets_mean": 5155.4, "valid_targets_min": 1128 }, { "epoch": 4.666329113924051, "grad_norm": 0.32460623503028924, "learning_rate": 5.445479400051046e-07, "loss": 0.2997, "loss_nan_ranks": 0, "loss_rank_avg": 0.1435496062040329, "step": 4610, "valid_targets_mean": 4002.2, "valid_targets_min": 1103 }, { "epoch": 4.671392405063291, "grad_norm": 0.3077758754022733, "learning_rate": 5.282928661191178e-07, "loss": 0.283, "loss_nan_ranks": 0, "loss_rank_avg": 0.11725576967000961, "step": 4615, "valid_targets_mean": 3599.3, "valid_targets_min": 1270 }, { "epoch": 4.676455696202532, "grad_norm": 0.2920943225927082, "learning_rate": 5.12280847151918e-07, "loss": 0.2933, "loss_nan_ranks": 0, "loss_rank_avg": 0.15268352627754211, "step": 4620, "valid_targets_mean": 4974.8, "valid_targets_min": 1238 }, { "epoch": 4.681518987341772, "grad_norm": 0.3310902814879114, "learning_rate": 4.965120829729819e-07, "loss": 0.2944, "loss_nan_ranks": 0, "loss_rank_avg": 0.1577180027961731, "step": 4625, "valid_targets_mean": 4892.1, "valid_targets_min": 1480 }, { "epoch": 4.686582278481013, "grad_norm": 0.3364738036743787, "learning_rate": 4.809867704153726e-07, "loss": 0.2962, "loss_nan_ranks": 0, "loss_rank_avg": 0.11956533789634705, "step": 4630, "valid_targets_mean": 3546.2, "valid_targets_min": 914 }, { "epoch": 4.6916455696202535, "grad_norm": 0.34774374236202665, "learning_rate": 4.657051032732707e-07, "loss": 0.3098, "loss_nan_ranks": 0, "loss_rank_avg": 0.14325565099716187, "step": 4635, "valid_targets_mean": 3353.1, "valid_targets_min": 908 }, { "epoch": 4.696708860759494, "grad_norm": 0.32445866672285933, "learning_rate": 4.506672722995609e-07, "loss": 0.2953, "loss_nan_ranks": 0, "loss_rank_avg": 0.1779376119375229, "step": 4640, "valid_targets_mean": 5084.9, "valid_targets_min": 1254 }, { "epoch": 4.7017721518987345, "grad_norm": 0.3370837185705519, "learning_rate": 4.358734652034624e-07, "loss": 0.3029, "loss_nan_ranks": 0, "loss_rank_avg": 0.12637917697429657, "step": 4645, "valid_targets_mean": 3544.5, "valid_targets_min": 1283 }, { "epoch": 4.706835443037974, "grad_norm": 0.3141292209016846, "learning_rate": 4.2132386664815783e-07, "loss": 0.3063, "loss_nan_ranks": 0, "loss_rank_avg": 0.13325795531272888, "step": 4650, "valid_targets_mean": 4623.6, "valid_targets_min": 1232 }, { "epoch": 4.711898734177215, "grad_norm": 0.3052040124075767, "learning_rate": 4.070186582485214e-07, "loss": 0.2944, "loss_nan_ranks": 0, "loss_rank_avg": 0.14848539233207703, "step": 4655, "valid_targets_mean": 3974.2, "valid_targets_min": 1752 }, { "epoch": 4.716962025316455, "grad_norm": 0.3485398015143201, "learning_rate": 3.9295801856882307e-07, "loss": 0.3033, "loss_nan_ranks": 0, "loss_rank_avg": 0.15560302138328552, "step": 4660, "valid_targets_mean": 3853.7, "valid_targets_min": 1331 }, { "epoch": 4.722025316455696, "grad_norm": 0.30603263342163534, "learning_rate": 3.791421231205217e-07, "loss": 0.2941, "loss_nan_ranks": 0, "loss_rank_avg": 0.1302764117717743, "step": 4665, "valid_targets_mean": 4759.7, "valid_targets_min": 980 }, { "epoch": 4.727088607594936, "grad_norm": 0.36206047089808735, "learning_rate": 3.6557114436005516e-07, "loss": 0.2953, "loss_nan_ranks": 0, "loss_rank_avg": 0.11317434906959534, "step": 4670, "valid_targets_mean": 2750.8, "valid_targets_min": 1281 }, { "epoch": 4.732151898734177, "grad_norm": 0.31924377751088473, "learning_rate": 3.522452516867048e-07, "loss": 0.3074, "loss_nan_ranks": 0, "loss_rank_avg": 0.19149929285049438, "step": 4675, "valid_targets_mean": 5680.5, "valid_targets_min": 1070 }, { "epoch": 4.737215189873417, "grad_norm": 0.40142669703450146, "learning_rate": 3.391646114404701e-07, "loss": 0.3025, "loss_nan_ranks": 0, "loss_rank_avg": 0.1676904857158661, "step": 4680, "valid_targets_mean": 5601.9, "valid_targets_min": 1777 }, { "epoch": 4.742278481012658, "grad_norm": 0.33298593772917773, "learning_rate": 3.263293868999928e-07, "loss": 0.2974, "loss_nan_ranks": 0, "loss_rank_avg": 0.1185358390212059, "step": 4685, "valid_targets_mean": 2993.5, "valid_targets_min": 1244 }, { "epoch": 4.7473417721518985, "grad_norm": 0.28590139808721005, "learning_rate": 3.1373973828052964e-07, "loss": 0.2946, "loss_nan_ranks": 0, "loss_rank_avg": 0.1383609175682068, "step": 4690, "valid_targets_mean": 4685.9, "valid_targets_min": 1897 }, { "epoch": 4.752405063291139, "grad_norm": 0.33045699934667616, "learning_rate": 3.013958227319358e-07, "loss": 0.2952, "loss_nan_ranks": 0, "loss_rank_avg": 0.128380686044693, "step": 4695, "valid_targets_mean": 3661.8, "valid_targets_min": 1102 }, { "epoch": 4.7574683544303795, "grad_norm": 0.3175505591380564, "learning_rate": 2.892977943367159e-07, "loss": 0.2774, "loss_nan_ranks": 0, "loss_rank_avg": 0.19775532186031342, "step": 4700, "valid_targets_mean": 5166.0, "valid_targets_min": 954 }, { "epoch": 4.76253164556962, "grad_norm": 0.2773796894575858, "learning_rate": 2.774458041080963e-07, "loss": 0.2875, "loss_nan_ranks": 0, "loss_rank_avg": 0.12263042479753494, "step": 4705, "valid_targets_mean": 4538.4, "valid_targets_min": 1559 }, { "epoch": 4.767594936708861, "grad_norm": 0.3292357564608315, "learning_rate": 2.6583999998814e-07, "loss": 0.2953, "loss_nan_ranks": 0, "loss_rank_avg": 0.14571279287338257, "step": 4710, "valid_targets_mean": 3984.7, "valid_targets_min": 1195 }, { "epoch": 4.772658227848101, "grad_norm": 0.3368831623026044, "learning_rate": 2.544805268459016e-07, "loss": 0.2867, "loss_nan_ranks": 0, "loss_rank_avg": 0.21459759771823883, "step": 4715, "valid_targets_mean": 4702.3, "valid_targets_min": 1266 }, { "epoch": 4.777721518987342, "grad_norm": 0.335601220973268, "learning_rate": 2.4336752647561304e-07, "loss": 0.2845, "loss_nan_ranks": 0, "loss_rank_avg": 0.14298905432224274, "step": 4720, "valid_targets_mean": 3874.7, "valid_targets_min": 965 }, { "epoch": 4.782784810126582, "grad_norm": 0.28413880966924987, "learning_rate": 2.3250113759492266e-07, "loss": 0.2862, "loss_nan_ranks": 0, "loss_rank_avg": 0.1618804931640625, "step": 4725, "valid_targets_mean": 5582.7, "valid_targets_min": 868 }, { "epoch": 4.787848101265823, "grad_norm": 0.3021482607745952, "learning_rate": 2.2188149584315922e-07, "loss": 0.3055, "loss_nan_ranks": 0, "loss_rank_avg": 0.15998998284339905, "step": 4730, "valid_targets_mean": 4565.1, "valid_targets_min": 1149 }, { "epoch": 4.792911392405063, "grad_norm": 0.3011882542828061, "learning_rate": 2.1150873377963954e-07, "loss": 0.3021, "loss_nan_ranks": 0, "loss_rank_avg": 0.1401754915714264, "step": 4735, "valid_targets_mean": 5010.8, "valid_targets_min": 998 }, { "epoch": 4.797974683544304, "grad_norm": 0.3507567997328214, "learning_rate": 2.0138298088201004e-07, "loss": 0.2854, "loss_nan_ranks": 0, "loss_rank_avg": 0.0675700232386589, "step": 4740, "valid_targets_mean": 2630.8, "valid_targets_min": 1155 }, { "epoch": 4.803037974683544, "grad_norm": 0.3187910514753291, "learning_rate": 1.915043635446323e-07, "loss": 0.2916, "loss_nan_ranks": 0, "loss_rank_avg": 0.12245633453130722, "step": 4745, "valid_targets_mean": 3394.0, "valid_targets_min": 1403 }, { "epoch": 4.808101265822785, "grad_norm": 0.2967133708531598, "learning_rate": 1.8187300507701345e-07, "loss": 0.3035, "loss_nan_ranks": 0, "loss_rank_avg": 0.1302807629108429, "step": 4750, "valid_targets_mean": 3881.6, "valid_targets_min": 1033 }, { "epoch": 4.813164556962025, "grad_norm": 0.30044714660435673, "learning_rate": 1.7248902570225378e-07, "loss": 0.2941, "loss_nan_ranks": 0, "loss_rank_avg": 0.13116371631622314, "step": 4755, "valid_targets_mean": 4054.7, "valid_targets_min": 886 }, { "epoch": 4.818227848101266, "grad_norm": 0.3161774057323668, "learning_rate": 1.6335254255555933e-07, "loss": 0.2925, "loss_nan_ranks": 0, "loss_rank_avg": 0.14581556618213654, "step": 4760, "valid_targets_mean": 4080.4, "valid_targets_min": 1368 }, { "epoch": 4.8232911392405065, "grad_norm": 0.30034489171760914, "learning_rate": 1.5446366968276283e-07, "loss": 0.2973, "loss_nan_ranks": 0, "loss_rank_avg": 0.1464047133922577, "step": 4765, "valid_targets_mean": 4359.5, "valid_targets_min": 1093 }, { "epoch": 4.828354430379747, "grad_norm": 0.30396263421785596, "learning_rate": 1.4582251803892055e-07, "loss": 0.2898, "loss_nan_ranks": 0, "loss_rank_avg": 0.14488472044467926, "step": 4770, "valid_targets_mean": 4854.4, "valid_targets_min": 956 }, { "epoch": 4.8334177215189875, "grad_norm": 0.25886849889886787, "learning_rate": 1.3742919548691114e-07, "loss": 0.2973, "loss_nan_ranks": 0, "loss_rank_avg": 0.13551469147205353, "step": 4775, "valid_targets_mean": 5292.5, "valid_targets_min": 1085 }, { "epoch": 4.838481012658228, "grad_norm": 0.3369536866060149, "learning_rate": 1.2928380679609442e-07, "loss": 0.2957, "loss_nan_ranks": 0, "loss_rank_avg": 0.20701755583286285, "step": 4780, "valid_targets_mean": 5313.5, "valid_targets_min": 1444 }, { "epoch": 4.843544303797469, "grad_norm": 0.2981209270612857, "learning_rate": 1.2138645364101032e-07, "loss": 0.2933, "loss_nan_ranks": 0, "loss_rank_avg": 0.11797007918357849, "step": 4785, "valid_targets_mean": 4077.7, "valid_targets_min": 1058 }, { "epoch": 4.848607594936709, "grad_norm": 0.2923056085103413, "learning_rate": 1.1373723460009756e-07, "loss": 0.2866, "loss_nan_ranks": 0, "loss_rank_avg": 0.18645049631595612, "step": 4790, "valid_targets_mean": 6275.9, "valid_targets_min": 1356 }, { "epoch": 4.85367088607595, "grad_norm": 0.31520564975094073, "learning_rate": 1.0633624515447027e-07, "loss": 0.3001, "loss_nan_ranks": 0, "loss_rank_avg": 0.1347823590040207, "step": 4795, "valid_targets_mean": 3709.9, "valid_targets_min": 1143 }, { "epoch": 4.85873417721519, "grad_norm": 0.330282900217264, "learning_rate": 9.918357768673004e-08, "loss": 0.3003, "loss_nan_ranks": 0, "loss_rank_avg": 0.10554465651512146, "step": 4800, "valid_targets_mean": 3067.8, "valid_targets_min": 1042 }, { "epoch": 4.863797468354431, "grad_norm": 0.34394007944621313, "learning_rate": 9.22793214797979e-08, "loss": 0.3043, "loss_nan_ranks": 0, "loss_rank_avg": 0.1265249103307724, "step": 4805, "valid_targets_mean": 3206.9, "valid_targets_min": 972 }, { "epoch": 4.868860759493671, "grad_norm": 0.3066301892656282, "learning_rate": 8.562356271582194e-08, "loss": 0.3032, "loss_nan_ranks": 0, "loss_rank_avg": 0.11144056916236877, "step": 4810, "valid_targets_mean": 3448.4, "valid_targets_min": 1079 }, { "epoch": 4.873924050632912, "grad_norm": 0.31898550298505707, "learning_rate": 7.92163844750804e-08, "loss": 0.2921, "loss_nan_ranks": 0, "loss_rank_avg": 0.17169725894927979, "step": 4815, "valid_targets_mean": 4453.8, "valid_targets_min": 1086 }, { "epoch": 4.878987341772152, "grad_norm": 0.35072783756221276, "learning_rate": 7.305786673495796e-08, "loss": 0.298, "loss_nan_ranks": 0, "loss_rank_avg": 0.1834912747144699, "step": 4820, "valid_targets_mean": 4796.1, "valid_targets_min": 1290 }, { "epoch": 4.884050632911393, "grad_norm": 0.30086828019346806, "learning_rate": 6.714808636893999e-08, "loss": 0.2984, "loss_nan_ranks": 0, "loss_rank_avg": 0.19445079565048218, "step": 4825, "valid_targets_mean": 5488.9, "valid_targets_min": 1013 }, { "epoch": 4.889113924050633, "grad_norm": 0.29066248451169346, "learning_rate": 6.148711714565992e-08, "loss": 0.2906, "loss_nan_ranks": 0, "loss_rank_avg": 0.14921297132968903, "step": 4830, "valid_targets_mean": 5289.1, "valid_targets_min": 1279 }, { "epoch": 4.894177215189873, "grad_norm": 0.3206808977051651, "learning_rate": 5.6075029727971075e-08, "loss": 0.294, "loss_nan_ranks": 0, "loss_rank_avg": 0.15516558289527893, "step": 4835, "valid_targets_mean": 4284.6, "valid_targets_min": 1465 }, { "epoch": 4.899240506329114, "grad_norm": 0.34136663563954944, "learning_rate": 5.091189167207189e-08, "loss": 0.3011, "loss_nan_ranks": 0, "loss_rank_avg": 0.16188789904117584, "step": 4840, "valid_targets_mean": 4162.2, "valid_targets_min": 1536 }, { "epoch": 4.904303797468354, "grad_norm": 0.2892291641651244, "learning_rate": 4.5997767426653183e-08, "loss": 0.2969, "loss_nan_ranks": 0, "loss_rank_avg": 0.11494030058383942, "step": 4845, "valid_targets_mean": 3805.9, "valid_targets_min": 950 }, { "epoch": 4.909367088607595, "grad_norm": 0.3310728562870818, "learning_rate": 4.133271833210772e-08, "loss": 0.3063, "loss_nan_ranks": 0, "loss_rank_avg": 0.15285596251487732, "step": 4850, "valid_targets_mean": 4150.3, "valid_targets_min": 1408 }, { "epoch": 4.914430379746835, "grad_norm": 0.29329622685622975, "learning_rate": 3.6916802619746395e-08, "loss": 0.2958, "loss_nan_ranks": 0, "loss_rank_avg": 0.16643556952476501, "step": 4855, "valid_targets_mean": 5756.4, "valid_targets_min": 1791 }, { "epoch": 4.919493670886076, "grad_norm": 0.3795378130128926, "learning_rate": 3.2750075411087654e-08, "loss": 0.2983, "loss_nan_ranks": 0, "loss_rank_avg": 0.20965784788131714, "step": 4860, "valid_targets_mean": 5036.8, "valid_targets_min": 1359 }, { "epoch": 4.924556962025316, "grad_norm": 0.3227285897594828, "learning_rate": 2.8832588717164766e-08, "loss": 0.2875, "loss_nan_ranks": 0, "loss_rank_avg": 0.13055765628814697, "step": 4865, "valid_targets_mean": 3481.6, "valid_targets_min": 1608 }, { "epoch": 4.929620253164557, "grad_norm": 0.30074655411206147, "learning_rate": 2.516439143786631e-08, "loss": 0.3002, "loss_nan_ranks": 0, "loss_rank_avg": 0.17739662528038025, "step": 4870, "valid_targets_mean": 5336.9, "valid_targets_min": 786 }, { "epoch": 4.934683544303797, "grad_norm": 0.37988249749008485, "learning_rate": 2.1745529361343333e-08, "loss": 0.2951, "loss_nan_ranks": 0, "loss_rank_avg": 0.18349409103393555, "step": 4875, "valid_targets_mean": 5208.7, "valid_targets_min": 1284 }, { "epoch": 4.939746835443038, "grad_norm": 0.3022387792298933, "learning_rate": 1.857604516342315e-08, "loss": 0.2971, "loss_nan_ranks": 0, "loss_rank_avg": 0.1349787563085556, "step": 4880, "valid_targets_mean": 4001.4, "valid_targets_min": 1055 }, { "epoch": 4.944810126582278, "grad_norm": 0.3239022765036362, "learning_rate": 1.5655978407085326e-08, "loss": 0.3022, "loss_nan_ranks": 0, "loss_rank_avg": 0.15572325885295868, "step": 4885, "valid_targets_mean": 4256.0, "valid_targets_min": 1282 }, { "epoch": 4.949873417721519, "grad_norm": 0.3484022919664308, "learning_rate": 1.2985365541959838e-08, "loss": 0.2871, "loss_nan_ranks": 0, "loss_rank_avg": 0.1123068630695343, "step": 4890, "valid_targets_mean": 3383.1, "valid_targets_min": 1353 }, { "epoch": 4.954936708860759, "grad_norm": 0.2766076122909068, "learning_rate": 1.0564239903885221e-08, "loss": 0.298, "loss_nan_ranks": 0, "loss_rank_avg": 0.13588979840278625, "step": 4895, "valid_targets_mean": 5022.2, "valid_targets_min": 1687 }, { "epoch": 4.96, "grad_norm": 0.3637031857594984, "learning_rate": 8.392631714477794e-09, "loss": 0.2958, "loss_nan_ranks": 0, "loss_rank_avg": 0.22151219844818115, "step": 4900, "valid_targets_mean": 4548.4, "valid_targets_min": 1055 }, { "epoch": 4.9650632911392405, "grad_norm": 0.3070617643850501, "learning_rate": 6.470568080760853e-09, "loss": 0.2957, "loss_nan_ranks": 0, "loss_rank_avg": 0.1599656343460083, "step": 4905, "valid_targets_mean": 5380.0, "valid_targets_min": 696 }, { "epoch": 4.970126582278481, "grad_norm": 0.2982099706698035, "learning_rate": 4.798072994827152e-09, "loss": 0.2819, "loss_nan_ranks": 0, "loss_rank_avg": 0.13907426595687866, "step": 4910, "valid_targets_mean": 4511.9, "valid_targets_min": 1282 }, { "epoch": 4.975189873417722, "grad_norm": 0.34819560371210506, "learning_rate": 3.3751673335458147e-09, "loss": 0.2899, "loss_nan_ranks": 0, "loss_rank_avg": 0.14076785743236542, "step": 4915, "valid_targets_mean": 3422.9, "valid_targets_min": 1383 }, { "epoch": 4.980253164556962, "grad_norm": 0.3120620502259134, "learning_rate": 2.2018688582803315e-09, "loss": 0.2976, "loss_nan_ranks": 0, "loss_rank_avg": 0.17987266182899475, "step": 4920, "valid_targets_mean": 5285.9, "valid_targets_min": 1137 }, { "epoch": 4.985316455696203, "grad_norm": 0.28626460706538365, "learning_rate": 1.2781922146931635e-09, "loss": 0.3007, "loss_nan_ranks": 0, "loss_rank_avg": 0.15345998108386993, "step": 4925, "valid_targets_mean": 5331.3, "valid_targets_min": 781 }, { "epoch": 4.990379746835443, "grad_norm": 0.30214318111472815, "learning_rate": 6.041489325459004e-10, "loss": 0.2843, "loss_nan_ranks": 0, "loss_rank_avg": 0.14609292149543762, "step": 4930, "valid_targets_mean": 4398.6, "valid_targets_min": 1460 }, { "epoch": 4.995443037974684, "grad_norm": 0.36710406768986703, "learning_rate": 1.7974742556159386e-10, "loss": 0.2945, "loss_nan_ranks": 0, "loss_rank_avg": 0.17454470694065094, "step": 4935, "valid_targets_mean": 4667.4, "valid_targets_min": 949 }, { "epoch": 5.0, "grad_norm": 0.42711913533675244, "learning_rate": 4.992991313734763e-12, "loss": 0.2954, "loss_nan_ranks": 0, "loss_rank_avg": 0.29739144444465637, "step": 4940, "valid_targets_mean": 4348.2, "valid_targets_min": 876 }, { "epoch": 5.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.29739144444465637, "step": 4940, "total_flos": 1.3775029894633226e+18, "train_loss": 0.31707094306887884, "train_runtime": 34760.1149, "train_samples_per_second": 4.545, "train_steps_per_second": 0.142, "valid_targets_mean": 4348.2, "valid_targets_min": 876 } ], "logging_steps": 5, "max_steps": 4940, "num_input_tokens_seen": 0, "num_train_epochs": 5, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": false, "should_training_stop": false }, "attributes": {} } }, "total_flos": 1.3775029894633226e+18, "train_batch_size": 1, "trial_name": null, "trial_params": null }