{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 4319, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.010351966873706004, "grad_norm": 15.605315613103867, "learning_rate": 4.71976401179941e-07, "loss": 0.6774, "loss_nan_ranks": 0, "loss_rank_avg": 0.7991642951965332, "step": 5, "valid_targets_mean": 2069.4, "valid_targets_min": 544 }, { "epoch": 0.020703933747412008, "grad_norm": 8.863140569141265, "learning_rate": 1.0619469026548673e-06, "loss": 0.7208, "loss_nan_ranks": 0, "loss_rank_avg": 0.6838527917861938, "step": 10, "valid_targets_mean": 3883.4, "valid_targets_min": 313 }, { "epoch": 0.031055900621118012, "grad_norm": 12.629168153366845, "learning_rate": 1.6519174041297937e-06, "loss": 0.685, "loss_nan_ranks": 0, "loss_rank_avg": 0.7600278854370117, "step": 15, "valid_targets_mean": 2096.7, "valid_targets_min": 618 }, { "epoch": 0.041407867494824016, "grad_norm": 6.799624906702634, "learning_rate": 2.24188790560472e-06, "loss": 0.6675, "loss_nan_ranks": 0, "loss_rank_avg": 0.6246192455291748, "step": 20, "valid_targets_mean": 3201.5, "valid_targets_min": 693 }, { "epoch": 0.051759834368530024, "grad_norm": 4.637130666016448, "learning_rate": 2.831858407079646e-06, "loss": 0.6722, "loss_nan_ranks": 0, "loss_rank_avg": 0.7706674337387085, "step": 25, "valid_targets_mean": 3519.5, "valid_targets_min": 636 }, { "epoch": 0.062111801242236024, "grad_norm": 3.1183737090108545, "learning_rate": 3.4218289085545726e-06, "loss": 0.6021, "loss_nan_ranks": 0, "loss_rank_avg": 0.6737767457962036, "step": 30, "valid_targets_mean": 3171.9, "valid_targets_min": 820 }, { "epoch": 0.07246376811594203, "grad_norm": 2.298602022892457, "learning_rate": 4.011799410029498e-06, "loss": 0.5708, "loss_nan_ranks": 0, "loss_rank_avg": 0.5966386795043945, "step": 35, "valid_targets_mean": 2413.9, "valid_targets_min": 854 }, { "epoch": 0.08281573498964803, "grad_norm": 1.9166901302469286, "learning_rate": 4.6017699115044254e-06, "loss": 0.4853, "loss_nan_ranks": 0, "loss_rank_avg": 0.5276696681976318, "step": 40, "valid_targets_mean": 1972.9, "valid_targets_min": 893 }, { "epoch": 0.09316770186335403, "grad_norm": 2.287553544660079, "learning_rate": 5.191740412979352e-06, "loss": 0.4365, "loss_nan_ranks": 0, "loss_rank_avg": 0.441994309425354, "step": 45, "valid_targets_mean": 3530.9, "valid_targets_min": 928 }, { "epoch": 0.10351966873706005, "grad_norm": 1.2570057018709198, "learning_rate": 5.781710914454279e-06, "loss": 0.4807, "loss_nan_ranks": 0, "loss_rank_avg": 0.5429658889770508, "step": 50, "valid_targets_mean": 2901.6, "valid_targets_min": 756 }, { "epoch": 0.11387163561076605, "grad_norm": 0.930016752086229, "learning_rate": 6.371681415929204e-06, "loss": 0.5788, "loss_nan_ranks": 0, "loss_rank_avg": 0.44122475385665894, "step": 55, "valid_targets_mean": 3173.3, "valid_targets_min": 515 }, { "epoch": 0.12422360248447205, "grad_norm": 0.8587397931841486, "learning_rate": 6.961651917404131e-06, "loss": 0.4867, "loss_nan_ranks": 0, "loss_rank_avg": 0.46632158756256104, "step": 60, "valid_targets_mean": 2709.9, "valid_targets_min": 781 }, { "epoch": 0.13457556935817805, "grad_norm": 0.9248959615543452, "learning_rate": 7.551622418879056e-06, "loss": 0.5078, "loss_nan_ranks": 0, "loss_rank_avg": 0.49240103363990784, "step": 65, "valid_targets_mean": 2006.4, "valid_targets_min": 645 }, { "epoch": 0.14492753623188406, "grad_norm": 0.7279615677685586, "learning_rate": 8.141592920353984e-06, "loss": 0.425, "loss_nan_ranks": 0, "loss_rank_avg": 0.39918971061706543, "step": 70, "valid_targets_mean": 3112.9, "valid_targets_min": 431 }, { "epoch": 0.15527950310559005, "grad_norm": 0.7659577874600716, "learning_rate": 8.73156342182891e-06, "loss": 0.4238, "loss_nan_ranks": 0, "loss_rank_avg": 0.40704938769340515, "step": 75, "valid_targets_mean": 2240.1, "valid_targets_min": 604 }, { "epoch": 0.16563146997929606, "grad_norm": 0.7216997725030858, "learning_rate": 9.321533923303837e-06, "loss": 0.4238, "loss_nan_ranks": 0, "loss_rank_avg": 0.43496978282928467, "step": 80, "valid_targets_mean": 3710.6, "valid_targets_min": 849 }, { "epoch": 0.17598343685300208, "grad_norm": 0.8774588952929467, "learning_rate": 9.911504424778762e-06, "loss": 0.4171, "loss_nan_ranks": 0, "loss_rank_avg": 0.43825411796569824, "step": 85, "valid_targets_mean": 1872.3, "valid_targets_min": 779 }, { "epoch": 0.18633540372670807, "grad_norm": 0.8451380882184308, "learning_rate": 1.0501474926253687e-05, "loss": 0.4484, "loss_nan_ranks": 0, "loss_rank_avg": 0.44401633739471436, "step": 90, "valid_targets_mean": 2137.0, "valid_targets_min": 597 }, { "epoch": 0.19668737060041408, "grad_norm": 0.6084483563484301, "learning_rate": 1.1091445427728616e-05, "loss": 0.4483, "loss_nan_ranks": 0, "loss_rank_avg": 0.3756181001663208, "step": 95, "valid_targets_mean": 3593.1, "valid_targets_min": 642 }, { "epoch": 0.2070393374741201, "grad_norm": 0.6213761233419673, "learning_rate": 1.1681415929203541e-05, "loss": 0.4075, "loss_nan_ranks": 0, "loss_rank_avg": 0.4502703547477722, "step": 100, "valid_targets_mean": 3648.6, "valid_targets_min": 1054 }, { "epoch": 0.21739130434782608, "grad_norm": 0.9269246228823874, "learning_rate": 1.2271386430678467e-05, "loss": 0.4266, "loss_nan_ranks": 0, "loss_rank_avg": 0.4538400173187256, "step": 105, "valid_targets_mean": 1649.7, "valid_targets_min": 1060 }, { "epoch": 0.2277432712215321, "grad_norm": 0.6575358320968785, "learning_rate": 1.2861356932153392e-05, "loss": 0.4556, "loss_nan_ranks": 0, "loss_rank_avg": 0.4259205162525177, "step": 110, "valid_targets_mean": 2929.3, "valid_targets_min": 920 }, { "epoch": 0.23809523809523808, "grad_norm": 0.7520773860181491, "learning_rate": 1.345132743362832e-05, "loss": 0.4091, "loss_nan_ranks": 0, "loss_rank_avg": 0.51981520652771, "step": 115, "valid_targets_mean": 2942.2, "valid_targets_min": 870 }, { "epoch": 0.2484472049689441, "grad_norm": 0.6260406424910655, "learning_rate": 1.4041297935103246e-05, "loss": 0.4403, "loss_nan_ranks": 0, "loss_rank_avg": 0.463638037443161, "step": 120, "valid_targets_mean": 3665.9, "valid_targets_min": 863 }, { "epoch": 0.2587991718426501, "grad_norm": 0.7666598846619594, "learning_rate": 1.4631268436578171e-05, "loss": 0.4347, "loss_nan_ranks": 0, "loss_rank_avg": 0.49128270149230957, "step": 125, "valid_targets_mean": 2527.6, "valid_targets_min": 374 }, { "epoch": 0.2691511387163561, "grad_norm": 0.863409285542385, "learning_rate": 1.5221238938053098e-05, "loss": 0.3948, "loss_nan_ranks": 0, "loss_rank_avg": 0.5175631046295166, "step": 130, "valid_targets_mean": 2604.3, "valid_targets_min": 604 }, { "epoch": 0.2795031055900621, "grad_norm": 0.6514406268066054, "learning_rate": 1.5811209439528025e-05, "loss": 0.3959, "loss_nan_ranks": 0, "loss_rank_avg": 0.3603256940841675, "step": 135, "valid_targets_mean": 2682.6, "valid_targets_min": 1039 }, { "epoch": 0.2898550724637681, "grad_norm": 0.7385382622379217, "learning_rate": 1.6401179941002953e-05, "loss": 0.3854, "loss_nan_ranks": 0, "loss_rank_avg": 0.3818318247795105, "step": 140, "valid_targets_mean": 2239.2, "valid_targets_min": 525 }, { "epoch": 0.3002070393374741, "grad_norm": 0.7388257073327376, "learning_rate": 1.6991150442477876e-05, "loss": 0.429, "loss_nan_ranks": 0, "loss_rank_avg": 0.5566807985305786, "step": 145, "valid_targets_mean": 3091.8, "valid_targets_min": 386 }, { "epoch": 0.3105590062111801, "grad_norm": 0.842626090176198, "learning_rate": 1.7581120943952803e-05, "loss": 0.4001, "loss_nan_ranks": 0, "loss_rank_avg": 0.3940976560115814, "step": 150, "valid_targets_mean": 1999.4, "valid_targets_min": 711 }, { "epoch": 0.32091097308488614, "grad_norm": 0.6925465806852213, "learning_rate": 1.817109144542773e-05, "loss": 0.4275, "loss_nan_ranks": 0, "loss_rank_avg": 0.44604888558387756, "step": 155, "valid_targets_mean": 2645.6, "valid_targets_min": 915 }, { "epoch": 0.33126293995859213, "grad_norm": 0.6871016903538135, "learning_rate": 1.8761061946902657e-05, "loss": 0.3953, "loss_nan_ranks": 0, "loss_rank_avg": 0.4031655192375183, "step": 160, "valid_targets_mean": 2989.4, "valid_targets_min": 577 }, { "epoch": 0.3416149068322981, "grad_norm": 0.7772347914126068, "learning_rate": 1.935103244837758e-05, "loss": 0.3942, "loss_nan_ranks": 0, "loss_rank_avg": 0.4824008345603943, "step": 165, "valid_targets_mean": 2767.8, "valid_targets_min": 553 }, { "epoch": 0.35196687370600416, "grad_norm": 0.7369249527882769, "learning_rate": 1.9941002949852508e-05, "loss": 0.3649, "loss_nan_ranks": 0, "loss_rank_avg": 0.3546352982521057, "step": 170, "valid_targets_mean": 2191.2, "valid_targets_min": 709 }, { "epoch": 0.36231884057971014, "grad_norm": 0.7534283311389234, "learning_rate": 2.0530973451327435e-05, "loss": 0.3829, "loss_nan_ranks": 0, "loss_rank_avg": 0.3965192437171936, "step": 175, "valid_targets_mean": 2274.2, "valid_targets_min": 757 }, { "epoch": 0.37267080745341613, "grad_norm": 0.5744145884839316, "learning_rate": 2.1120943952802362e-05, "loss": 0.3689, "loss_nan_ranks": 0, "loss_rank_avg": 0.27616333961486816, "step": 180, "valid_targets_mean": 3288.3, "valid_targets_min": 754 }, { "epoch": 0.3830227743271222, "grad_norm": 0.7399447267515546, "learning_rate": 2.171091445427729e-05, "loss": 0.4155, "loss_nan_ranks": 0, "loss_rank_avg": 0.5079173445701599, "step": 185, "valid_targets_mean": 3585.9, "valid_targets_min": 305 }, { "epoch": 0.39337474120082816, "grad_norm": 0.787595577330117, "learning_rate": 2.2300884955752213e-05, "loss": 0.3672, "loss_nan_ranks": 0, "loss_rank_avg": 0.40638184547424316, "step": 190, "valid_targets_mean": 2532.8, "valid_targets_min": 501 }, { "epoch": 0.40372670807453415, "grad_norm": 0.8366148088688402, "learning_rate": 2.289085545722714e-05, "loss": 0.3903, "loss_nan_ranks": 0, "loss_rank_avg": 0.344083696603775, "step": 195, "valid_targets_mean": 1931.6, "valid_targets_min": 984 }, { "epoch": 0.4140786749482402, "grad_norm": 0.7049038068177579, "learning_rate": 2.3480825958702063e-05, "loss": 0.366, "loss_nan_ranks": 0, "loss_rank_avg": 0.3272162675857544, "step": 200, "valid_targets_mean": 2669.5, "valid_targets_min": 709 }, { "epoch": 0.4244306418219462, "grad_norm": 0.722982409943531, "learning_rate": 2.4070796460176994e-05, "loss": 0.4846, "loss_nan_ranks": 0, "loss_rank_avg": 0.4433075487613678, "step": 205, "valid_targets_mean": 2856.4, "valid_targets_min": 788 }, { "epoch": 0.43478260869565216, "grad_norm": 0.6216316854835306, "learning_rate": 2.466076696165192e-05, "loss": 0.3702, "loss_nan_ranks": 0, "loss_rank_avg": 0.3501080870628357, "step": 210, "valid_targets_mean": 2924.4, "valid_targets_min": 715 }, { "epoch": 0.4451345755693582, "grad_norm": 0.8036432318505198, "learning_rate": 2.5250737463126848e-05, "loss": 0.3722, "loss_nan_ranks": 0, "loss_rank_avg": 0.3556331992149353, "step": 215, "valid_targets_mean": 2358.1, "valid_targets_min": 835 }, { "epoch": 0.4554865424430642, "grad_norm": 0.9026688718475531, "learning_rate": 2.584070796460177e-05, "loss": 0.4376, "loss_nan_ranks": 0, "loss_rank_avg": 0.362284779548645, "step": 220, "valid_targets_mean": 1682.8, "valid_targets_min": 778 }, { "epoch": 0.4658385093167702, "grad_norm": 0.8474657010085218, "learning_rate": 2.64306784660767e-05, "loss": 0.3687, "loss_nan_ranks": 0, "loss_rank_avg": 0.41895484924316406, "step": 225, "valid_targets_mean": 1957.7, "valid_targets_min": 816 }, { "epoch": 0.47619047619047616, "grad_norm": 0.5989684265924352, "learning_rate": 2.7020648967551622e-05, "loss": 0.3956, "loss_nan_ranks": 0, "loss_rank_avg": 0.270280659198761, "step": 230, "valid_targets_mean": 3520.2, "valid_targets_min": 819 }, { "epoch": 0.4865424430641822, "grad_norm": 0.7407035731133066, "learning_rate": 2.761061946902655e-05, "loss": 0.3462, "loss_nan_ranks": 0, "loss_rank_avg": 0.33700358867645264, "step": 235, "valid_targets_mean": 3075.6, "valid_targets_min": 883 }, { "epoch": 0.4968944099378882, "grad_norm": 0.6514761903429114, "learning_rate": 2.8200589970501476e-05, "loss": 0.3657, "loss_nan_ranks": 0, "loss_rank_avg": 0.40764114260673523, "step": 240, "valid_targets_mean": 3008.0, "valid_targets_min": 524 }, { "epoch": 0.5072463768115942, "grad_norm": 0.9486281355398519, "learning_rate": 2.8790560471976407e-05, "loss": 0.2909, "loss_nan_ranks": 0, "loss_rank_avg": 0.3389992117881775, "step": 245, "valid_targets_mean": 2530.0, "valid_targets_min": 292 }, { "epoch": 0.5175983436853002, "grad_norm": 0.8255724854520955, "learning_rate": 2.938053097345133e-05, "loss": 0.387, "loss_nan_ranks": 0, "loss_rank_avg": 0.5169772505760193, "step": 250, "valid_targets_mean": 2672.6, "valid_targets_min": 633 }, { "epoch": 0.5279503105590062, "grad_norm": 0.744452870979198, "learning_rate": 2.9970501474926257e-05, "loss": 0.4064, "loss_nan_ranks": 0, "loss_rank_avg": 0.38283827900886536, "step": 255, "valid_targets_mean": 2401.8, "valid_targets_min": 1422 }, { "epoch": 0.5383022774327122, "grad_norm": 0.5635474379382327, "learning_rate": 3.0560471976401184e-05, "loss": 0.3819, "loss_nan_ranks": 0, "loss_rank_avg": 0.4241616725921631, "step": 260, "valid_targets_mean": 5410.8, "valid_targets_min": 754 }, { "epoch": 0.5486542443064182, "grad_norm": 0.676856787568286, "learning_rate": 3.115044247787611e-05, "loss": 0.3813, "loss_nan_ranks": 0, "loss_rank_avg": 0.534885823726654, "step": 265, "valid_targets_mean": 4032.4, "valid_targets_min": 601 }, { "epoch": 0.5590062111801242, "grad_norm": 0.685650100513104, "learning_rate": 3.174041297935103e-05, "loss": 0.3515, "loss_nan_ranks": 0, "loss_rank_avg": 0.34689125418663025, "step": 270, "valid_targets_mean": 2478.0, "valid_targets_min": 216 }, { "epoch": 0.5693581780538303, "grad_norm": 0.92365940319728, "learning_rate": 3.233038348082596e-05, "loss": 0.3328, "loss_nan_ranks": 0, "loss_rank_avg": 0.3527258038520813, "step": 275, "valid_targets_mean": 1704.9, "valid_targets_min": 211 }, { "epoch": 0.5797101449275363, "grad_norm": 0.7943251607272555, "learning_rate": 3.2920353982300886e-05, "loss": 0.3735, "loss_nan_ranks": 0, "loss_rank_avg": 0.31049463152885437, "step": 280, "valid_targets_mean": 1748.0, "valid_targets_min": 910 }, { "epoch": 0.5900621118012422, "grad_norm": 0.7707949131715036, "learning_rate": 3.3510324483775816e-05, "loss": 0.3549, "loss_nan_ranks": 0, "loss_rank_avg": 0.3978985548019409, "step": 285, "valid_targets_mean": 2196.7, "valid_targets_min": 345 }, { "epoch": 0.6004140786749482, "grad_norm": 0.9067101706634203, "learning_rate": 3.410029498525074e-05, "loss": 0.3773, "loss_nan_ranks": 0, "loss_rank_avg": 0.3796255588531494, "step": 290, "valid_targets_mean": 1666.6, "valid_targets_min": 912 }, { "epoch": 0.6107660455486542, "grad_norm": 0.49575725135513243, "learning_rate": 3.469026548672567e-05, "loss": 0.3283, "loss_nan_ranks": 0, "loss_rank_avg": 0.3226116895675659, "step": 295, "valid_targets_mean": 4260.1, "valid_targets_min": 783 }, { "epoch": 0.6211180124223602, "grad_norm": 0.7176031931898035, "learning_rate": 3.5280235988200594e-05, "loss": 0.3223, "loss_nan_ranks": 0, "loss_rank_avg": 0.32411545515060425, "step": 300, "valid_targets_mean": 2275.6, "valid_targets_min": 743 }, { "epoch": 0.6314699792960663, "grad_norm": 0.7663570928663194, "learning_rate": 3.587020648967552e-05, "loss": 0.3817, "loss_nan_ranks": 0, "loss_rank_avg": 0.3520033359527588, "step": 305, "valid_targets_mean": 2414.7, "valid_targets_min": 652 }, { "epoch": 0.6418219461697723, "grad_norm": 0.46213987326297384, "learning_rate": 3.646017699115044e-05, "loss": 0.323, "loss_nan_ranks": 0, "loss_rank_avg": 0.29329046607017517, "step": 310, "valid_targets_mean": 4565.9, "valid_targets_min": 647 }, { "epoch": 0.6521739130434783, "grad_norm": 0.6297790214422954, "learning_rate": 3.705014749262537e-05, "loss": 0.3365, "loss_nan_ranks": 0, "loss_rank_avg": 0.27002575993537903, "step": 315, "valid_targets_mean": 2892.7, "valid_targets_min": 784 }, { "epoch": 0.6625258799171843, "grad_norm": 0.6803152264658195, "learning_rate": 3.7640117994100295e-05, "loss": 0.3263, "loss_nan_ranks": 0, "loss_rank_avg": 0.35963690280914307, "step": 320, "valid_targets_mean": 2670.9, "valid_targets_min": 673 }, { "epoch": 0.6728778467908902, "grad_norm": 0.660475255702629, "learning_rate": 3.8230088495575226e-05, "loss": 0.3664, "loss_nan_ranks": 0, "loss_rank_avg": 0.3141520619392395, "step": 325, "valid_targets_mean": 2466.3, "valid_targets_min": 785 }, { "epoch": 0.6832298136645962, "grad_norm": 0.5714885591458042, "learning_rate": 3.882005899705015e-05, "loss": 0.3123, "loss_nan_ranks": 0, "loss_rank_avg": 0.2787840962409973, "step": 330, "valid_targets_mean": 2959.7, "valid_targets_min": 754 }, { "epoch": 0.6935817805383023, "grad_norm": 0.7840125701270887, "learning_rate": 3.941002949852508e-05, "loss": 0.3609, "loss_nan_ranks": 0, "loss_rank_avg": 0.3164142966270447, "step": 335, "valid_targets_mean": 3174.2, "valid_targets_min": 641 }, { "epoch": 0.7039337474120083, "grad_norm": 0.6419066522152682, "learning_rate": 4e-05, "loss": 0.3102, "loss_nan_ranks": 0, "loss_rank_avg": 0.30930954217910767, "step": 340, "valid_targets_mean": 3136.9, "valid_targets_min": 440 }, { "epoch": 0.7142857142857143, "grad_norm": 0.5059032670699602, "learning_rate": 3.999973336302744e-05, "loss": 0.3525, "loss_nan_ranks": 0, "loss_rank_avg": 0.25785183906555176, "step": 345, "valid_targets_mean": 3533.2, "valid_targets_min": 328 }, { "epoch": 0.7246376811594203, "grad_norm": 0.791626821129135, "learning_rate": 3.999893345921928e-05, "loss": 0.3358, "loss_nan_ranks": 0, "loss_rank_avg": 0.3422420918941498, "step": 350, "valid_targets_mean": 2178.9, "valid_targets_min": 640 }, { "epoch": 0.7349896480331263, "grad_norm": 0.5850437706333231, "learning_rate": 3.999760030990392e-05, "loss": 0.3754, "loss_nan_ranks": 0, "loss_rank_avg": 0.3285501003265381, "step": 355, "valid_targets_mean": 3447.8, "valid_targets_min": 1128 }, { "epoch": 0.7453416149068323, "grad_norm": 1.4793972289409643, "learning_rate": 3.999573395062805e-05, "loss": 0.3541, "loss_nan_ranks": 0, "loss_rank_avg": 0.4052942991256714, "step": 360, "valid_targets_mean": 2194.2, "valid_targets_min": 217 }, { "epoch": 0.7556935817805382, "grad_norm": 0.8161182629951351, "learning_rate": 3.9993334431155696e-05, "loss": 0.3496, "loss_nan_ranks": 0, "loss_rank_avg": 0.3312402367591858, "step": 365, "valid_targets_mean": 1771.2, "valid_targets_min": 664 }, { "epoch": 0.7660455486542443, "grad_norm": 0.7778042883063869, "learning_rate": 3.9990401815466935e-05, "loss": 0.3156, "loss_nan_ranks": 0, "loss_rank_avg": 0.39662399888038635, "step": 370, "valid_targets_mean": 2807.4, "valid_targets_min": 786 }, { "epoch": 0.7763975155279503, "grad_norm": 0.9868164908098449, "learning_rate": 3.9986936181756133e-05, "loss": 0.3484, "loss_nan_ranks": 0, "loss_rank_avg": 0.3773801326751709, "step": 375, "valid_targets_mean": 2612.4, "valid_targets_min": 1034 }, { "epoch": 0.7867494824016563, "grad_norm": 0.7554054875779739, "learning_rate": 3.9982937622429904e-05, "loss": 0.3218, "loss_nan_ranks": 0, "loss_rank_avg": 0.378534197807312, "step": 380, "valid_targets_mean": 2050.9, "valid_targets_min": 1109 }, { "epoch": 0.7971014492753623, "grad_norm": 0.6391636850831167, "learning_rate": 3.997840624410462e-05, "loss": 0.3325, "loss_nan_ranks": 0, "loss_rank_avg": 0.30764123797416687, "step": 385, "valid_targets_mean": 3234.5, "valid_targets_min": 958 }, { "epoch": 0.8074534161490683, "grad_norm": 0.659669602172271, "learning_rate": 3.997334216760358e-05, "loss": 0.3556, "loss_nan_ranks": 0, "loss_rank_avg": 0.2978909909725189, "step": 390, "valid_targets_mean": 4481.5, "valid_targets_min": 510 }, { "epoch": 0.8178053830227743, "grad_norm": 0.6718264239579972, "learning_rate": 3.996774552795379e-05, "loss": 0.3685, "loss_nan_ranks": 0, "loss_rank_avg": 0.3460586667060852, "step": 395, "valid_targets_mean": 2349.4, "valid_targets_min": 887 }, { "epoch": 0.8281573498964804, "grad_norm": 0.7476248873647089, "learning_rate": 3.996161647438236e-05, "loss": 0.3653, "loss_nan_ranks": 0, "loss_rank_avg": 0.3052156865596771, "step": 400, "valid_targets_mean": 2157.8, "valid_targets_min": 818 }, { "epoch": 0.8385093167701864, "grad_norm": 0.8223378901356958, "learning_rate": 3.9954955170312504e-05, "loss": 0.416, "loss_nan_ranks": 0, "loss_rank_avg": 0.4880888760089874, "step": 405, "valid_targets_mean": 3147.2, "valid_targets_min": 821 }, { "epoch": 0.8488612836438924, "grad_norm": 0.6823448035407557, "learning_rate": 3.994776179335923e-05, "loss": 0.3239, "loss_nan_ranks": 0, "loss_rank_avg": 0.3424914479255676, "step": 410, "valid_targets_mean": 2431.7, "valid_targets_min": 869 }, { "epoch": 0.8592132505175983, "grad_norm": 0.7312590665354671, "learning_rate": 3.9940036535324564e-05, "loss": 0.3355, "loss_nan_ranks": 0, "loss_rank_avg": 0.3406717777252197, "step": 415, "valid_targets_mean": 2271.6, "valid_targets_min": 400 }, { "epoch": 0.8695652173913043, "grad_norm": 0.6805623092937332, "learning_rate": 3.9931779602192435e-05, "loss": 0.3095, "loss_nan_ranks": 0, "loss_rank_avg": 0.35298052430152893, "step": 420, "valid_targets_mean": 2380.3, "valid_targets_min": 331 }, { "epoch": 0.8799171842650103, "grad_norm": 0.47734066638902245, "learning_rate": 3.9922991214123226e-05, "loss": 0.2681, "loss_nan_ranks": 0, "loss_rank_avg": 0.27308475971221924, "step": 425, "valid_targets_mean": 3988.6, "valid_targets_min": 570 }, { "epoch": 0.8902691511387164, "grad_norm": 0.5978371647266324, "learning_rate": 3.991367160544783e-05, "loss": 0.3574, "loss_nan_ranks": 0, "loss_rank_avg": 0.22311019897460938, "step": 430, "valid_targets_mean": 2887.8, "valid_targets_min": 663 }, { "epoch": 0.9006211180124224, "grad_norm": 0.5853594710092753, "learning_rate": 3.99038210246615e-05, "loss": 0.3862, "loss_nan_ranks": 0, "loss_rank_avg": 0.33275023102760315, "step": 435, "valid_targets_mean": 3190.8, "valid_targets_min": 750 }, { "epoch": 0.9109730848861284, "grad_norm": 0.6824932837618515, "learning_rate": 3.9893439734417125e-05, "loss": 0.3382, "loss_nan_ranks": 0, "loss_rank_avg": 0.2892998158931732, "step": 440, "valid_targets_mean": 2007.6, "valid_targets_min": 937 }, { "epoch": 0.9213250517598344, "grad_norm": 0.7388214988568738, "learning_rate": 3.9882528011518286e-05, "loss": 0.3598, "loss_nan_ranks": 0, "loss_rank_avg": 0.4132966697216034, "step": 445, "valid_targets_mean": 2261.5, "valid_targets_min": 747 }, { "epoch": 0.9316770186335404, "grad_norm": 0.6447680427593593, "learning_rate": 3.987108614691186e-05, "loss": 0.3628, "loss_nan_ranks": 0, "loss_rank_avg": 0.3517792522907257, "step": 450, "valid_targets_mean": 2310.1, "valid_targets_min": 918 }, { "epoch": 0.9420289855072463, "grad_norm": 0.679191901913392, "learning_rate": 3.985911444568026e-05, "loss": 0.3478, "loss_nan_ranks": 0, "loss_rank_avg": 0.2909126877784729, "step": 455, "valid_targets_mean": 2311.9, "valid_targets_min": 742 }, { "epoch": 0.9523809523809523, "grad_norm": 0.793829538406422, "learning_rate": 3.9846613227033305e-05, "loss": 0.3663, "loss_nan_ranks": 0, "loss_rank_avg": 0.34115058183670044, "step": 460, "valid_targets_mean": 2087.2, "valid_targets_min": 708 }, { "epoch": 0.9627329192546584, "grad_norm": 0.5926367081080217, "learning_rate": 3.98335828242997e-05, "loss": 0.3408, "loss_nan_ranks": 0, "loss_rank_avg": 0.2802141606807709, "step": 465, "valid_targets_mean": 2543.6, "valid_targets_min": 821 }, { "epoch": 0.9730848861283644, "grad_norm": 0.5823847098766494, "learning_rate": 3.982002358491817e-05, "loss": 0.3349, "loss_nan_ranks": 0, "loss_rank_avg": 0.293674111366272, "step": 470, "valid_targets_mean": 2787.9, "valid_targets_min": 404 }, { "epoch": 0.9834368530020704, "grad_norm": 0.7514989296192166, "learning_rate": 3.980593587042816e-05, "loss": 0.359, "loss_nan_ranks": 0, "loss_rank_avg": 0.3089297413825989, "step": 475, "valid_targets_mean": 2357.3, "valid_targets_min": 617 }, { "epoch": 0.9937888198757764, "grad_norm": 0.7508286456561156, "learning_rate": 3.979132005646022e-05, "loss": 0.3045, "loss_nan_ranks": 0, "loss_rank_avg": 0.2705974578857422, "step": 480, "valid_targets_mean": 2060.9, "valid_targets_min": 495 }, { "epoch": 1.0041407867494825, "grad_norm": 0.578303130786325, "learning_rate": 3.9776176532726005e-05, "loss": 0.3067, "loss_nan_ranks": 0, "loss_rank_avg": 0.23351214826107025, "step": 485, "valid_targets_mean": 2921.1, "valid_targets_min": 862 }, { "epoch": 1.0144927536231885, "grad_norm": 0.8565681891585248, "learning_rate": 3.976050570300783e-05, "loss": 0.3846, "loss_nan_ranks": 0, "loss_rank_avg": 0.4955739974975586, "step": 490, "valid_targets_mean": 2399.9, "valid_targets_min": 397 }, { "epoch": 1.0248447204968945, "grad_norm": 0.8525085460239903, "learning_rate": 3.974430798514796e-05, "loss": 0.2587, "loss_nan_ranks": 0, "loss_rank_avg": 0.34586983919143677, "step": 495, "valid_targets_mean": 3405.7, "valid_targets_min": 692 }, { "epoch": 1.0351966873706004, "grad_norm": 0.6107145043153749, "learning_rate": 3.972758381103744e-05, "loss": 0.3328, "loss_nan_ranks": 0, "loss_rank_avg": 0.25020384788513184, "step": 500, "valid_targets_mean": 2676.7, "valid_targets_min": 693 }, { "epoch": 1.0455486542443064, "grad_norm": 0.3712861445621319, "learning_rate": 3.9710333626604585e-05, "loss": 0.2865, "loss_nan_ranks": 0, "loss_rank_avg": 0.2056269347667694, "step": 505, "valid_targets_mean": 5489.6, "valid_targets_min": 677 }, { "epoch": 1.0559006211180124, "grad_norm": 0.5445195023826013, "learning_rate": 3.969255789180309e-05, "loss": 0.3549, "loss_nan_ranks": 0, "loss_rank_avg": 0.3427426815032959, "step": 510, "valid_targets_mean": 4128.8, "valid_targets_min": 909 }, { "epoch": 1.0662525879917184, "grad_norm": 1.5522590817967603, "learning_rate": 3.9674257080599775e-05, "loss": 0.3005, "loss_nan_ranks": 0, "loss_rank_avg": 0.3245624303817749, "step": 515, "valid_targets_mean": 2571.8, "valid_targets_min": 988 }, { "epoch": 1.0766045548654244, "grad_norm": 0.7670802874384615, "learning_rate": 3.9655431680961924e-05, "loss": 0.3012, "loss_nan_ranks": 0, "loss_rank_avg": 0.3730795085430145, "step": 520, "valid_targets_mean": 2089.7, "valid_targets_min": 509 }, { "epoch": 1.0869565217391304, "grad_norm": 0.8808573279945764, "learning_rate": 3.9636082194844285e-05, "loss": 0.3202, "loss_nan_ranks": 0, "loss_rank_avg": 0.31017860770225525, "step": 525, "valid_targets_mean": 2748.6, "valid_targets_min": 746 }, { "epoch": 1.0973084886128364, "grad_norm": 0.5678915273276016, "learning_rate": 3.9616209138175705e-05, "loss": 0.3206, "loss_nan_ranks": 0, "loss_rank_avg": 0.3231387436389923, "step": 530, "valid_targets_mean": 3620.4, "valid_targets_min": 1076 }, { "epoch": 1.1076604554865424, "grad_norm": 0.6715392961412922, "learning_rate": 3.959581304084536e-05, "loss": 0.3538, "loss_nan_ranks": 0, "loss_rank_avg": 0.42259538173675537, "step": 535, "valid_targets_mean": 4127.1, "valid_targets_min": 406 }, { "epoch": 1.1180124223602483, "grad_norm": 0.6122700992261885, "learning_rate": 3.9574894446688594e-05, "loss": 0.3044, "loss_nan_ranks": 0, "loss_rank_avg": 0.323467493057251, "step": 540, "valid_targets_mean": 3492.6, "valid_targets_min": 684 }, { "epoch": 1.1283643892339545, "grad_norm": 0.8429230339257078, "learning_rate": 3.955345391347249e-05, "loss": 0.3377, "loss_nan_ranks": 0, "loss_rank_avg": 0.45265573263168335, "step": 545, "valid_targets_mean": 2018.4, "valid_targets_min": 873 }, { "epoch": 1.1387163561076605, "grad_norm": 0.5177578813671116, "learning_rate": 3.9531492012880915e-05, "loss": 0.272, "loss_nan_ranks": 0, "loss_rank_avg": 0.24492105841636658, "step": 550, "valid_targets_mean": 3538.9, "valid_targets_min": 631 }, { "epoch": 1.1490683229813665, "grad_norm": 0.9358791063800329, "learning_rate": 3.9509009330499356e-05, "loss": 0.3029, "loss_nan_ranks": 0, "loss_rank_avg": 0.3208366632461548, "step": 555, "valid_targets_mean": 2221.3, "valid_targets_min": 735 }, { "epoch": 1.1594202898550725, "grad_norm": 1.492654485940082, "learning_rate": 3.948600646579923e-05, "loss": 0.3741, "loss_nan_ranks": 0, "loss_rank_avg": 0.30150753259658813, "step": 560, "valid_targets_mean": 1951.8, "valid_targets_min": 508 }, { "epoch": 1.1697722567287785, "grad_norm": 0.5458431310144255, "learning_rate": 3.946248403212197e-05, "loss": 0.325, "loss_nan_ranks": 0, "loss_rank_avg": 0.34849831461906433, "step": 565, "valid_targets_mean": 4525.2, "valid_targets_min": 886 }, { "epoch": 1.1801242236024845, "grad_norm": 1.3216443391427874, "learning_rate": 3.943844265666263e-05, "loss": 0.3464, "loss_nan_ranks": 0, "loss_rank_avg": 0.2811647057533264, "step": 570, "valid_targets_mean": 2566.6, "valid_targets_min": 931 }, { "epoch": 1.1904761904761905, "grad_norm": 0.5379526619584627, "learning_rate": 3.9413882980453155e-05, "loss": 0.3001, "loss_nan_ranks": 0, "loss_rank_avg": 0.2871326506137848, "step": 575, "valid_targets_mean": 3341.6, "valid_targets_min": 752 }, { "epoch": 1.2008281573498965, "grad_norm": 0.5970973416160769, "learning_rate": 3.9388805658345325e-05, "loss": 0.3592, "loss_nan_ranks": 0, "loss_rank_avg": 0.32768434286117554, "step": 580, "valid_targets_mean": 4324.7, "valid_targets_min": 686 }, { "epoch": 1.2111801242236024, "grad_norm": 0.7650985133734655, "learning_rate": 3.9363211358993264e-05, "loss": 0.3126, "loss_nan_ranks": 0, "loss_rank_avg": 0.35999956727027893, "step": 585, "valid_targets_mean": 2116.5, "valid_targets_min": 709 }, { "epoch": 1.2215320910973084, "grad_norm": 0.6626315464935324, "learning_rate": 3.9337100764835616e-05, "loss": 0.2653, "loss_nan_ranks": 0, "loss_rank_avg": 0.17115123569965363, "step": 590, "valid_targets_mean": 4721.6, "valid_targets_min": 590 }, { "epoch": 1.2318840579710144, "grad_norm": 0.608747167208178, "learning_rate": 3.931047457207736e-05, "loss": 0.3522, "loss_nan_ranks": 0, "loss_rank_avg": 0.3361900746822357, "step": 595, "valid_targets_mean": 3093.6, "valid_targets_min": 1291 }, { "epoch": 1.2422360248447206, "grad_norm": 0.7141578114058345, "learning_rate": 3.928333349067125e-05, "loss": 0.2756, "loss_nan_ranks": 0, "loss_rank_avg": 0.3286536931991577, "step": 600, "valid_targets_mean": 2283.4, "valid_targets_min": 402 }, { "epoch": 1.2525879917184266, "grad_norm": 0.5678041106872164, "learning_rate": 3.925567824429885e-05, "loss": 0.2724, "loss_nan_ranks": 0, "loss_rank_avg": 0.29660943150520325, "step": 605, "valid_targets_mean": 3684.8, "valid_targets_min": 1120 }, { "epoch": 1.2629399585921326, "grad_norm": 0.722727884026502, "learning_rate": 3.922750957035128e-05, "loss": 0.3036, "loss_nan_ranks": 0, "loss_rank_avg": 0.2989663779735565, "step": 610, "valid_targets_mean": 2112.3, "valid_targets_min": 371 }, { "epoch": 1.2732919254658386, "grad_norm": 0.5666973822209642, "learning_rate": 3.919882821990953e-05, "loss": 0.3165, "loss_nan_ranks": 0, "loss_rank_avg": 0.28699982166290283, "step": 615, "valid_targets_mean": 3570.9, "valid_targets_min": 780 }, { "epoch": 1.2836438923395446, "grad_norm": 0.6949218726412446, "learning_rate": 3.9169634957724465e-05, "loss": 0.2894, "loss_nan_ranks": 0, "loss_rank_avg": 0.2630559206008911, "step": 620, "valid_targets_mean": 1976.1, "valid_targets_min": 216 }, { "epoch": 1.2939958592132506, "grad_norm": 0.7553316125934354, "learning_rate": 3.913993056219636e-05, "loss": 0.3238, "loss_nan_ranks": 0, "loss_rank_avg": 0.3031398057937622, "step": 625, "valid_targets_mean": 2566.6, "valid_targets_min": 1097 }, { "epoch": 1.3043478260869565, "grad_norm": 0.6012551894727312, "learning_rate": 3.9109715825354254e-05, "loss": 0.2841, "loss_nan_ranks": 0, "loss_rank_avg": 0.30872005224227905, "step": 630, "valid_targets_mean": 2901.4, "valid_targets_min": 884 }, { "epoch": 1.3146997929606625, "grad_norm": 0.6499249693828386, "learning_rate": 3.907899155283472e-05, "loss": 0.3054, "loss_nan_ranks": 0, "loss_rank_avg": 0.2922044098377228, "step": 635, "valid_targets_mean": 2478.1, "valid_targets_min": 644 }, { "epoch": 1.3250517598343685, "grad_norm": 0.6607109178219058, "learning_rate": 3.904775856386047e-05, "loss": 0.3008, "loss_nan_ranks": 0, "loss_rank_avg": 0.32309627532958984, "step": 640, "valid_targets_mean": 2581.8, "valid_targets_min": 822 }, { "epoch": 1.3354037267080745, "grad_norm": 0.99359277719902, "learning_rate": 3.9016017691218465e-05, "loss": 0.3148, "loss_nan_ranks": 0, "loss_rank_avg": 0.3399587869644165, "step": 645, "valid_targets_mean": 2634.0, "valid_targets_min": 780 }, { "epoch": 1.3457556935817805, "grad_norm": 0.6998735259668638, "learning_rate": 3.8983769781237725e-05, "loss": 0.3, "loss_nan_ranks": 0, "loss_rank_avg": 0.35572707653045654, "step": 650, "valid_targets_mean": 2802.4, "valid_targets_min": 288 }, { "epoch": 1.3561076604554865, "grad_norm": 0.6543925730470436, "learning_rate": 3.8951015693766755e-05, "loss": 0.2875, "loss_nan_ranks": 0, "loss_rank_avg": 0.3457895815372467, "step": 655, "valid_targets_mean": 2723.4, "valid_targets_min": 1094 }, { "epoch": 1.3664596273291925, "grad_norm": 0.867046377934047, "learning_rate": 3.8917756302150627e-05, "loss": 0.283, "loss_nan_ranks": 0, "loss_rank_avg": 0.34926313161849976, "step": 660, "valid_targets_mean": 2280.2, "valid_targets_min": 697 }, { "epoch": 1.3768115942028984, "grad_norm": 0.8720982266233283, "learning_rate": 3.8883992493207696e-05, "loss": 0.3581, "loss_nan_ranks": 0, "loss_rank_avg": 0.3935870826244354, "step": 665, "valid_targets_mean": 2969.8, "valid_targets_min": 848 }, { "epoch": 1.3871635610766044, "grad_norm": 0.7607813486400433, "learning_rate": 3.8849725167205934e-05, "loss": 0.376, "loss_nan_ranks": 0, "loss_rank_avg": 0.35601186752319336, "step": 670, "valid_targets_mean": 2010.1, "valid_targets_min": 625 }, { "epoch": 1.3975155279503104, "grad_norm": 0.6244741241809822, "learning_rate": 3.8814955237838954e-05, "loss": 0.3097, "loss_nan_ranks": 0, "loss_rank_avg": 0.33208197355270386, "step": 675, "valid_targets_mean": 2881.0, "valid_targets_min": 633 }, { "epoch": 1.4078674948240166, "grad_norm": 0.701432966146093, "learning_rate": 3.8779683632201625e-05, "loss": 0.3234, "loss_nan_ranks": 0, "loss_rank_avg": 0.2493334263563156, "step": 680, "valid_targets_mean": 2480.6, "valid_targets_min": 726 }, { "epoch": 1.4182194616977226, "grad_norm": 0.6386263618060875, "learning_rate": 3.8743911290765354e-05, "loss": 0.3563, "loss_nan_ranks": 0, "loss_rank_avg": 0.33178985118865967, "step": 685, "valid_targets_mean": 2496.4, "valid_targets_min": 555 }, { "epoch": 1.4285714285714286, "grad_norm": 0.7163290212539811, "learning_rate": 3.870763916735303e-05, "loss": 0.3221, "loss_nan_ranks": 0, "loss_rank_avg": 0.42771202325820923, "step": 690, "valid_targets_mean": 2670.1, "valid_targets_min": 305 }, { "epoch": 1.4389233954451346, "grad_norm": 0.6173973599046334, "learning_rate": 3.867086822911358e-05, "loss": 0.3036, "loss_nan_ranks": 0, "loss_rank_avg": 0.3355981111526489, "step": 695, "valid_targets_mean": 4034.1, "valid_targets_min": 960 }, { "epoch": 1.4492753623188406, "grad_norm": 0.593581318712642, "learning_rate": 3.863359945649615e-05, "loss": 0.2928, "loss_nan_ranks": 0, "loss_rank_avg": 0.3260822296142578, "step": 700, "valid_targets_mean": 3011.0, "valid_targets_min": 566 }, { "epoch": 1.4596273291925466, "grad_norm": 0.7037825237005169, "learning_rate": 3.859583384322402e-05, "loss": 0.3314, "loss_nan_ranks": 0, "loss_rank_avg": 0.2873789072036743, "step": 705, "valid_targets_mean": 2114.8, "valid_targets_min": 281 }, { "epoch": 1.4699792960662525, "grad_norm": 0.4809742053953339, "learning_rate": 3.855757239626807e-05, "loss": 0.2784, "loss_nan_ranks": 0, "loss_rank_avg": 0.3173772394657135, "step": 710, "valid_targets_mean": 5494.3, "valid_targets_min": 313 }, { "epoch": 1.4803312629399585, "grad_norm": 0.7992784007276763, "learning_rate": 3.851881613581993e-05, "loss": 0.3428, "loss_nan_ranks": 0, "loss_rank_avg": 0.37110865116119385, "step": 715, "valid_targets_mean": 1696.1, "valid_targets_min": 613 }, { "epoch": 1.4906832298136645, "grad_norm": 0.7460466376190822, "learning_rate": 3.847956609526481e-05, "loss": 0.2999, "loss_nan_ranks": 0, "loss_rank_avg": 0.36755889654159546, "step": 720, "valid_targets_mean": 2678.8, "valid_targets_min": 551 }, { "epoch": 1.5010351966873707, "grad_norm": 0.8015485930507722, "learning_rate": 3.843982332115389e-05, "loss": 0.3648, "loss_nan_ranks": 0, "loss_rank_avg": 0.5440657734870911, "step": 725, "valid_targets_mean": 3186.0, "valid_targets_min": 435 }, { "epoch": 1.5113871635610767, "grad_norm": 0.6245802617185957, "learning_rate": 3.839958887317649e-05, "loss": 0.2775, "loss_nan_ranks": 0, "loss_rank_avg": 0.27157890796661377, "step": 730, "valid_targets_mean": 2370.6, "valid_targets_min": 787 }, { "epoch": 1.5217391304347827, "grad_norm": 0.8406585786723727, "learning_rate": 3.8358863824131726e-05, "loss": 0.3012, "loss_nan_ranks": 0, "loss_rank_avg": 0.3849491477012634, "step": 735, "valid_targets_mean": 2885.7, "valid_targets_min": 728 }, { "epoch": 1.5320910973084887, "grad_norm": 0.6705418668893592, "learning_rate": 3.831764925989999e-05, "loss": 0.3017, "loss_nan_ranks": 0, "loss_rank_avg": 0.2597661018371582, "step": 740, "valid_targets_mean": 2369.4, "valid_targets_min": 777 }, { "epoch": 1.5424430641821947, "grad_norm": 0.7570661925654296, "learning_rate": 3.8275946279413946e-05, "loss": 0.3126, "loss_nan_ranks": 0, "loss_rank_avg": 0.4379417598247528, "step": 745, "valid_targets_mean": 3104.5, "valid_targets_min": 709 }, { "epoch": 1.5527950310559007, "grad_norm": 0.7568141088774238, "learning_rate": 3.823375599462924e-05, "loss": 0.315, "loss_nan_ranks": 0, "loss_rank_avg": 0.3063448667526245, "step": 750, "valid_targets_mean": 1793.1, "valid_targets_min": 583 }, { "epoch": 1.5631469979296067, "grad_norm": 0.5008197907800821, "learning_rate": 3.819107953049485e-05, "loss": 0.2838, "loss_nan_ranks": 0, "loss_rank_avg": 0.23246562480926514, "step": 755, "valid_targets_mean": 3298.4, "valid_targets_min": 741 }, { "epoch": 1.5734989648033126, "grad_norm": 0.6451644332169639, "learning_rate": 3.814791802492309e-05, "loss": 0.3332, "loss_nan_ranks": 0, "loss_rank_avg": 0.4341411888599396, "step": 760, "valid_targets_mean": 3766.1, "valid_targets_min": 550 }, { "epoch": 1.5838509316770186, "grad_norm": 0.6316711474608361, "learning_rate": 3.810427262875928e-05, "loss": 0.3632, "loss_nan_ranks": 0, "loss_rank_avg": 0.40523141622543335, "step": 765, "valid_targets_mean": 2900.8, "valid_targets_min": 549 }, { "epoch": 1.5942028985507246, "grad_norm": 0.6559079761601386, "learning_rate": 3.8060144505751066e-05, "loss": 0.3555, "loss_nan_ranks": 0, "loss_rank_avg": 0.3753317594528198, "step": 770, "valid_targets_mean": 2754.6, "valid_targets_min": 923 }, { "epoch": 1.6045548654244306, "grad_norm": 0.8409357657293262, "learning_rate": 3.8015534832517346e-05, "loss": 0.2647, "loss_nan_ranks": 0, "loss_rank_avg": 0.31297141313552856, "step": 775, "valid_targets_mean": 1537.7, "valid_targets_min": 400 }, { "epoch": 1.6149068322981366, "grad_norm": 0.5230610037042105, "learning_rate": 3.797044479851693e-05, "loss": 0.3394, "loss_nan_ranks": 0, "loss_rank_avg": 0.34146177768707275, "step": 780, "valid_targets_mean": 4368.2, "valid_targets_min": 564 }, { "epoch": 1.6252587991718426, "grad_norm": 0.8017960578186035, "learning_rate": 3.7924875606016856e-05, "loss": 0.3011, "loss_nan_ranks": 0, "loss_rank_avg": 0.31278154253959656, "step": 785, "valid_targets_mean": 2435.0, "valid_targets_min": 309 }, { "epoch": 1.6356107660455486, "grad_norm": 0.7307900776630412, "learning_rate": 3.7878828470060274e-05, "loss": 0.2563, "loss_nan_ranks": 0, "loss_rank_avg": 0.24949385225772858, "step": 790, "valid_targets_mean": 1969.8, "valid_targets_min": 689 }, { "epoch": 1.6459627329192545, "grad_norm": 0.6089402692068703, "learning_rate": 3.783230461843406e-05, "loss": 0.3037, "loss_nan_ranks": 0, "loss_rank_avg": 0.2793858051300049, "step": 795, "valid_targets_mean": 2419.0, "valid_targets_min": 303 }, { "epoch": 1.6563146997929605, "grad_norm": 0.604875615097612, "learning_rate": 3.7785305291636126e-05, "loss": 0.3101, "loss_nan_ranks": 0, "loss_rank_avg": 0.35383036732673645, "step": 800, "valid_targets_mean": 2854.2, "valid_targets_min": 666 }, { "epoch": 1.6666666666666665, "grad_norm": 0.7840139460025201, "learning_rate": 3.773783174284228e-05, "loss": 0.293, "loss_nan_ranks": 0, "loss_rank_avg": 0.270771324634552, "step": 805, "valid_targets_mean": 1783.1, "valid_targets_min": 597 }, { "epoch": 1.6770186335403725, "grad_norm": 0.5439330951892583, "learning_rate": 3.768988523787287e-05, "loss": 0.3221, "loss_nan_ranks": 0, "loss_rank_avg": 0.2746136784553528, "step": 810, "valid_targets_mean": 3407.2, "valid_targets_min": 459 }, { "epoch": 1.6873706004140787, "grad_norm": 0.707062238751807, "learning_rate": 3.764146705515898e-05, "loss": 0.2841, "loss_nan_ranks": 0, "loss_rank_avg": 0.30619674921035767, "step": 815, "valid_targets_mean": 2142.9, "valid_targets_min": 923 }, { "epoch": 1.6977225672877847, "grad_norm": 0.6851395668736608, "learning_rate": 3.759257848570838e-05, "loss": 0.3534, "loss_nan_ranks": 0, "loss_rank_avg": 0.5384789705276489, "step": 820, "valid_targets_mean": 3692.9, "valid_targets_min": 642 }, { "epoch": 1.7080745341614907, "grad_norm": 0.6969892105656047, "learning_rate": 3.754322083307107e-05, "loss": 0.3032, "loss_nan_ranks": 0, "loss_rank_avg": 0.34344714879989624, "step": 825, "valid_targets_mean": 2168.1, "valid_targets_min": 880 }, { "epoch": 1.7184265010351967, "grad_norm": 0.6350233312646498, "learning_rate": 3.749339541330457e-05, "loss": 0.3013, "loss_nan_ranks": 0, "loss_rank_avg": 0.21109239757061005, "step": 830, "valid_targets_mean": 2116.4, "valid_targets_min": 518 }, { "epoch": 1.7287784679089027, "grad_norm": 0.6242925285847643, "learning_rate": 3.7443103554938794e-05, "loss": 0.3074, "loss_nan_ranks": 0, "loss_rank_avg": 0.35286158323287964, "step": 835, "valid_targets_mean": 2796.6, "valid_targets_min": 347 }, { "epoch": 1.7391304347826086, "grad_norm": 0.7068835221058171, "learning_rate": 3.739234659894062e-05, "loss": 0.2794, "loss_nan_ranks": 0, "loss_rank_avg": 0.27447009086608887, "step": 840, "valid_targets_mean": 1944.8, "valid_targets_min": 488 }, { "epoch": 1.7494824016563149, "grad_norm": 0.7775094105121269, "learning_rate": 3.7341125898678154e-05, "loss": 0.3409, "loss_nan_ranks": 0, "loss_rank_avg": 0.3335605561733246, "step": 845, "valid_targets_mean": 2268.7, "valid_targets_min": 655 }, { "epoch": 1.7598343685300208, "grad_norm": 0.7026899191258092, "learning_rate": 3.7289442819884644e-05, "loss": 0.3313, "loss_nan_ranks": 0, "loss_rank_avg": 0.3098892867565155, "step": 850, "valid_targets_mean": 2165.6, "valid_targets_min": 886 }, { "epoch": 1.7701863354037268, "grad_norm": 0.7785694411643936, "learning_rate": 3.723729874062206e-05, "loss": 0.3383, "loss_nan_ranks": 0, "loss_rank_avg": 0.5063181519508362, "step": 855, "valid_targets_mean": 3067.9, "valid_targets_min": 845 }, { "epoch": 1.7805383022774328, "grad_norm": 0.6864346250242391, "learning_rate": 3.718469505124434e-05, "loss": 0.3438, "loss_nan_ranks": 0, "loss_rank_avg": 0.30108267068862915, "step": 860, "valid_targets_mean": 2758.5, "valid_targets_min": 747 }, { "epoch": 1.7908902691511388, "grad_norm": 0.6688063851094667, "learning_rate": 3.7131633154360336e-05, "loss": 0.2891, "loss_nan_ranks": 0, "loss_rank_avg": 0.3029250204563141, "step": 865, "valid_targets_mean": 2407.8, "valid_targets_min": 945 }, { "epoch": 1.8012422360248448, "grad_norm": 0.6814618177356577, "learning_rate": 3.707811446479639e-05, "loss": 0.2774, "loss_nan_ranks": 0, "loss_rank_avg": 0.3125041127204895, "step": 870, "valid_targets_mean": 2367.2, "valid_targets_min": 1157 }, { "epoch": 1.8115942028985508, "grad_norm": 0.6124859430419072, "learning_rate": 3.702414040955866e-05, "loss": 0.3282, "loss_nan_ranks": 0, "loss_rank_avg": 0.33444851636886597, "step": 875, "valid_targets_mean": 2857.4, "valid_targets_min": 789 }, { "epoch": 1.8219461697722568, "grad_norm": 0.5332243076283965, "learning_rate": 3.696971242779499e-05, "loss": 0.2784, "loss_nan_ranks": 0, "loss_rank_avg": 0.30144771933555603, "step": 880, "valid_targets_mean": 3346.8, "valid_targets_min": 734 }, { "epoch": 1.8322981366459627, "grad_norm": 0.6418575705848031, "learning_rate": 3.691483197075664e-05, "loss": 0.314, "loss_nan_ranks": 0, "loss_rank_avg": 0.2444503903388977, "step": 885, "valid_targets_mean": 2092.2, "valid_targets_min": 707 }, { "epoch": 1.8426501035196687, "grad_norm": 0.6840565309784318, "learning_rate": 3.685950050175946e-05, "loss": 0.2981, "loss_nan_ranks": 0, "loss_rank_avg": 0.3534913659095764, "step": 890, "valid_targets_mean": 2626.1, "valid_targets_min": 883 }, { "epoch": 1.8530020703933747, "grad_norm": 0.6411961833023883, "learning_rate": 3.680371949614503e-05, "loss": 0.3, "loss_nan_ranks": 0, "loss_rank_avg": 0.3057364523410797, "step": 895, "valid_targets_mean": 2653.8, "valid_targets_min": 788 }, { "epoch": 1.8633540372670807, "grad_norm": 0.734143938781199, "learning_rate": 3.6747490441241166e-05, "loss": 0.3165, "loss_nan_ranks": 0, "loss_rank_avg": 0.2625513970851898, "step": 900, "valid_targets_mean": 1966.4, "valid_targets_min": 342 }, { "epoch": 1.8737060041407867, "grad_norm": 0.6002740004630833, "learning_rate": 3.669081483632238e-05, "loss": 0.2464, "loss_nan_ranks": 0, "loss_rank_avg": 0.24936066567897797, "step": 905, "valid_targets_mean": 2350.6, "valid_targets_min": 581 }, { "epoch": 1.8840579710144927, "grad_norm": 0.6634082462286021, "learning_rate": 3.6633694192569835e-05, "loss": 0.2822, "loss_nan_ranks": 0, "loss_rank_avg": 0.2440337836742401, "step": 910, "valid_targets_mean": 2182.1, "valid_targets_min": 768 }, { "epoch": 1.8944099378881987, "grad_norm": 0.6598417402185687, "learning_rate": 3.657613003303109e-05, "loss": 0.3533, "loss_nan_ranks": 0, "loss_rank_avg": 0.3100677728652954, "step": 915, "valid_targets_mean": 2527.1, "valid_targets_min": 869 }, { "epoch": 1.9047619047619047, "grad_norm": 0.7136251407724076, "learning_rate": 3.651812389257947e-05, "loss": 0.3177, "loss_nan_ranks": 0, "loss_rank_avg": 0.40685153007507324, "step": 920, "valid_targets_mean": 2883.4, "valid_targets_min": 438 }, { "epoch": 1.9151138716356106, "grad_norm": 0.8221505552013975, "learning_rate": 3.645967731787313e-05, "loss": 0.2988, "loss_nan_ranks": 0, "loss_rank_avg": 0.348793625831604, "step": 925, "valid_targets_mean": 1815.2, "valid_targets_min": 471 }, { "epoch": 1.9254658385093166, "grad_norm": 0.6714962697810101, "learning_rate": 3.640079186731385e-05, "loss": 0.2772, "loss_nan_ranks": 0, "loss_rank_avg": 0.3066626787185669, "step": 930, "valid_targets_mean": 2163.9, "valid_targets_min": 739 }, { "epoch": 1.9358178053830226, "grad_norm": 0.8603452197126946, "learning_rate": 3.634146911100547e-05, "loss": 0.3325, "loss_nan_ranks": 0, "loss_rank_avg": 0.3235263228416443, "step": 935, "valid_targets_mean": 2000.6, "valid_targets_min": 778 }, { "epoch": 1.9461697722567288, "grad_norm": 0.8181375628740634, "learning_rate": 3.6281710630711984e-05, "loss": 0.3459, "loss_nan_ranks": 0, "loss_rank_avg": 0.33535006642341614, "step": 940, "valid_targets_mean": 2283.9, "valid_targets_min": 787 }, { "epoch": 1.9565217391304348, "grad_norm": 0.7661975352385241, "learning_rate": 3.6221518019815436e-05, "loss": 0.3142, "loss_nan_ranks": 0, "loss_rank_avg": 0.32310929894447327, "step": 945, "valid_targets_mean": 2044.9, "valid_targets_min": 870 }, { "epoch": 1.9668737060041408, "grad_norm": 0.7546886437201982, "learning_rate": 3.616089288327336e-05, "loss": 0.2886, "loss_nan_ranks": 0, "loss_rank_avg": 0.3442019522190094, "step": 950, "valid_targets_mean": 2058.4, "valid_targets_min": 908 }, { "epoch": 1.9772256728778468, "grad_norm": 0.6284194122874336, "learning_rate": 3.609983683757606e-05, "loss": 0.3189, "loss_nan_ranks": 0, "loss_rank_avg": 0.41605764627456665, "step": 955, "valid_targets_mean": 4267.4, "valid_targets_min": 939 }, { "epoch": 1.9875776397515528, "grad_norm": 0.565257067101154, "learning_rate": 3.603835151070345e-05, "loss": 0.2715, "loss_nan_ranks": 0, "loss_rank_avg": 0.27033889293670654, "step": 960, "valid_targets_mean": 3668.6, "valid_targets_min": 912 }, { "epoch": 1.9979296066252588, "grad_norm": 0.6360153374329626, "learning_rate": 3.5976438542081666e-05, "loss": 0.2872, "loss_nan_ranks": 0, "loss_rank_avg": 0.2408621609210968, "step": 965, "valid_targets_mean": 2069.4, "valid_targets_min": 774 }, { "epoch": 2.008281573498965, "grad_norm": 0.6357166576139243, "learning_rate": 3.591409958253937e-05, "loss": 0.2626, "loss_nan_ranks": 0, "loss_rank_avg": 0.2636573612689972, "step": 970, "valid_targets_mean": 2536.4, "valid_targets_min": 622 }, { "epoch": 2.018633540372671, "grad_norm": 0.6716098344095058, "learning_rate": 3.5851336294263696e-05, "loss": 0.2427, "loss_nan_ranks": 0, "loss_rank_avg": 0.25086358189582825, "step": 975, "valid_targets_mean": 2756.8, "valid_targets_min": 1130 }, { "epoch": 2.028985507246377, "grad_norm": 0.4956351374220249, "learning_rate": 3.578815035075597e-05, "loss": 0.2524, "loss_nan_ranks": 0, "loss_rank_avg": 0.2566456198692322, "step": 980, "valid_targets_mean": 5390.4, "valid_targets_min": 815 }, { "epoch": 2.039337474120083, "grad_norm": 0.7064220242643727, "learning_rate": 3.572454343678705e-05, "loss": 0.2702, "loss_nan_ranks": 0, "loss_rank_avg": 0.2861258387565613, "step": 985, "valid_targets_mean": 2059.2, "valid_targets_min": 501 }, { "epoch": 2.049689440993789, "grad_norm": 0.8729780469833862, "learning_rate": 3.566051724835245e-05, "loss": 0.2594, "loss_nan_ranks": 0, "loss_rank_avg": 0.32387927174568176, "step": 990, "valid_targets_mean": 1951.7, "valid_targets_min": 656 }, { "epoch": 2.060041407867495, "grad_norm": 0.6569866235371754, "learning_rate": 3.559607349262705e-05, "loss": 0.2351, "loss_nan_ranks": 0, "loss_rank_avg": 0.23175671696662903, "step": 995, "valid_targets_mean": 2289.1, "valid_targets_min": 895 }, { "epoch": 2.070393374741201, "grad_norm": 0.9247889042046914, "learning_rate": 3.5531213887919667e-05, "loss": 0.2548, "loss_nan_ranks": 0, "loss_rank_avg": 0.2623339295387268, "step": 1000, "valid_targets_mean": 2524.4, "valid_targets_min": 232 }, { "epoch": 2.080745341614907, "grad_norm": 0.6363817576343097, "learning_rate": 3.546594016362716e-05, "loss": 0.2895, "loss_nan_ranks": 0, "loss_rank_avg": 0.28919100761413574, "step": 1005, "valid_targets_mean": 2776.9, "valid_targets_min": 617 }, { "epoch": 2.091097308488613, "grad_norm": 0.7881930796673811, "learning_rate": 3.540025406018834e-05, "loss": 0.2697, "loss_nan_ranks": 0, "loss_rank_avg": 0.2384035289287567, "step": 1010, "valid_targets_mean": 1624.8, "valid_targets_min": 487 }, { "epoch": 2.101449275362319, "grad_norm": 0.4465477565347781, "learning_rate": 3.533415732903759e-05, "loss": 0.2818, "loss_nan_ranks": 0, "loss_rank_avg": 0.2667323648929596, "step": 1015, "valid_targets_mean": 5425.1, "valid_targets_min": 783 }, { "epoch": 2.111801242236025, "grad_norm": 0.7631555157748504, "learning_rate": 3.5267651732558146e-05, "loss": 0.2935, "loss_nan_ranks": 0, "loss_rank_avg": 0.3835008442401886, "step": 1020, "valid_targets_mean": 2624.8, "valid_targets_min": 510 }, { "epoch": 2.122153209109731, "grad_norm": 0.55664148104698, "learning_rate": 3.520073904403509e-05, "loss": 0.2668, "loss_nan_ranks": 0, "loss_rank_avg": 0.25191134214401245, "step": 1025, "valid_targets_mean": 3272.8, "valid_targets_min": 972 }, { "epoch": 2.132505175983437, "grad_norm": 0.8149036515302649, "learning_rate": 3.513342104760809e-05, "loss": 0.2167, "loss_nan_ranks": 0, "loss_rank_avg": 0.22442390024662018, "step": 1030, "valid_targets_mean": 1833.1, "valid_targets_min": 818 }, { "epoch": 2.142857142857143, "grad_norm": 0.5802425971474474, "learning_rate": 3.506569953822383e-05, "loss": 0.2449, "loss_nan_ranks": 0, "loss_rank_avg": 0.2896159291267395, "step": 1035, "valid_targets_mean": 3547.2, "valid_targets_min": 342 }, { "epoch": 2.153209109730849, "grad_norm": 0.6221670768855667, "learning_rate": 3.4997576321588126e-05, "loss": 0.2757, "loss_nan_ranks": 0, "loss_rank_avg": 0.22672376036643982, "step": 1040, "valid_targets_mean": 2443.9, "valid_targets_min": 647 }, { "epoch": 2.1635610766045548, "grad_norm": 0.8278897691479519, "learning_rate": 3.492905321411781e-05, "loss": 0.3221, "loss_nan_ranks": 0, "loss_rank_avg": 0.2788503170013428, "step": 1045, "valid_targets_mean": 2161.9, "valid_targets_min": 821 }, { "epoch": 2.1739130434782608, "grad_norm": 0.6727746895274888, "learning_rate": 3.486013204289227e-05, "loss": 0.2404, "loss_nan_ranks": 0, "loss_rank_avg": 0.21209818124771118, "step": 1050, "valid_targets_mean": 2909.8, "valid_targets_min": 1008 }, { "epoch": 2.1842650103519667, "grad_norm": 0.6334119835007679, "learning_rate": 3.479081464560475e-05, "loss": 0.2621, "loss_nan_ranks": 0, "loss_rank_avg": 0.29021257162094116, "step": 1055, "valid_targets_mean": 3242.4, "valid_targets_min": 542 }, { "epoch": 2.1946169772256727, "grad_norm": 1.1830366048428838, "learning_rate": 3.4721102870513345e-05, "loss": 0.253, "loss_nan_ranks": 0, "loss_rank_avg": 0.36102619767189026, "step": 1060, "valid_targets_mean": 2006.9, "valid_targets_min": 839 }, { "epoch": 2.2049689440993787, "grad_norm": 0.8106585345203733, "learning_rate": 3.465099857639173e-05, "loss": 0.3153, "loss_nan_ranks": 0, "loss_rank_avg": 0.27605193853378296, "step": 1065, "valid_targets_mean": 1677.1, "valid_targets_min": 705 }, { "epoch": 2.2153209109730847, "grad_norm": 0.5880377494754921, "learning_rate": 3.458050363247957e-05, "loss": 0.2832, "loss_nan_ranks": 0, "loss_rank_avg": 0.24764445424079895, "step": 1070, "valid_targets_mean": 3182.0, "valid_targets_min": 700 }, { "epoch": 2.2256728778467907, "grad_norm": 0.5697074711554126, "learning_rate": 3.450961991843271e-05, "loss": 0.2566, "loss_nan_ranks": 0, "loss_rank_avg": 0.24443545937538147, "step": 1075, "valid_targets_mean": 4197.8, "valid_targets_min": 1715 }, { "epoch": 2.2360248447204967, "grad_norm": 0.7599961285605185, "learning_rate": 3.4438349324273044e-05, "loss": 0.2708, "loss_nan_ranks": 0, "loss_rank_avg": 0.3468702733516693, "step": 1080, "valid_targets_mean": 2894.7, "valid_targets_min": 904 }, { "epoch": 2.246376811594203, "grad_norm": 0.7320534504878216, "learning_rate": 3.436669375033812e-05, "loss": 0.2941, "loss_nan_ranks": 0, "loss_rank_avg": 0.2806239724159241, "step": 1085, "valid_targets_mean": 2801.9, "valid_targets_min": 804 }, { "epoch": 2.256728778467909, "grad_norm": 0.6651232453856196, "learning_rate": 3.429465510723046e-05, "loss": 0.2399, "loss_nan_ranks": 0, "loss_rank_avg": 0.25253286957740784, "step": 1090, "valid_targets_mean": 2427.6, "valid_targets_min": 404 }, { "epoch": 2.267080745341615, "grad_norm": 0.7318417075725385, "learning_rate": 3.4222235315766634e-05, "loss": 0.2887, "loss_nan_ranks": 0, "loss_rank_avg": 0.2881121039390564, "step": 1095, "valid_targets_mean": 2698.2, "valid_targets_min": 553 }, { "epoch": 2.277432712215321, "grad_norm": 0.5060721290785742, "learning_rate": 3.414943630692605e-05, "loss": 0.2505, "loss_nan_ranks": 0, "loss_rank_avg": 0.1891990602016449, "step": 1100, "valid_targets_mean": 3982.4, "valid_targets_min": 1146 }, { "epoch": 2.287784679089027, "grad_norm": 0.6388973076559393, "learning_rate": 3.407626002179943e-05, "loss": 0.2605, "loss_nan_ranks": 0, "loss_rank_avg": 0.2833097577095032, "step": 1105, "valid_targets_mean": 2923.7, "valid_targets_min": 837 }, { "epoch": 2.298136645962733, "grad_norm": 0.7050108379240185, "learning_rate": 3.40027084115371e-05, "loss": 0.2694, "loss_nan_ranks": 0, "loss_rank_avg": 0.25936251878738403, "step": 1110, "valid_targets_mean": 2194.5, "valid_targets_min": 761 }, { "epoch": 2.308488612836439, "grad_norm": 1.1896188271617125, "learning_rate": 3.3928783437296906e-05, "loss": 0.2785, "loss_nan_ranks": 0, "loss_rank_avg": 0.23933464288711548, "step": 1115, "valid_targets_mean": 2121.6, "valid_targets_min": 435 }, { "epoch": 2.318840579710145, "grad_norm": 0.5651209935539805, "learning_rate": 3.385448707019199e-05, "loss": 0.2806, "loss_nan_ranks": 0, "loss_rank_avg": 0.25165855884552, "step": 1120, "valid_targets_mean": 4061.7, "valid_targets_min": 695 }, { "epoch": 2.329192546583851, "grad_norm": 0.7262731183176127, "learning_rate": 3.37798212912382e-05, "loss": 0.2524, "loss_nan_ranks": 0, "loss_rank_avg": 0.2577860951423645, "step": 1125, "valid_targets_mean": 2202.4, "valid_targets_min": 815 }, { "epoch": 2.339544513457557, "grad_norm": 0.5618393584824415, "learning_rate": 3.370478809130126e-05, "loss": 0.2452, "loss_nan_ranks": 0, "loss_rank_avg": 0.1696050465106964, "step": 1130, "valid_targets_mean": 2500.9, "valid_targets_min": 347 }, { "epoch": 2.349896480331263, "grad_norm": 0.7126252849015065, "learning_rate": 3.3629389471043686e-05, "loss": 0.2928, "loss_nan_ranks": 0, "loss_rank_avg": 0.3189730942249298, "step": 1135, "valid_targets_mean": 3294.7, "valid_targets_min": 1051 }, { "epoch": 2.360248447204969, "grad_norm": 0.9604299856824035, "learning_rate": 3.355362744087147e-05, "loss": 0.3133, "loss_nan_ranks": 0, "loss_rank_avg": 0.40159639716148376, "step": 1140, "valid_targets_mean": 3716.9, "valid_targets_min": 314 }, { "epoch": 2.370600414078675, "grad_norm": 0.6100748889704821, "learning_rate": 3.347750402088046e-05, "loss": 0.2548, "loss_nan_ranks": 0, "loss_rank_avg": 0.25193271040916443, "step": 1145, "valid_targets_mean": 3066.1, "valid_targets_min": 954 }, { "epoch": 2.380952380952381, "grad_norm": 0.6513131119801923, "learning_rate": 3.3401021240802446e-05, "loss": 0.259, "loss_nan_ranks": 0, "loss_rank_avg": 0.23295412957668304, "step": 1150, "valid_targets_mean": 2498.0, "valid_targets_min": 428 }, { "epoch": 2.391304347826087, "grad_norm": 0.6813554157755068, "learning_rate": 3.332418113995116e-05, "loss": 0.2621, "loss_nan_ranks": 0, "loss_rank_avg": 0.19543245434761047, "step": 1155, "valid_targets_mean": 2158.0, "valid_targets_min": 831 }, { "epoch": 2.401656314699793, "grad_norm": 0.7313840895870419, "learning_rate": 3.3246985767167763e-05, "loss": 0.2842, "loss_nan_ranks": 0, "loss_rank_avg": 0.22841569781303406, "step": 1160, "valid_targets_mean": 2154.1, "valid_targets_min": 400 }, { "epoch": 2.412008281573499, "grad_norm": 0.5935846326263404, "learning_rate": 3.316943718076633e-05, "loss": 0.2533, "loss_nan_ranks": 0, "loss_rank_avg": 0.333047479391098, "step": 1165, "valid_targets_mean": 4248.6, "valid_targets_min": 943 }, { "epoch": 2.422360248447205, "grad_norm": 0.791044272962795, "learning_rate": 3.3091537448478854e-05, "loss": 0.2778, "loss_nan_ranks": 0, "loss_rank_avg": 0.26495736837387085, "step": 1170, "valid_targets_mean": 2369.9, "valid_targets_min": 975 }, { "epoch": 2.432712215320911, "grad_norm": 0.6676783405628622, "learning_rate": 3.301328864740024e-05, "loss": 0.2738, "loss_nan_ranks": 0, "loss_rank_avg": 0.33358559012413025, "step": 1175, "valid_targets_mean": 2824.4, "valid_targets_min": 438 }, { "epoch": 2.443064182194617, "grad_norm": 0.6210999987816006, "learning_rate": 3.2934692863932826e-05, "loss": 0.2883, "loss_nan_ranks": 0, "loss_rank_avg": 0.37713438272476196, "step": 1180, "valid_targets_mean": 4190.8, "valid_targets_min": 972 }, { "epoch": 2.453416149068323, "grad_norm": 0.9102484172009931, "learning_rate": 3.285575219373079e-05, "loss": 0.2817, "loss_nan_ranks": 0, "loss_rank_avg": 0.27761310338974, "step": 1185, "valid_targets_mean": 2286.0, "valid_targets_min": 683 }, { "epoch": 2.463768115942029, "grad_norm": 0.8264325779605302, "learning_rate": 3.2776468741644254e-05, "loss": 0.2705, "loss_nan_ranks": 0, "loss_rank_avg": 0.35481444001197815, "step": 1190, "valid_targets_mean": 1918.8, "valid_targets_min": 488 }, { "epoch": 2.474120082815735, "grad_norm": 0.7271253546023544, "learning_rate": 3.26968446216632e-05, "loss": 0.2342, "loss_nan_ranks": 0, "loss_rank_avg": 0.26062947511672974, "step": 1195, "valid_targets_mean": 2231.8, "valid_targets_min": 709 }, { "epoch": 2.4844720496894412, "grad_norm": 0.8973929287276415, "learning_rate": 3.2616881956861025e-05, "loss": 0.2677, "loss_nan_ranks": 0, "loss_rank_avg": 0.27928027510643005, "step": 1200, "valid_targets_mean": 1896.2, "valid_targets_min": 348 }, { "epoch": 2.494824016563147, "grad_norm": 0.4082069685047567, "learning_rate": 3.2536582879338046e-05, "loss": 0.2536, "loss_nan_ranks": 0, "loss_rank_avg": 0.18940213322639465, "step": 1205, "valid_targets_mean": 4323.4, "valid_targets_min": 968 }, { "epoch": 2.505175983436853, "grad_norm": 0.7017656676375894, "learning_rate": 3.245594953016455e-05, "loss": 0.2614, "loss_nan_ranks": 0, "loss_rank_avg": 0.2417268604040146, "step": 1210, "valid_targets_mean": 2325.2, "valid_targets_min": 812 }, { "epoch": 2.5155279503105588, "grad_norm": 0.6814415938184818, "learning_rate": 3.237498405932374e-05, "loss": 0.2775, "loss_nan_ranks": 0, "loss_rank_avg": 0.33832401037216187, "step": 1215, "valid_targets_mean": 2867.0, "valid_targets_min": 887 }, { "epoch": 2.525879917184265, "grad_norm": 0.7801644137826693, "learning_rate": 3.2293688625654414e-05, "loss": 0.2863, "loss_nan_ranks": 0, "loss_rank_avg": 0.27744320034980774, "step": 1220, "valid_targets_mean": 1826.2, "valid_targets_min": 551 }, { "epoch": 2.536231884057971, "grad_norm": 0.7921338973324987, "learning_rate": 3.221206539679342e-05, "loss": 0.2726, "loss_nan_ranks": 0, "loss_rank_avg": 0.2806174159049988, "step": 1225, "valid_targets_mean": 4052.1, "valid_targets_min": 953 }, { "epoch": 2.546583850931677, "grad_norm": 0.7638655535817076, "learning_rate": 3.213011654911781e-05, "loss": 0.2941, "loss_nan_ranks": 0, "loss_rank_avg": 0.22334516048431396, "step": 1230, "valid_targets_mean": 1654.2, "valid_targets_min": 677 }, { "epoch": 2.556935817805383, "grad_norm": 0.9533183958110001, "learning_rate": 3.204784426768685e-05, "loss": 0.2639, "loss_nan_ranks": 0, "loss_rank_avg": 0.22882500290870667, "step": 1235, "valid_targets_mean": 3256.3, "valid_targets_min": 917 }, { "epoch": 2.567287784679089, "grad_norm": 0.3343640416944216, "learning_rate": 3.1965250746183755e-05, "loss": 0.2482, "loss_nan_ranks": 0, "loss_rank_avg": 0.13794702291488647, "step": 1240, "valid_targets_mean": 5393.2, "valid_targets_min": 363 }, { "epoch": 2.577639751552795, "grad_norm": 0.6369559557128881, "learning_rate": 3.1882338186857164e-05, "loss": 0.2423, "loss_nan_ranks": 0, "loss_rank_avg": 0.2859078645706177, "step": 1245, "valid_targets_mean": 2821.6, "valid_targets_min": 740 }, { "epoch": 2.587991718426501, "grad_norm": 0.6063783751731852, "learning_rate": 3.1799108800462466e-05, "loss": 0.3386, "loss_nan_ranks": 0, "loss_rank_avg": 0.31201863288879395, "step": 1250, "valid_targets_mean": 3289.1, "valid_targets_min": 789 }, { "epoch": 2.598343685300207, "grad_norm": 0.5142821780449842, "learning_rate": 3.1715564806202815e-05, "loss": 0.3602, "loss_nan_ranks": 0, "loss_rank_avg": 0.2918277978897095, "step": 1255, "valid_targets_mean": 3862.7, "valid_targets_min": 802 }, { "epoch": 2.608695652173913, "grad_norm": 0.5889004684696514, "learning_rate": 3.1631708431669985e-05, "loss": 0.2493, "loss_nan_ranks": 0, "loss_rank_avg": 0.2696582078933716, "step": 1260, "valid_targets_mean": 3824.6, "valid_targets_min": 899 }, { "epoch": 2.619047619047619, "grad_norm": 0.6639591263396689, "learning_rate": 3.1547541912784965e-05, "loss": 0.2819, "loss_nan_ranks": 0, "loss_rank_avg": 0.25455427169799805, "step": 1265, "valid_targets_mean": 2578.6, "valid_targets_min": 337 }, { "epoch": 2.629399585921325, "grad_norm": 0.6938668640706942, "learning_rate": 3.146306749373833e-05, "loss": 0.27, "loss_nan_ranks": 0, "loss_rank_avg": 0.285896360874176, "step": 1270, "valid_targets_mean": 2242.8, "valid_targets_min": 658 }, { "epoch": 2.639751552795031, "grad_norm": 0.6635900887759165, "learning_rate": 3.137828742693041e-05, "loss": 0.3081, "loss_nan_ranks": 0, "loss_rank_avg": 0.3423786163330078, "step": 1275, "valid_targets_mean": 3281.0, "valid_targets_min": 980 }, { "epoch": 2.650103519668737, "grad_norm": 0.6801128006550414, "learning_rate": 3.129320397291125e-05, "loss": 0.2364, "loss_nan_ranks": 0, "loss_rank_avg": 0.2767699360847473, "step": 1280, "valid_targets_mean": 2735.9, "valid_targets_min": 464 }, { "epoch": 2.660455486542443, "grad_norm": 0.7025184682700185, "learning_rate": 3.12078194003203e-05, "loss": 0.2553, "loss_nan_ranks": 0, "loss_rank_avg": 0.27691537141799927, "step": 1285, "valid_targets_mean": 2134.4, "valid_targets_min": 626 }, { "epoch": 2.670807453416149, "grad_norm": 0.5924464858785424, "learning_rate": 3.112213598582596e-05, "loss": 0.2732, "loss_nan_ranks": 0, "loss_rank_avg": 0.15232308208942413, "step": 1290, "valid_targets_mean": 4905.1, "valid_targets_min": 777 }, { "epoch": 2.681159420289855, "grad_norm": 0.7877428337019158, "learning_rate": 3.1036156014064846e-05, "loss": 0.2453, "loss_nan_ranks": 0, "loss_rank_avg": 0.24164274334907532, "step": 1295, "valid_targets_mean": 2376.1, "valid_targets_min": 1018 }, { "epoch": 2.691511387163561, "grad_norm": 0.7142467961580515, "learning_rate": 3.094988177758091e-05, "loss": 0.2558, "loss_nan_ranks": 0, "loss_rank_avg": 0.37197333574295044, "step": 1300, "valid_targets_mean": 3346.9, "valid_targets_min": 628 }, { "epoch": 2.701863354037267, "grad_norm": 0.5870935195942067, "learning_rate": 3.086331557676426e-05, "loss": 0.2386, "loss_nan_ranks": 0, "loss_rank_avg": 0.2159366011619568, "step": 1305, "valid_targets_mean": 2964.8, "valid_targets_min": 274 }, { "epoch": 2.712215320910973, "grad_norm": 0.6872956928546283, "learning_rate": 3.0776459719789876e-05, "loss": 0.2727, "loss_nan_ranks": 0, "loss_rank_avg": 0.31350186467170715, "step": 1310, "valid_targets_mean": 2581.4, "valid_targets_min": 696 }, { "epoch": 2.722567287784679, "grad_norm": 0.7486101772028452, "learning_rate": 3.0689316522556026e-05, "loss": 0.3293, "loss_nan_ranks": 0, "loss_rank_avg": 0.2855913043022156, "step": 1315, "valid_targets_mean": 2561.9, "valid_targets_min": 750 }, { "epoch": 2.732919254658385, "grad_norm": 0.4579078783293101, "learning_rate": 3.060188830862254e-05, "loss": 0.2429, "loss_nan_ranks": 0, "loss_rank_avg": 0.27316346764564514, "step": 1320, "valid_targets_mean": 6253.2, "valid_targets_min": 780 }, { "epoch": 2.7432712215320914, "grad_norm": 0.5358219876585554, "learning_rate": 3.0514177409148854e-05, "loss": 0.2497, "loss_nan_ranks": 0, "loss_rank_avg": 0.19187697768211365, "step": 1325, "valid_targets_mean": 2720.8, "valid_targets_min": 386 }, { "epoch": 2.753623188405797, "grad_norm": 0.5552497910549137, "learning_rate": 3.042618616283184e-05, "loss": 0.2521, "loss_nan_ranks": 0, "loss_rank_avg": 0.27454033493995667, "step": 1330, "valid_targets_mean": 3399.2, "valid_targets_min": 397 }, { "epoch": 2.7639751552795033, "grad_norm": 0.6823834665507209, "learning_rate": 3.0337916915843437e-05, "loss": 0.2599, "loss_nan_ranks": 0, "loss_rank_avg": 0.2507593631744385, "step": 1335, "valid_targets_mean": 2280.2, "valid_targets_min": 857 }, { "epoch": 2.774327122153209, "grad_norm": 0.7550596937365505, "learning_rate": 3.024937202176813e-05, "loss": 0.3365, "loss_nan_ranks": 0, "loss_rank_avg": 0.2813539505004883, "step": 1340, "valid_targets_mean": 1925.6, "valid_targets_min": 800 }, { "epoch": 2.7846790890269153, "grad_norm": 0.620351083586836, "learning_rate": 3.016055384154016e-05, "loss": 0.2645, "loss_nan_ranks": 0, "loss_rank_avg": 0.27360090613365173, "step": 1345, "valid_targets_mean": 2753.7, "valid_targets_min": 1050 }, { "epoch": 2.795031055900621, "grad_norm": 0.5870647895388508, "learning_rate": 3.007146474338061e-05, "loss": 0.2453, "loss_nan_ranks": 0, "loss_rank_avg": 0.25962918996810913, "step": 1350, "valid_targets_mean": 3009.2, "valid_targets_min": 843 }, { "epoch": 2.8053830227743273, "grad_norm": 0.7132808075099697, "learning_rate": 2.9982107102734225e-05, "loss": 0.2373, "loss_nan_ranks": 0, "loss_rank_avg": 0.28429892659187317, "step": 1355, "valid_targets_mean": 2095.7, "valid_targets_min": 1051 }, { "epoch": 2.8157349896480333, "grad_norm": 0.5718661527861477, "learning_rate": 2.9892483302206067e-05, "loss": 0.2013, "loss_nan_ranks": 0, "loss_rank_avg": 0.20819316804409027, "step": 1360, "valid_targets_mean": 2768.9, "valid_targets_min": 258 }, { "epoch": 2.8260869565217392, "grad_norm": 0.3634008953249174, "learning_rate": 2.9802595731498027e-05, "loss": 0.2315, "loss_nan_ranks": 0, "loss_rank_avg": 0.1665099710226059, "step": 1365, "valid_targets_mean": 6357.5, "valid_targets_min": 977 }, { "epoch": 2.8364389233954452, "grad_norm": 0.7314349692520135, "learning_rate": 2.9712446787345076e-05, "loss": 0.2482, "loss_nan_ranks": 0, "loss_rank_avg": 0.30443474650382996, "step": 1370, "valid_targets_mean": 2490.6, "valid_targets_min": 540 }, { "epoch": 2.846790890269151, "grad_norm": 0.5362978528913575, "learning_rate": 2.962203887345137e-05, "loss": 0.2646, "loss_nan_ranks": 0, "loss_rank_avg": 0.2595052719116211, "step": 1375, "valid_targets_mean": 3539.8, "valid_targets_min": 720 }, { "epoch": 2.857142857142857, "grad_norm": 0.6062346483149705, "learning_rate": 2.9531374400426158e-05, "loss": 0.3262, "loss_nan_ranks": 0, "loss_rank_avg": 0.24060280621051788, "step": 1380, "valid_targets_mean": 2836.4, "valid_targets_min": 652 }, { "epoch": 2.867494824016563, "grad_norm": 0.7082210941894594, "learning_rate": 2.9440455785719496e-05, "loss": 0.2887, "loss_nan_ranks": 0, "loss_rank_avg": 0.2264600545167923, "step": 1385, "valid_targets_mean": 1664.6, "valid_targets_min": 495 }, { "epoch": 2.877846790890269, "grad_norm": 0.6123887449000341, "learning_rate": 2.934928545355781e-05, "loss": 0.2984, "loss_nan_ranks": 0, "loss_rank_avg": 0.3257123827934265, "step": 1390, "valid_targets_mean": 3369.2, "valid_targets_min": 829 }, { "epoch": 2.888198757763975, "grad_norm": 0.6864043917128869, "learning_rate": 2.925786583487922e-05, "loss": 0.2905, "loss_nan_ranks": 0, "loss_rank_avg": 0.31987008452415466, "step": 1395, "valid_targets_mean": 2711.7, "valid_targets_min": 810 }, { "epoch": 2.898550724637681, "grad_norm": 0.6080342575365325, "learning_rate": 2.916619936726877e-05, "loss": 0.2845, "loss_nan_ranks": 0, "loss_rank_avg": 0.2373320758342743, "step": 1400, "valid_targets_mean": 3641.7, "valid_targets_min": 881 }, { "epoch": 2.908902691511387, "grad_norm": 0.7181192036864602, "learning_rate": 2.9074288494893407e-05, "loss": 0.3389, "loss_nan_ranks": 0, "loss_rank_avg": 0.31169378757476807, "step": 1405, "valid_targets_mean": 2594.9, "valid_targets_min": 787 }, { "epoch": 2.919254658385093, "grad_norm": 0.7116785040649848, "learning_rate": 2.8982135668436796e-05, "loss": 0.2504, "loss_nan_ranks": 0, "loss_rank_avg": 0.2377220094203949, "step": 1410, "valid_targets_mean": 2565.6, "valid_targets_min": 812 }, { "epoch": 2.929606625258799, "grad_norm": 0.527003497336332, "learning_rate": 2.8889743345034012e-05, "loss": 0.2567, "loss_nan_ranks": 0, "loss_rank_avg": 0.24901200830936432, "step": 1415, "valid_targets_mean": 3355.5, "valid_targets_min": 906 }, { "epoch": 2.939958592132505, "grad_norm": 0.7215643198974966, "learning_rate": 2.8797113988205992e-05, "loss": 0.2702, "loss_nan_ranks": 0, "loss_rank_avg": 0.26589393615722656, "step": 1420, "valid_targets_mean": 2117.3, "valid_targets_min": 518 }, { "epoch": 2.950310559006211, "grad_norm": 0.7304693761897525, "learning_rate": 2.8704250067793853e-05, "loss": 0.2543, "loss_nan_ranks": 0, "loss_rank_avg": 0.3305160701274872, "step": 1425, "valid_targets_mean": 2289.8, "valid_targets_min": 795 }, { "epoch": 2.960662525879917, "grad_norm": 0.5524041278998529, "learning_rate": 2.8611154059893072e-05, "loss": 0.2346, "loss_nan_ranks": 0, "loss_rank_avg": 0.2436435967683792, "step": 1430, "valid_targets_mean": 3544.5, "valid_targets_min": 642 }, { "epoch": 2.971014492753623, "grad_norm": 0.6949146976027709, "learning_rate": 2.851782844678741e-05, "loss": 0.2591, "loss_nan_ranks": 0, "loss_rank_avg": 0.24652817845344543, "step": 1435, "valid_targets_mean": 2396.6, "valid_targets_min": 693 }, { "epoch": 2.981366459627329, "grad_norm": 0.855845523061833, "learning_rate": 2.8424275716882764e-05, "loss": 0.3187, "loss_nan_ranks": 0, "loss_rank_avg": 0.35203707218170166, "step": 1440, "valid_targets_mean": 2468.2, "valid_targets_min": 960 }, { "epoch": 2.991718426501035, "grad_norm": 0.6069280690104846, "learning_rate": 2.8330498364640803e-05, "loss": 0.2729, "loss_nan_ranks": 0, "loss_rank_avg": 0.2389097809791565, "step": 1445, "valid_targets_mean": 2823.1, "valid_targets_min": 850 }, { "epoch": 3.002070393374741, "grad_norm": 0.7079484446595876, "learning_rate": 2.823649889051245e-05, "loss": 0.2605, "loss_nan_ranks": 0, "loss_rank_avg": 0.33429914712905884, "step": 1450, "valid_targets_mean": 2347.8, "valid_targets_min": 650 }, { "epoch": 3.012422360248447, "grad_norm": 0.5927362264974598, "learning_rate": 2.8142279800871226e-05, "loss": 0.2097, "loss_nan_ranks": 0, "loss_rank_avg": 0.17803658545017242, "step": 1455, "valid_targets_mean": 2970.0, "valid_targets_min": 683 }, { "epoch": 3.022774327122153, "grad_norm": 0.6173739269582847, "learning_rate": 2.8047843607946416e-05, "loss": 0.2336, "loss_nan_ranks": 0, "loss_rank_avg": 0.21716290712356567, "step": 1460, "valid_targets_mean": 3280.1, "valid_targets_min": 625 }, { "epoch": 3.0331262939958594, "grad_norm": 0.8835749274852875, "learning_rate": 2.7953192829756087e-05, "loss": 0.2605, "loss_nan_ranks": 0, "loss_rank_avg": 0.23659950494766235, "step": 1465, "valid_targets_mean": 1768.8, "valid_targets_min": 692 }, { "epoch": 3.0434782608695654, "grad_norm": 0.6416344650777536, "learning_rate": 2.7858329990039922e-05, "loss": 0.2249, "loss_nan_ranks": 0, "loss_rank_avg": 0.26247477531433105, "step": 1470, "valid_targets_mean": 4569.3, "valid_targets_min": 658 }, { "epoch": 3.0538302277432714, "grad_norm": 0.7529415797399801, "learning_rate": 2.7763257618191965e-05, "loss": 0.2372, "loss_nan_ranks": 0, "loss_rank_avg": 0.26717787981033325, "step": 1475, "valid_targets_mean": 2397.6, "valid_targets_min": 277 }, { "epoch": 3.0641821946169774, "grad_norm": 0.7317704953810572, "learning_rate": 2.7667978249193142e-05, "loss": 0.26, "loss_nan_ranks": 0, "loss_rank_avg": 0.21715983748435974, "step": 1480, "valid_targets_mean": 2296.4, "valid_targets_min": 769 }, { "epoch": 3.0745341614906834, "grad_norm": 0.5247604954590532, "learning_rate": 2.757249442354373e-05, "loss": 0.2678, "loss_nan_ranks": 0, "loss_rank_avg": 0.27207493782043457, "step": 1485, "valid_targets_mean": 5021.0, "valid_targets_min": 496 }, { "epoch": 3.0848861283643894, "grad_norm": 1.0520512297726068, "learning_rate": 2.747680868719553e-05, "loss": 0.2187, "loss_nan_ranks": 0, "loss_rank_avg": 0.2122560292482376, "step": 1490, "valid_targets_mean": 2820.4, "valid_targets_min": 725 }, { "epoch": 3.0952380952380953, "grad_norm": 0.6767778323794827, "learning_rate": 2.738092359148405e-05, "loss": 0.2312, "loss_nan_ranks": 0, "loss_rank_avg": 0.2775751054286957, "step": 1495, "valid_targets_mean": 2690.2, "valid_targets_min": 830 }, { "epoch": 3.1055900621118013, "grad_norm": 0.6576226728100677, "learning_rate": 2.7284841693060462e-05, "loss": 0.2208, "loss_nan_ranks": 0, "loss_rank_avg": 0.20576655864715576, "step": 1500, "valid_targets_mean": 2834.8, "valid_targets_min": 768 }, { "epoch": 2.439222042139384, "grad_norm": 0.8205999048363152, "learning_rate": 3.295112400968073e-05, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.2548583745956421, "step": 1505, "valid_targets_mean": 1901.8, "valid_targets_min": 292 }, { "epoch": 2.447325769854133, "grad_norm": 0.5315794072702741, "learning_rate": 3.2889429817593494e-05, "loss": 0.2603, "loss_nan_ranks": 0, "loss_rank_avg": 0.1704677790403366, "step": 1510, "valid_targets_mean": 3963.4, "valid_targets_min": 594 }, { "epoch": 2.4554294975688817, "grad_norm": 0.7664196020253414, "learning_rate": 3.2827525129535135e-05, "loss": 0.2847, "loss_nan_ranks": 0, "loss_rank_avg": 0.1991099715232849, "step": 1515, "valid_targets_mean": 2012.4, "valid_targets_min": 624 }, { "epoch": 2.4635332252836304, "grad_norm": 0.8521592624429181, "learning_rate": 3.276541095646482e-05, "loss": 0.2445, "loss_nan_ranks": 0, "loss_rank_avg": 0.29062721133232117, "step": 1520, "valid_targets_mean": 1823.2, "valid_targets_min": 501 }, { "epoch": 2.471636952998379, "grad_norm": 0.5852765718678786, "learning_rate": 3.2703088312762825e-05, "loss": 0.2458, "loss_nan_ranks": 0, "loss_rank_avg": 0.24727652966976166, "step": 1525, "valid_targets_mean": 3405.0, "valid_targets_min": 363 }, { "epoch": 2.479740680713128, "grad_norm": 0.813053837691479, "learning_rate": 3.2640558216213914e-05, "loss": 0.2491, "loss_nan_ranks": 0, "loss_rank_avg": 0.30369141697883606, "step": 1530, "valid_targets_mean": 2343.3, "valid_targets_min": 696 }, { "epoch": 2.487844408427877, "grad_norm": 0.8194320234055189, "learning_rate": 3.2577821687990764e-05, "loss": 0.2135, "loss_nan_ranks": 0, "loss_rank_avg": 0.23056931793689728, "step": 1535, "valid_targets_mean": 2043.1, "valid_targets_min": 216 }, { "epoch": 2.4959481361426255, "grad_norm": 0.7683424849834839, "learning_rate": 3.2514879752637236e-05, "loss": 0.2137, "loss_nan_ranks": 0, "loss_rank_avg": 0.2309729903936386, "step": 1540, "valid_targets_mean": 2539.1, "valid_targets_min": 331 }, { "epoch": 2.5040518638573745, "grad_norm": 0.776312961878328, "learning_rate": 3.2451733438051705e-05, "loss": 0.2291, "loss_nan_ranks": 0, "loss_rank_avg": 0.18839803338050842, "step": 1545, "valid_targets_mean": 1955.8, "valid_targets_min": 514 }, { "epoch": 2.512155591572123, "grad_norm": 0.655759060281187, "learning_rate": 3.238838377547023e-05, "loss": 0.2003, "loss_nan_ranks": 0, "loss_rank_avg": 0.189316064119339, "step": 1550, "valid_targets_mean": 2929.6, "valid_targets_min": 757 }, { "epoch": 2.520259319286872, "grad_norm": 1.6044275923948417, "learning_rate": 3.2324831799449724e-05, "loss": 0.2272, "loss_nan_ranks": 0, "loss_rank_avg": 0.17633099853992462, "step": 1555, "valid_targets_mean": 2779.9, "valid_targets_min": 820 }, { "epoch": 2.528363047001621, "grad_norm": 0.6561320237172028, "learning_rate": 3.226107854785106e-05, "loss": 0.2557, "loss_nan_ranks": 0, "loss_rank_avg": 0.1860257238149643, "step": 1560, "valid_targets_mean": 3073.5, "valid_targets_min": 800 }, { "epoch": 2.5364667747163696, "grad_norm": 0.6383285185047638, "learning_rate": 3.2197125061822135e-05, "loss": 0.2507, "loss_nan_ranks": 0, "loss_rank_avg": 0.2523868680000305, "step": 1565, "valid_targets_mean": 3199.5, "valid_targets_min": 727 }, { "epoch": 2.5445705024311183, "grad_norm": 0.7962930999328149, "learning_rate": 3.213297238578082e-05, "loss": 0.2197, "loss_nan_ranks": 0, "loss_rank_avg": 0.20864513516426086, "step": 1570, "valid_targets_mean": 2732.2, "valid_targets_min": 1016 }, { "epoch": 2.5526742301458674, "grad_norm": 0.7676276530225514, "learning_rate": 3.206862156739799e-05, "loss": 0.2563, "loss_nan_ranks": 0, "loss_rank_avg": 0.3047863245010376, "step": 1575, "valid_targets_mean": 2614.4, "valid_targets_min": 514 }, { "epoch": 2.560777957860616, "grad_norm": 0.8226887644393849, "learning_rate": 3.2004073657580314e-05, "loss": 0.1946, "loss_nan_ranks": 0, "loss_rank_avg": 0.2075314223766327, "step": 1580, "valid_targets_mean": 2038.8, "valid_targets_min": 337 }, { "epoch": 2.5688816855753647, "grad_norm": 0.7831791976947534, "learning_rate": 3.193932971045316e-05, "loss": 0.2325, "loss_nan_ranks": 0, "loss_rank_avg": 0.19461211562156677, "step": 1585, "valid_targets_mean": 2053.1, "valid_targets_min": 658 }, { "epoch": 2.5769854132901133, "grad_norm": 0.5644239851430982, "learning_rate": 3.187439078334338e-05, "loss": 0.2177, "loss_nan_ranks": 0, "loss_rank_avg": 0.18497009575366974, "step": 1590, "valid_targets_mean": 4375.7, "valid_targets_min": 704 }, { "epoch": 2.585089141004862, "grad_norm": 0.7466943240187409, "learning_rate": 3.180925793676199e-05, "loss": 0.2696, "loss_nan_ranks": 0, "loss_rank_avg": 0.34886205196380615, "step": 1595, "valid_targets_mean": 3252.1, "valid_targets_min": 704 }, { "epoch": 2.593192868719611, "grad_norm": 0.654235875346469, "learning_rate": 3.1743932234386905e-05, "loss": 0.2239, "loss_nan_ranks": 0, "loss_rank_avg": 0.23556801676750183, "step": 1600, "valid_targets_mean": 2707.2, "valid_targets_min": 440 }, { "epoch": 2.6012965964343597, "grad_norm": 0.8478531512416733, "learning_rate": 3.167841474304555e-05, "loss": 0.2373, "loss_nan_ranks": 0, "loss_rank_avg": 0.2540985345840454, "step": 1605, "valid_targets_mean": 2202.8, "valid_targets_min": 807 }, { "epoch": 2.6094003241491084, "grad_norm": 0.7568048524801189, "learning_rate": 3.161270653269743e-05, "loss": 0.2419, "loss_nan_ranks": 0, "loss_rank_avg": 0.2507561445236206, "step": 1610, "valid_targets_mean": 2478.7, "valid_targets_min": 884 }, { "epoch": 2.6175040518638575, "grad_norm": 0.6768880292640026, "learning_rate": 3.154680867641666e-05, "loss": 0.2685, "loss_nan_ranks": 0, "loss_rank_avg": 0.2119147777557373, "step": 1615, "valid_targets_mean": 2845.9, "valid_targets_min": 933 }, { "epoch": 2.625607779578606, "grad_norm": 0.6937745038803551, "learning_rate": 3.1480722250374454e-05, "loss": 0.2131, "loss_nan_ranks": 0, "loss_rank_avg": 0.15716394782066345, "step": 1620, "valid_targets_mean": 3715.1, "valid_targets_min": 509 }, { "epoch": 2.633711507293355, "grad_norm": 0.687030718167616, "learning_rate": 3.1414448333821526e-05, "loss": 0.2485, "loss_nan_ranks": 0, "loss_rank_avg": 0.26078009605407715, "step": 1625, "valid_targets_mean": 2993.9, "valid_targets_min": 835 }, { "epoch": 2.641815235008104, "grad_norm": 0.794998960315971, "learning_rate": 3.1347988009070496e-05, "loss": 0.2525, "loss_nan_ranks": 0, "loss_rank_avg": 0.22042764723300934, "step": 1630, "valid_targets_mean": 2182.0, "valid_targets_min": 939 }, { "epoch": 2.6499189627228525, "grad_norm": 0.5288765889583341, "learning_rate": 3.1281342361478184e-05, "loss": 0.2031, "loss_nan_ranks": 0, "loss_rank_avg": 0.18932923674583435, "step": 1635, "valid_targets_mean": 4350.9, "valid_targets_min": 916 }, { "epoch": 2.658022690437601, "grad_norm": 0.8061510946147543, "learning_rate": 3.121451247942789e-05, "loss": 0.215, "loss_nan_ranks": 0, "loss_rank_avg": 0.23893296718597412, "step": 1640, "valid_targets_mean": 2239.7, "valid_targets_min": 1029 }, { "epoch": 2.6661264181523503, "grad_norm": 0.8897502162805498, "learning_rate": 3.1147499454311654e-05, "loss": 0.2132, "loss_nan_ranks": 0, "loss_rank_avg": 0.24748632311820984, "step": 1645, "valid_targets_mean": 3042.6, "valid_targets_min": 883 }, { "epoch": 2.674230145867099, "grad_norm": 0.7411104018017028, "learning_rate": 3.1080304380512386e-05, "loss": 0.2258, "loss_nan_ranks": 0, "loss_rank_avg": 0.3214663565158844, "step": 1650, "valid_targets_mean": 3191.7, "valid_targets_min": 954 }, { "epoch": 2.6823338735818476, "grad_norm": 0.6001100044618921, "learning_rate": 3.101292835538602e-05, "loss": 0.2736, "loss_nan_ranks": 0, "loss_rank_avg": 0.21718555688858032, "step": 1655, "valid_targets_mean": 2929.2, "valid_targets_min": 510 }, { "epoch": 2.6904376012965967, "grad_norm": 0.5090566874249545, "learning_rate": 3.0945372479243605e-05, "loss": 0.1893, "loss_nan_ranks": 0, "loss_rank_avg": 0.1351870894432068, "step": 1660, "valid_targets_mean": 3636.1, "valid_targets_min": 511 }, { "epoch": 2.6985413290113454, "grad_norm": 0.8691139316583438, "learning_rate": 3.087763785533328e-05, "loss": 0.2353, "loss_nan_ranks": 0, "loss_rank_avg": 0.24571505188941956, "step": 1665, "valid_targets_mean": 2121.1, "valid_targets_min": 1000 }, { "epoch": 2.706645056726094, "grad_norm": 0.7213977715140599, "learning_rate": 3.0809725589822325e-05, "loss": 0.2162, "loss_nan_ranks": 0, "loss_rank_avg": 0.22522029280662537, "step": 1670, "valid_targets_mean": 2168.9, "valid_targets_min": 752 }, { "epoch": 2.7147487844408427, "grad_norm": 0.6699076338131222, "learning_rate": 3.074163679177907e-05, "loss": 0.2315, "loss_nan_ranks": 0, "loss_rank_avg": 0.24370843172073364, "step": 1675, "valid_targets_mean": 2977.4, "valid_targets_min": 953 }, { "epoch": 2.7228525121555913, "grad_norm": 0.6699594167700161, "learning_rate": 3.067337257315477e-05, "loss": 0.2335, "loss_nan_ranks": 0, "loss_rank_avg": 0.19450387358665466, "step": 1680, "valid_targets_mean": 2758.7, "valid_targets_min": 924 }, { "epoch": 2.7309562398703404, "grad_norm": 0.7672860021178419, "learning_rate": 3.0604934048765444e-05, "loss": 0.2039, "loss_nan_ranks": 0, "loss_rank_avg": 0.22159236669540405, "step": 1685, "valid_targets_mean": 2533.1, "valid_targets_min": 511 }, { "epoch": 2.739059967585089, "grad_norm": 0.7039751582203525, "learning_rate": 3.05363223362737e-05, "loss": 0.1949, "loss_nan_ranks": 0, "loss_rank_avg": 0.2049209177494049, "step": 1690, "valid_targets_mean": 2859.5, "valid_targets_min": 950 }, { "epoch": 2.7471636952998377, "grad_norm": 2.679447162042586, "learning_rate": 3.0467538556170463e-05, "loss": 0.1958, "loss_nan_ranks": 0, "loss_rank_avg": 0.1371978223323822, "step": 1695, "valid_targets_mean": 2292.4, "valid_targets_min": 525 }, { "epoch": 2.755267423014587, "grad_norm": 0.6779419086781114, "learning_rate": 3.0398583831756655e-05, "loss": 0.2261, "loss_nan_ranks": 0, "loss_rank_avg": 0.20101284980773926, "step": 1700, "valid_targets_mean": 2922.6, "valid_targets_min": 734 }, { "epoch": 2.7633711507293355, "grad_norm": 0.6929703972487979, "learning_rate": 3.03294592891249e-05, "loss": 0.2141, "loss_nan_ranks": 0, "loss_rank_avg": 0.2838400602340698, "step": 1705, "valid_targets_mean": 3094.0, "valid_targets_min": 697 }, { "epoch": 2.771474878444084, "grad_norm": 0.4798656780585094, "learning_rate": 3.0260166057141086e-05, "loss": 0.209, "loss_nan_ranks": 0, "loss_rank_avg": 0.18296658992767334, "step": 1710, "valid_targets_mean": 5082.8, "valid_targets_min": 471 }, { "epoch": 2.7795786061588332, "grad_norm": 0.7731022915468665, "learning_rate": 3.0190705267425956e-05, "loss": 0.1932, "loss_nan_ranks": 0, "loss_rank_avg": 0.25233393907546997, "step": 1715, "valid_targets_mean": 2334.8, "valid_targets_min": 602 }, { "epoch": 2.787682333873582, "grad_norm": 0.833833609952511, "learning_rate": 3.0121078054336633e-05, "loss": 0.2451, "loss_nan_ranks": 0, "loss_rank_avg": 0.27136874198913574, "step": 1720, "valid_targets_mean": 3887.7, "valid_targets_min": 629 }, { "epoch": 2.7957860615883305, "grad_norm": 0.572927781409477, "learning_rate": 3.005128555494806e-05, "loss": 0.1768, "loss_nan_ranks": 0, "loss_rank_avg": 0.16209685802459717, "step": 1725, "valid_targets_mean": 3344.1, "valid_targets_min": 929 }, { "epoch": 2.8038897893030796, "grad_norm": 0.8175035205190527, "learning_rate": 2.998132890903448e-05, "loss": 0.2499, "loss_nan_ranks": 0, "loss_rank_avg": 0.2571600377559662, "step": 1730, "valid_targets_mean": 2496.4, "valid_targets_min": 841 }, { "epoch": 2.8119935170178283, "grad_norm": 0.820561644375052, "learning_rate": 2.9911209259050763e-05, "loss": 0.2355, "loss_nan_ranks": 0, "loss_rank_avg": 0.21497473120689392, "step": 1735, "valid_targets_mean": 2354.7, "valid_targets_min": 1149 }, { "epoch": 2.820097244732577, "grad_norm": 0.6492150323752979, "learning_rate": 2.984092775011382e-05, "loss": 0.2228, "loss_nan_ranks": 0, "loss_rank_avg": 0.16714109480381012, "step": 1740, "valid_targets_mean": 2458.3, "valid_targets_min": 787 }, { "epoch": 2.828200972447326, "grad_norm": 0.7319549857733452, "learning_rate": 2.9770485529983834e-05, "loss": 0.2395, "loss_nan_ranks": 0, "loss_rank_avg": 0.22950349748134613, "step": 1745, "valid_targets_mean": 3142.0, "valid_targets_min": 1024 }, { "epoch": 2.8363047001620747, "grad_norm": 0.6560080208991743, "learning_rate": 2.9699883749045564e-05, "loss": 0.2336, "loss_nan_ranks": 0, "loss_rank_avg": 0.1986587643623352, "step": 1750, "valid_targets_mean": 3457.0, "valid_targets_min": 477 }, { "epoch": 2.8444084278768234, "grad_norm": 0.6382253092955735, "learning_rate": 2.962912356028953e-05, "loss": 0.216, "loss_nan_ranks": 0, "loss_rank_avg": 0.23129406571388245, "step": 1755, "valid_targets_mean": 2934.9, "valid_targets_min": 859 }, { "epoch": 2.852512155591572, "grad_norm": 0.5301256913380961, "learning_rate": 2.95582061192932e-05, "loss": 0.2389, "loss_nan_ranks": 0, "loss_rank_avg": 0.18352752923965454, "step": 1760, "valid_targets_mean": 5318.9, "valid_targets_min": 288 }, { "epoch": 2.8606158833063207, "grad_norm": 0.5551356639022342, "learning_rate": 2.9487132584202115e-05, "loss": 0.2323, "loss_nan_ranks": 0, "loss_rank_avg": 0.15121974050998688, "step": 1765, "valid_targets_mean": 3240.4, "valid_targets_min": 972 }, { "epoch": 2.8687196110210698, "grad_norm": 0.6494961371690191, "learning_rate": 2.9415904115710964e-05, "loss": 0.2369, "loss_nan_ranks": 0, "loss_rank_avg": 0.27294760942459106, "step": 1770, "valid_targets_mean": 3565.1, "valid_targets_min": 882 }, { "epoch": 2.8768233387358184, "grad_norm": 0.755878858613056, "learning_rate": 2.9344521877044633e-05, "loss": 0.2449, "loss_nan_ranks": 0, "loss_rank_avg": 0.2581571936607361, "step": 1775, "valid_targets_mean": 2870.9, "valid_targets_min": 852 }, { "epoch": 2.884927066450567, "grad_norm": 0.6896180082571636, "learning_rate": 2.927298703393924e-05, "loss": 0.2498, "loss_nan_ranks": 0, "loss_rank_avg": 0.3024943768978119, "step": 1780, "valid_targets_mean": 3049.6, "valid_targets_min": 466 }, { "epoch": 2.893030794165316, "grad_norm": 0.5548812442234702, "learning_rate": 2.9201300754623046e-05, "loss": 0.2251, "loss_nan_ranks": 0, "loss_rank_avg": 0.23311251401901245, "step": 1785, "valid_targets_mean": 4044.0, "valid_targets_min": 686 }, { "epoch": 2.901134521880065, "grad_norm": 1.438754224110583, "learning_rate": 2.9129464209797404e-05, "loss": 0.2276, "loss_nan_ranks": 0, "loss_rank_avg": 0.24073530733585358, "step": 1790, "valid_targets_mean": 1909.4, "valid_targets_min": 617 }, { "epoch": 2.9092382495948135, "grad_norm": 0.7830491458219581, "learning_rate": 2.9057478572617644e-05, "loss": 0.215, "loss_nan_ranks": 0, "loss_rank_avg": 0.24332499504089355, "step": 1795, "valid_targets_mean": 2556.9, "valid_targets_min": 1002 }, { "epoch": 2.9173419773095626, "grad_norm": 0.6145444178155638, "learning_rate": 2.898534501867391e-05, "loss": 0.2337, "loss_nan_ranks": 0, "loss_rank_avg": 0.25278767943382263, "step": 1800, "valid_targets_mean": 3891.1, "valid_targets_min": 971 }, { "epoch": 2.9254457050243112, "grad_norm": 0.3981787416840784, "learning_rate": 2.8913064725971947e-05, "loss": 0.2051, "loss_nan_ranks": 0, "loss_rank_avg": 0.14965100586414337, "step": 1805, "valid_targets_mean": 5392.8, "valid_targets_min": 908 }, { "epoch": 2.93354943273906, "grad_norm": 0.5818947273050361, "learning_rate": 2.8840638874913894e-05, "loss": 0.2228, "loss_nan_ranks": 0, "loss_rank_avg": 0.24818670749664307, "step": 1810, "valid_targets_mean": 3600.8, "valid_targets_min": 509 }, { "epoch": 2.941653160453809, "grad_norm": 0.7145037253167454, "learning_rate": 2.8768068648278976e-05, "loss": 0.2105, "loss_nan_ranks": 0, "loss_rank_avg": 0.1713862121105194, "step": 1815, "valid_targets_mean": 2208.1, "valid_targets_min": 815 }, { "epoch": 2.9497568881685576, "grad_norm": 0.6506752973751263, "learning_rate": 2.8695355231204206e-05, "loss": 0.2021, "loss_nan_ranks": 0, "loss_rank_avg": 0.1586257517337799, "step": 1820, "valid_targets_mean": 2533.8, "valid_targets_min": 918 }, { "epoch": 2.9578606158833063, "grad_norm": 0.9308540302999432, "learning_rate": 2.862249981116502e-05, "loss": 0.2175, "loss_nan_ranks": 0, "loss_rank_avg": 0.18500950932502747, "step": 1825, "valid_targets_mean": 1953.1, "valid_targets_min": 386 }, { "epoch": 2.965964343598055, "grad_norm": 0.868527787807027, "learning_rate": 2.854950357795589e-05, "loss": 0.2713, "loss_nan_ranks": 0, "loss_rank_avg": 0.30140724778175354, "step": 1830, "valid_targets_mean": 2394.5, "valid_targets_min": 544 }, { "epoch": 2.974068071312804, "grad_norm": 0.7675779936155871, "learning_rate": 2.847636772367091e-05, "loss": 0.2659, "loss_nan_ranks": 0, "loss_rank_avg": 0.38385745882987976, "step": 1835, "valid_targets_mean": 3416.3, "valid_targets_min": 652 }, { "epoch": 2.9821717990275527, "grad_norm": 0.5095446691779011, "learning_rate": 2.8403093442684287e-05, "loss": 0.1997, "loss_nan_ranks": 0, "loss_rank_avg": 0.17920516431331635, "step": 1840, "valid_targets_mean": 4411.1, "valid_targets_min": 968 }, { "epoch": 2.9902755267423013, "grad_norm": 0.7425898253446929, "learning_rate": 2.8329681931630877e-05, "loss": 0.2287, "loss_nan_ranks": 0, "loss_rank_avg": 0.21636709570884705, "step": 1845, "valid_targets_mean": 2047.3, "valid_targets_min": 332 }, { "epoch": 2.99837925445705, "grad_norm": 0.7698249801134349, "learning_rate": 2.825613438938663e-05, "loss": 0.2574, "loss_nan_ranks": 0, "loss_rank_avg": 0.3017503619194031, "step": 1850, "valid_targets_mean": 2716.4, "valid_targets_min": 815 }, { "epoch": 3.006482982171799, "grad_norm": 0.7062953708878924, "learning_rate": 2.8182452017048983e-05, "loss": 0.2273, "loss_nan_ranks": 0, "loss_rank_avg": 0.16801732778549194, "step": 1855, "valid_targets_mean": 2252.6, "valid_targets_min": 612 }, { "epoch": 3.0145867098865478, "grad_norm": 0.7009970781236867, "learning_rate": 2.81086360179173e-05, "loss": 0.2254, "loss_nan_ranks": 0, "loss_rank_avg": 0.3520157039165497, "step": 1860, "valid_targets_mean": 3688.4, "valid_targets_min": 821 }, { "epoch": 3.0226904376012964, "grad_norm": 1.0084991924004758, "learning_rate": 2.8034687597473164e-05, "loss": 0.2193, "loss_nan_ranks": 0, "loss_rank_avg": 0.21333259344100952, "step": 1865, "valid_targets_mean": 2459.2, "valid_targets_min": 286 }, { "epoch": 3.0307941653160455, "grad_norm": 0.5137156161040282, "learning_rate": 2.796060796336074e-05, "loss": 0.2002, "loss_nan_ranks": 0, "loss_rank_avg": 0.18863826990127563, "step": 1870, "valid_targets_mean": 5101.9, "valid_targets_min": 689 }, { "epoch": 3.038897893030794, "grad_norm": 1.8100288546636265, "learning_rate": 2.7886398325367018e-05, "loss": 0.2146, "loss_nan_ranks": 0, "loss_rank_avg": 0.2229488492012024, "step": 1875, "valid_targets_mean": 2298.8, "valid_targets_min": 353 }, { "epoch": 3.047001620745543, "grad_norm": 0.720734898463899, "learning_rate": 2.7812059895402064e-05, "loss": 0.198, "loss_nan_ranks": 0, "loss_rank_avg": 0.20065172016620636, "step": 1880, "valid_targets_mean": 3090.3, "valid_targets_min": 681 }, { "epoch": 3.055105348460292, "grad_norm": 0.8640799066873229, "learning_rate": 2.773759388747925e-05, "loss": 0.3024, "loss_nan_ranks": 0, "loss_rank_avg": 0.4552222788333893, "step": 1885, "valid_targets_mean": 3287.7, "valid_targets_min": 804 }, { "epoch": 3.0632090761750406, "grad_norm": 0.6353362563989103, "learning_rate": 2.7663001517695386e-05, "loss": 0.231, "loss_nan_ranks": 0, "loss_rank_avg": 0.24317996203899384, "step": 1890, "valid_targets_mean": 3646.6, "valid_targets_min": 630 }, { "epoch": 3.0713128038897892, "grad_norm": 0.7914447945449794, "learning_rate": 2.7588284004210907e-05, "loss": 0.203, "loss_nan_ranks": 0, "loss_rank_avg": 0.20814718306064606, "step": 1895, "valid_targets_mean": 2367.0, "valid_targets_min": 849 }, { "epoch": 3.079416531604538, "grad_norm": 0.6958540521779719, "learning_rate": 2.7513442567229936e-05, "loss": 0.1968, "loss_nan_ranks": 0, "loss_rank_avg": 0.20249110460281372, "step": 1900, "valid_targets_mean": 2836.4, "valid_targets_min": 1033 }, { "epoch": 3.087520259319287, "grad_norm": 0.596529064303546, "learning_rate": 2.7438478428980407e-05, "loss": 0.2174, "loss_nan_ranks": 0, "loss_rank_avg": 0.14787033200263977, "step": 1905, "valid_targets_mean": 3139.7, "valid_targets_min": 475 }, { "epoch": 3.0956239870340356, "grad_norm": 0.7078002600984272, "learning_rate": 2.7363392813694047e-05, "loss": 0.2662, "loss_nan_ranks": 0, "loss_rank_avg": 0.3391125798225403, "step": 1910, "valid_targets_mean": 3532.0, "valid_targets_min": 345 }, { "epoch": 3.1037277147487843, "grad_norm": 0.7778209985657967, "learning_rate": 2.7288186947586426e-05, "loss": 0.2797, "loss_nan_ranks": 0, "loss_rank_avg": 0.18052786588668823, "step": 1915, "valid_targets_mean": 2382.4, "valid_targets_min": 815 }, { "epoch": 3.1118314424635334, "grad_norm": 0.6013057667276556, "learning_rate": 2.7212862058836925e-05, "loss": 0.2246, "loss_nan_ranks": 0, "loss_rank_avg": 0.20441167056560516, "step": 1920, "valid_targets_mean": 4624.4, "valid_targets_min": 1011 }, { "epoch": 3.119935170178282, "grad_norm": 0.8433721924819828, "learning_rate": 2.713741937756865e-05, "loss": 0.2132, "loss_nan_ranks": 0, "loss_rank_avg": 0.21256756782531738, "step": 1925, "valid_targets_mean": 2051.4, "valid_targets_min": 1096 }, { "epoch": 3.1280388978930307, "grad_norm": 0.8267912865776698, "learning_rate": 2.7061860135828384e-05, "loss": 0.2097, "loss_nan_ranks": 0, "loss_rank_avg": 0.23010283708572388, "step": 1930, "valid_targets_mean": 2566.1, "valid_targets_min": 1053 }, { "epoch": 3.1361426256077793, "grad_norm": 0.9281087995213807, "learning_rate": 2.6986185567566442e-05, "loss": 0.1956, "loss_nan_ranks": 0, "loss_rank_avg": 0.26588061451911926, "step": 1935, "valid_targets_mean": 2648.5, "valid_targets_min": 1102 }, { "epoch": 3.1442463533225284, "grad_norm": 0.7402140669755561, "learning_rate": 2.6910396908616527e-05, "loss": 0.2389, "loss_nan_ranks": 0, "loss_rank_avg": 0.24440577626228333, "step": 1940, "valid_targets_mean": 2880.9, "valid_targets_min": 1200 }, { "epoch": 3.152350081037277, "grad_norm": 0.9250550622058952, "learning_rate": 2.6834495396675526e-05, "loss": 0.214, "loss_nan_ranks": 0, "loss_rank_avg": 0.18351495265960693, "step": 1945, "valid_targets_mean": 1815.4, "valid_targets_min": 792 }, { "epoch": 3.1604538087520258, "grad_norm": 0.7075464086399091, "learning_rate": 2.6758482271283347e-05, "loss": 0.183, "loss_nan_ranks": 0, "loss_rank_avg": 0.14974619448184967, "step": 1950, "valid_targets_mean": 2622.6, "valid_targets_min": 918 }, { "epoch": 3.168557536466775, "grad_norm": 0.9235868375401112, "learning_rate": 2.668235877380263e-05, "loss": 0.2305, "loss_nan_ranks": 0, "loss_rank_avg": 0.24251984059810638, "step": 1955, "valid_targets_mean": 1804.3, "valid_targets_min": 958 }, { "epoch": 3.1766612641815235, "grad_norm": 0.6596779615208653, "learning_rate": 2.660612614739849e-05, "loss": 0.1977, "loss_nan_ranks": 0, "loss_rank_avg": 0.14453783631324768, "step": 1960, "valid_targets_mean": 2709.9, "valid_targets_min": 976 }, { "epoch": 3.184764991896272, "grad_norm": 0.766766066884446, "learning_rate": 2.652978563701822e-05, "loss": 0.2015, "loss_nan_ranks": 0, "loss_rank_avg": 0.1874874234199524, "step": 1965, "valid_targets_mean": 2113.1, "valid_targets_min": 551 }, { "epoch": 3.1928687196110213, "grad_norm": 0.8124849594835287, "learning_rate": 2.645333848937095e-05, "loss": 0.1831, "loss_nan_ranks": 0, "loss_rank_avg": 0.23300279676914215, "step": 1970, "valid_targets_mean": 2446.9, "valid_targets_min": 901 }, { "epoch": 3.20097244732577, "grad_norm": 0.46106063693318805, "learning_rate": 2.6376785952907292e-05, "loss": 0.1697, "loss_nan_ranks": 0, "loss_rank_avg": 0.10534625500440598, "step": 1975, "valid_targets_mean": 4224.2, "valid_targets_min": 910 }, { "epoch": 3.2090761750405186, "grad_norm": 0.7587794893394673, "learning_rate": 2.630012927779896e-05, "loss": 0.2402, "loss_nan_ranks": 0, "loss_rank_avg": 0.2638416290283203, "step": 1980, "valid_targets_mean": 2923.1, "valid_targets_min": 460 }, { "epoch": 3.217179902755267, "grad_norm": 0.8879684966937325, "learning_rate": 2.6223369715918338e-05, "loss": 0.2079, "loss_nan_ranks": 0, "loss_rank_avg": 0.22857242822647095, "step": 1985, "valid_targets_mean": 1645.6, "valid_targets_min": 501 }, { "epoch": 3.2252836304700163, "grad_norm": 0.7748370854682728, "learning_rate": 2.614650852081805e-05, "loss": 0.2333, "loss_nan_ranks": 0, "loss_rank_avg": 0.24988800287246704, "step": 1990, "valid_targets_mean": 2849.4, "valid_targets_min": 782 }, { "epoch": 3.233387358184765, "grad_norm": 0.7495261062213084, "learning_rate": 2.606954694771047e-05, "loss": 0.1831, "loss_nan_ranks": 0, "loss_rank_avg": 0.23291251063346863, "step": 1995, "valid_targets_mean": 2843.9, "valid_targets_min": 981 }, { "epoch": 3.2414910858995136, "grad_norm": 0.7547991819930768, "learning_rate": 2.5992486253447258e-05, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.21426227688789368, "step": 2000, "valid_targets_mean": 2390.5, "valid_targets_min": 525 }, { "epoch": 3.2495948136142627, "grad_norm": 0.8127669361485503, "learning_rate": 2.5915327696498787e-05, "loss": 0.1866, "loss_nan_ranks": 0, "loss_rank_avg": 0.12424997985363007, "step": 2005, "valid_targets_mean": 1779.2, "valid_targets_min": 518 }, { "epoch": 3.2576985413290114, "grad_norm": 0.7721290973743158, "learning_rate": 2.583807253693362e-05, "loss": 0.2001, "loss_nan_ranks": 0, "loss_rank_avg": 0.18391962349414825, "step": 2010, "valid_targets_mean": 2541.4, "valid_targets_min": 1182 }, { "epoch": 3.26580226904376, "grad_norm": 0.7334128634083178, "learning_rate": 2.576072203639794e-05, "loss": 0.2041, "loss_nan_ranks": 0, "loss_rank_avg": 0.19778266549110413, "step": 2015, "valid_targets_mean": 2840.1, "valid_targets_min": 980 }, { "epoch": 3.2739059967585087, "grad_norm": 0.9287603147287846, "learning_rate": 2.5683277458094926e-05, "loss": 0.1992, "loss_nan_ranks": 0, "loss_rank_avg": 0.2278834730386734, "step": 2020, "valid_targets_mean": 1949.1, "valid_targets_min": 815 }, { "epoch": 3.282009724473258, "grad_norm": 0.8397730144943303, "learning_rate": 2.560574006676413e-05, "loss": 0.2076, "loss_nan_ranks": 0, "loss_rank_avg": 0.2002110779285431, "step": 2025, "valid_targets_mean": 3523.7, "valid_targets_min": 310 }, { "epoch": 3.2901134521880064, "grad_norm": 0.4390442212313819, "learning_rate": 2.5528111128660826e-05, "loss": 0.1701, "loss_nan_ranks": 0, "loss_rank_avg": 0.13749784231185913, "step": 2030, "valid_targets_mean": 5424.6, "valid_targets_min": 232 }, { "epoch": 3.298217179902755, "grad_norm": 0.6699615633322983, "learning_rate": 2.545039191153533e-05, "loss": 0.1734, "loss_nan_ranks": 0, "loss_rank_avg": 0.2043614387512207, "step": 2035, "valid_targets_mean": 3574.8, "valid_targets_min": 1054 }, { "epoch": 3.306320907617504, "grad_norm": 0.8633099775212048, "learning_rate": 2.53725836846123e-05, "loss": 0.2352, "loss_nan_ranks": 0, "loss_rank_avg": 0.1649923026561737, "step": 2040, "valid_targets_mean": 1737.0, "valid_targets_min": 456 }, { "epoch": 3.314424635332253, "grad_norm": 0.6256214069648829, "learning_rate": 2.5294687718569994e-05, "loss": 0.2001, "loss_nan_ranks": 0, "loss_rank_avg": 0.14858299493789673, "step": 2045, "valid_targets_mean": 3804.9, "valid_targets_min": 769 }, { "epoch": 3.3225283630470015, "grad_norm": 0.9944856313019108, "learning_rate": 2.5216705285519525e-05, "loss": 0.2182, "loss_nan_ranks": 0, "loss_rank_avg": 0.17022621631622314, "step": 2050, "valid_targets_mean": 2688.2, "valid_targets_min": 269 }, { "epoch": 3.3306320907617506, "grad_norm": 0.6389414039882365, "learning_rate": 2.5138637658984116e-05, "loss": 0.1769, "loss_nan_ranks": 0, "loss_rank_avg": 0.12931106984615326, "step": 2055, "valid_targets_mean": 2573.4, "valid_targets_min": 597 }, { "epoch": 3.3387358184764993, "grad_norm": 0.6456462614939432, "learning_rate": 2.5060486113878244e-05, "loss": 0.213, "loss_nan_ranks": 0, "loss_rank_avg": 0.22942790389060974, "step": 2060, "valid_targets_mean": 3076.4, "valid_targets_min": 640 }, { "epoch": 3.346839546191248, "grad_norm": 0.4552379058782566, "learning_rate": 2.4982251926486873e-05, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.0790659636259079, "step": 2065, "valid_targets_mean": 3547.6, "valid_targets_min": 747 }, { "epoch": 3.354943273905997, "grad_norm": 0.5502283454291953, "learning_rate": 2.490393637444458e-05, "loss": 0.1957, "loss_nan_ranks": 0, "loss_rank_avg": 0.16592127084732056, "step": 2070, "valid_targets_mean": 4692.4, "valid_targets_min": 988 }, { "epoch": 3.3630470016207457, "grad_norm": 0.8617017867222999, "learning_rate": 2.482554073671471e-05, "loss": 0.2125, "loss_nan_ranks": 0, "loss_rank_avg": 0.24501700699329376, "step": 2075, "valid_targets_mean": 2338.4, "valid_targets_min": 937 }, { "epoch": 3.3711507293354943, "grad_norm": 0.7899472946015639, "learning_rate": 2.4747066293568452e-05, "loss": 0.2152, "loss_nan_ranks": 0, "loss_rank_avg": 0.15188781917095184, "step": 2080, "valid_targets_mean": 2104.1, "valid_targets_min": 556 }, { "epoch": 3.379254457050243, "grad_norm": 0.8193544565230731, "learning_rate": 2.4668514326564e-05, "loss": 0.2124, "loss_nan_ranks": 0, "loss_rank_avg": 0.17579089105129242, "step": 2085, "valid_targets_mean": 2063.2, "valid_targets_min": 553 }, { "epoch": 3.387358184764992, "grad_norm": 0.889128650784621, "learning_rate": 2.4589886118525556e-05, "loss": 0.1833, "loss_nan_ranks": 0, "loss_rank_avg": 0.18815834820270538, "step": 2090, "valid_targets_mean": 1816.8, "valid_targets_min": 471 }, { "epoch": 3.3954619124797407, "grad_norm": 0.7550229654302467, "learning_rate": 2.4511182953522405e-05, "loss": 0.1906, "loss_nan_ranks": 0, "loss_rank_avg": 0.26341044902801514, "step": 2095, "valid_targets_mean": 3581.5, "valid_targets_min": 656 }, { "epoch": 3.4035656401944894, "grad_norm": 0.8942138699800349, "learning_rate": 2.4432406116847954e-05, "loss": 0.1948, "loss_nan_ranks": 0, "loss_rank_avg": 0.2436755895614624, "step": 2100, "valid_targets_mean": 1985.3, "valid_targets_min": 916 }, { "epoch": 3.411669367909238, "grad_norm": 0.5028709815573968, "learning_rate": 2.435355689499874e-05, "loss": 0.1666, "loss_nan_ranks": 0, "loss_rank_avg": 0.11536405980587006, "step": 2105, "valid_targets_mean": 3964.9, "valid_targets_min": 233 }, { "epoch": 3.419773095623987, "grad_norm": 0.714825678842735, "learning_rate": 2.4274636575653398e-05, "loss": 0.1707, "loss_nan_ranks": 0, "loss_rank_avg": 0.15641966462135315, "step": 2110, "valid_targets_mean": 2424.9, "valid_targets_min": 865 }, { "epoch": 3.427876823338736, "grad_norm": 0.8122455585254386, "learning_rate": 2.4195646447651663e-05, "loss": 0.2298, "loss_nan_ranks": 0, "loss_rank_avg": 0.2142556607723236, "step": 2115, "valid_targets_mean": 4355.4, "valid_targets_min": 1109 }, { "epoch": 3.4359805510534844, "grad_norm": 0.783700231697767, "learning_rate": 2.411658780097331e-05, "loss": 0.2259, "loss_nan_ranks": 0, "loss_rank_avg": 0.3505910634994507, "step": 2120, "valid_targets_mean": 4021.6, "valid_targets_min": 1086 }, { "epoch": 3.4440842787682335, "grad_norm": 0.7313909744848299, "learning_rate": 2.4037461926717075e-05, "loss": 0.1956, "loss_nan_ranks": 0, "loss_rank_avg": 0.17269133031368256, "step": 2125, "valid_targets_mean": 2451.2, "valid_targets_min": 514 }, { "epoch": 3.452188006482982, "grad_norm": 0.8088615988871327, "learning_rate": 2.395827011707959e-05, "loss": 0.2503, "loss_nan_ranks": 0, "loss_rank_avg": 0.20847368240356445, "step": 2130, "valid_targets_mean": 2553.2, "valid_targets_min": 658 }, { "epoch": 3.460291734197731, "grad_norm": 0.5900039519353123, "learning_rate": 2.3879013665334258e-05, "loss": 0.2124, "loss_nan_ranks": 0, "loss_rank_avg": 0.20145244896411896, "step": 2135, "valid_targets_mean": 4923.4, "valid_targets_min": 677 }, { "epoch": 3.46839546191248, "grad_norm": 0.6378206622182675, "learning_rate": 2.3799693865810163e-05, "loss": 0.2032, "loss_nan_ranks": 0, "loss_rank_avg": 0.16754154860973358, "step": 2140, "valid_targets_mean": 3790.3, "valid_targets_min": 750 }, { "epoch": 3.4764991896272286, "grad_norm": 0.7389226745729313, "learning_rate": 2.37203120138709e-05, "loss": 0.2046, "loss_nan_ranks": 0, "loss_rank_avg": 0.2016831338405609, "step": 2145, "valid_targets_mean": 3017.4, "valid_targets_min": 913 }, { "epoch": 3.4846029173419772, "grad_norm": 0.542849963051636, "learning_rate": 2.3640869405893446e-05, "loss": 0.2485, "loss_nan_ranks": 0, "loss_rank_avg": 0.19606372714042664, "step": 2150, "valid_targets_mean": 3942.9, "valid_targets_min": 464 }, { "epoch": 3.492706645056726, "grad_norm": 0.8814880321553831, "learning_rate": 2.3561367339246976e-05, "loss": 0.2054, "loss_nan_ranks": 0, "loss_rank_avg": 0.2154223620891571, "step": 2155, "valid_targets_mean": 1835.9, "valid_targets_min": 778 }, { "epoch": 3.500810372771475, "grad_norm": 0.7067348415715224, "learning_rate": 2.3481807112271678e-05, "loss": 0.1828, "loss_nan_ranks": 0, "loss_rank_avg": 0.166023850440979, "step": 2160, "valid_targets_mean": 3050.1, "valid_targets_min": 890 }, { "epoch": 3.5089141004862237, "grad_norm": 0.620735692816103, "learning_rate": 2.3402190024257543e-05, "loss": 0.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.13485875725746155, "step": 2165, "valid_targets_mean": 3070.6, "valid_targets_min": 680 }, { "epoch": 3.5170178282009723, "grad_norm": 0.7429662318750067, "learning_rate": 2.3322517375423165e-05, "loss": 0.1878, "loss_nan_ranks": 0, "loss_rank_avg": 0.16115394234657288, "step": 2170, "valid_targets_mean": 2298.1, "valid_targets_min": 712 }, { "epoch": 3.525121555915721, "grad_norm": 0.8477525841685281, "learning_rate": 2.3242790466894494e-05, "loss": 0.2381, "loss_nan_ranks": 0, "loss_rank_avg": 0.19504885375499725, "step": 2175, "valid_targets_mean": 2246.0, "valid_targets_min": 398 }, { "epoch": 3.53322528363047, "grad_norm": 0.7627025545672735, "learning_rate": 2.316301060068359e-05, "loss": 0.2083, "loss_nan_ranks": 0, "loss_rank_avg": 0.21119363605976105, "step": 2180, "valid_targets_mean": 2926.6, "valid_targets_min": 692 }, { "epoch": 3.5413290113452187, "grad_norm": 1.100127953832155, "learning_rate": 2.3083179079667347e-05, "loss": 0.2094, "loss_nan_ranks": 0, "loss_rank_avg": 0.20743992924690247, "step": 2185, "valid_targets_mean": 4087.3, "valid_targets_min": 924 }, { "epoch": 3.5494327390599674, "grad_norm": 0.5805399953892108, "learning_rate": 2.300329720756625e-05, "loss": 0.1837, "loss_nan_ranks": 0, "loss_rank_avg": 0.15286213159561157, "step": 2190, "valid_targets_mean": 3119.1, "valid_targets_min": 342 }, { "epoch": 3.5575364667747165, "grad_norm": 0.7519460987432748, "learning_rate": 2.2923366288923045e-05, "loss": 0.2176, "loss_nan_ranks": 0, "loss_rank_avg": 0.18701784312725067, "step": 2195, "valid_targets_mean": 2679.4, "valid_targets_min": 704 }, { "epoch": 3.565640194489465, "grad_norm": 0.5738422561843207, "learning_rate": 2.2843387629081453e-05, "loss": 0.1719, "loss_nan_ranks": 0, "loss_rank_avg": 0.14277049899101257, "step": 2200, "valid_targets_mean": 4261.6, "valid_targets_min": 835 }, { "epoch": 3.5737439222042138, "grad_norm": 0.6995930320107968, "learning_rate": 2.2763362534164854e-05, "loss": 0.1787, "loss_nan_ranks": 0, "loss_rank_avg": 0.1426575481891632, "step": 2205, "valid_targets_mean": 2615.9, "valid_targets_min": 550 }, { "epoch": 3.581847649918963, "grad_norm": 0.778790384658622, "learning_rate": 2.268329231105498e-05, "loss": 0.1957, "loss_nan_ranks": 0, "loss_rank_avg": 0.22932958602905273, "step": 2210, "valid_targets_mean": 2972.4, "valid_targets_min": 704 }, { "epoch": 3.5899513776337115, "grad_norm": 0.8621285854700218, "learning_rate": 2.2603178267370504e-05, "loss": 0.1967, "loss_nan_ranks": 0, "loss_rank_avg": 0.20100966095924377, "step": 2215, "valid_targets_mean": 2199.8, "valid_targets_min": 509 }, { "epoch": 3.59805510534846, "grad_norm": 0.6366888964927337, "learning_rate": 2.2523021711445746e-05, "loss": 0.1847, "loss_nan_ranks": 0, "loss_rank_avg": 0.14098083972930908, "step": 2220, "valid_targets_mean": 3288.6, "valid_targets_min": 814 }, { "epoch": 3.6061588330632093, "grad_norm": 1.031030067314881, "learning_rate": 2.2442823952309308e-05, "loss": 0.205, "loss_nan_ranks": 0, "loss_rank_avg": 0.21637287735939026, "step": 2225, "valid_targets_mean": 1423.6, "valid_targets_min": 521 }, { "epoch": 3.614262560777958, "grad_norm": 0.8638929404500169, "learning_rate": 2.2362586299662642e-05, "loss": 0.1955, "loss_nan_ranks": 0, "loss_rank_avg": 0.2800928056240082, "step": 2230, "valid_targets_mean": 2027.9, "valid_targets_min": 386 }, { "epoch": 3.6223662884927066, "grad_norm": 0.7529589056185002, "learning_rate": 2.228231006385873e-05, "loss": 0.1949, "loss_nan_ranks": 0, "loss_rank_avg": 0.3154662251472473, "step": 2235, "valid_targets_mean": 4337.9, "valid_targets_min": 566 }, { "epoch": 3.6304700162074557, "grad_norm": 0.6840352862675642, "learning_rate": 2.2201996555880633e-05, "loss": 0.1879, "loss_nan_ranks": 0, "loss_rank_avg": 0.13636550307273865, "step": 2240, "valid_targets_mean": 2383.8, "valid_targets_min": 477 }, { "epoch": 3.6385737439222043, "grad_norm": 0.7568859162264532, "learning_rate": 2.2121647087320105e-05, "loss": 0.2209, "loss_nan_ranks": 0, "loss_rank_avg": 0.17221365869045258, "step": 2245, "valid_targets_mean": 2137.6, "valid_targets_min": 671 }, { "epoch": 3.646677471636953, "grad_norm": 0.8960270729679528, "learning_rate": 2.204126297035617e-05, "loss": 0.2129, "loss_nan_ranks": 0, "loss_rank_avg": 0.23943698406219482, "step": 2250, "valid_targets_mean": 1959.3, "valid_targets_min": 562 }, { "epoch": 3.6547811993517016, "grad_norm": 0.7464106224245589, "learning_rate": 2.196084551773368e-05, "loss": 0.2071, "loss_nan_ranks": 0, "loss_rank_avg": 0.18965956568717957, "step": 2255, "valid_targets_mean": 2451.1, "valid_targets_min": 973 }, { "epoch": 3.6628849270664503, "grad_norm": 0.9722153370680764, "learning_rate": 2.1880396042741906e-05, "loss": 0.2534, "loss_nan_ranks": 0, "loss_rank_avg": 0.22785764932632446, "step": 2260, "valid_targets_mean": 1551.8, "valid_targets_min": 757 }, { "epoch": 3.6709886547811994, "grad_norm": 0.4697676488300176, "learning_rate": 2.179991585919307e-05, "loss": 0.1834, "loss_nan_ranks": 0, "loss_rank_avg": 0.0863395407795906, "step": 2265, "valid_targets_mean": 3504.8, "valid_targets_min": 522 }, { "epoch": 3.679092382495948, "grad_norm": 0.7371456685043023, "learning_rate": 2.1719406281400873e-05, "loss": 0.2142, "loss_nan_ranks": 0, "loss_rank_avg": 0.2391626387834549, "step": 2270, "valid_targets_mean": 2812.4, "valid_targets_min": 636 }, { "epoch": 3.6871961102106967, "grad_norm": 0.7116149527659587, "learning_rate": 2.163886862415908e-05, "loss": 0.2048, "loss_nan_ranks": 0, "loss_rank_avg": 0.16868996620178223, "step": 2275, "valid_targets_mean": 3199.4, "valid_targets_min": 823 }, { "epoch": 3.695299837925446, "grad_norm": 0.6944396008804573, "learning_rate": 2.155830420272e-05, "loss": 0.2347, "loss_nan_ranks": 0, "loss_rank_avg": 0.36398154497146606, "step": 2280, "valid_targets_mean": 4588.9, "valid_targets_min": 857 }, { "epoch": 3.7034035656401945, "grad_norm": 0.49891846247542965, "learning_rate": 2.1477714332773022e-05, "loss": 0.1834, "loss_nan_ranks": 0, "loss_rank_avg": 0.12793442606925964, "step": 2285, "valid_targets_mean": 4197.6, "valid_targets_min": 750 }, { "epoch": 3.711507293354943, "grad_norm": 0.7737664275138527, "learning_rate": 2.139710033042314e-05, "loss": 0.2154, "loss_nan_ranks": 0, "loss_rank_avg": 0.21408765017986298, "step": 2290, "valid_targets_mean": 2392.2, "valid_targets_min": 436 }, { "epoch": 3.719611021069692, "grad_norm": 0.6249478567474501, "learning_rate": 2.1316463512169453e-05, "loss": 0.2269, "loss_nan_ranks": 0, "loss_rank_avg": 0.17073558270931244, "step": 2295, "valid_targets_mean": 3448.7, "valid_targets_min": 816 }, { "epoch": 3.727714748784441, "grad_norm": 0.6319183901564622, "learning_rate": 2.1235805194883665e-05, "loss": 0.1862, "loss_nan_ranks": 0, "loss_rank_avg": 0.12544557452201843, "step": 2300, "valid_targets_mean": 3194.1, "valid_targets_min": 828 }, { "epoch": 3.7358184764991895, "grad_norm": 0.8809027809587772, "learning_rate": 2.115512669578857e-05, "loss": 0.1817, "loss_nan_ranks": 0, "loss_rank_avg": 0.21802709996700287, "step": 2305, "valid_targets_mean": 2093.7, "valid_targets_min": 540 }, { "epoch": 3.7439222042139386, "grad_norm": 0.8125759794942795, "learning_rate": 2.107442933243656e-05, "loss": 0.1738, "loss_nan_ranks": 0, "loss_rank_avg": 0.1779268980026245, "step": 2310, "valid_targets_mean": 2595.6, "valid_targets_min": 1016 }, { "epoch": 3.7520259319286873, "grad_norm": 0.7211723580416524, "learning_rate": 2.099371442268809e-05, "loss": 0.2015, "loss_nan_ranks": 0, "loss_rank_avg": 0.1611754596233368, "step": 2315, "valid_targets_mean": 2815.6, "valid_targets_min": 715 }, { "epoch": 3.760129659643436, "grad_norm": 0.7848416454395023, "learning_rate": 2.0912983284690157e-05, "loss": 0.1933, "loss_nan_ranks": 0, "loss_rank_avg": 0.2059643268585205, "step": 2320, "valid_targets_mean": 2567.2, "valid_targets_min": 232 }, { "epoch": 3.768233387358185, "grad_norm": 0.5904887355051087, "learning_rate": 2.0832237236854794e-05, "loss": 0.1779, "loss_nan_ranks": 0, "loss_rank_avg": 0.15662437677383423, "step": 2325, "valid_targets_mean": 3666.7, "valid_targets_min": 1253 }, { "epoch": 3.7763371150729337, "grad_norm": 0.7236461690914054, "learning_rate": 2.0751477597837528e-05, "loss": 0.1704, "loss_nan_ranks": 0, "loss_rank_avg": 0.12969183921813965, "step": 2330, "valid_targets_mean": 2251.1, "valid_targets_min": 590 }, { "epoch": 3.7844408427876823, "grad_norm": 0.9505422297729229, "learning_rate": 2.0670705686515822e-05, "loss": 0.1897, "loss_nan_ranks": 0, "loss_rank_avg": 0.23993048071861267, "step": 2335, "valid_targets_mean": 1928.8, "valid_targets_min": 505 }, { "epoch": 3.792544570502431, "grad_norm": 0.6637526217519724, "learning_rate": 2.0589922821967566e-05, "loss": 0.1716, "loss_nan_ranks": 0, "loss_rank_avg": 0.1568320393562317, "step": 2340, "valid_targets_mean": 2895.9, "valid_targets_min": 662 }, { "epoch": 3.8006482982171796, "grad_norm": 1.0128117172897237, "learning_rate": 2.0509130323449545e-05, "loss": 0.1732, "loss_nan_ranks": 0, "loss_rank_avg": 0.15534460544586182, "step": 2345, "valid_targets_mean": 1361.9, "valid_targets_min": 488 }, { "epoch": 3.8087520259319287, "grad_norm": 0.6671945777380213, "learning_rate": 2.0428329510375838e-05, "loss": 0.1997, "loss_nan_ranks": 0, "loss_rank_avg": 0.30660581588745117, "step": 2350, "valid_targets_mean": 4413.9, "valid_targets_min": 531 }, { "epoch": 3.8168557536466774, "grad_norm": 0.5544375126811655, "learning_rate": 2.0347521702296333e-05, "loss": 0.1945, "loss_nan_ranks": 0, "loss_rank_avg": 0.17179805040359497, "step": 2355, "valid_targets_mean": 4360.7, "valid_targets_min": 700 }, { "epoch": 3.824959481361426, "grad_norm": 0.8902971352705107, "learning_rate": 2.026670821887516e-05, "loss": 0.1696, "loss_nan_ranks": 0, "loss_rank_avg": 0.16486603021621704, "step": 2360, "valid_targets_mean": 1924.4, "valid_targets_min": 514 }, { "epoch": 3.833063209076175, "grad_norm": 0.691767954969929, "learning_rate": 2.0185890379869115e-05, "loss": 0.2224, "loss_nan_ranks": 0, "loss_rank_avg": 0.29504096508026123, "step": 2365, "valid_targets_mean": 3782.2, "valid_targets_min": 1077 }, { "epoch": 3.841166936790924, "grad_norm": 0.7902862954174232, "learning_rate": 2.0105069505106126e-05, "loss": 0.1761, "loss_nan_ranks": 0, "loss_rank_avg": 0.2295757234096527, "step": 2370, "valid_targets_mean": 2529.1, "valid_targets_min": 650 }, { "epoch": 3.8492706645056725, "grad_norm": 0.6983178682113452, "learning_rate": 2.00242469144637e-05, "loss": 0.1819, "loss_nan_ranks": 0, "loss_rank_avg": 0.1746961772441864, "step": 2375, "valid_targets_mean": 3053.4, "valid_targets_min": 860 }, { "epoch": 3.8573743922204216, "grad_norm": 0.7564438056864309, "learning_rate": 1.994342392784738e-05, "loss": 0.1784, "loss_nan_ranks": 0, "loss_rank_avg": 0.17830297350883484, "step": 2380, "valid_targets_mean": 2944.7, "valid_targets_min": 1044 }, { "epoch": 3.86547811993517, "grad_norm": 0.755822155072044, "learning_rate": 1.9862601865169154e-05, "loss": 0.207, "loss_nan_ranks": 0, "loss_rank_avg": 0.19303062558174133, "step": 2385, "valid_targets_mean": 2711.5, "valid_targets_min": 1487 }, { "epoch": 3.873581847649919, "grad_norm": 0.7160490637060567, "learning_rate": 1.9781782046325938e-05, "loss": 0.173, "loss_nan_ranks": 0, "loss_rank_avg": 0.18017929792404175, "step": 2390, "valid_targets_mean": 2449.2, "valid_targets_min": 510 }, { "epoch": 3.881685575364668, "grad_norm": 0.6508016267439924, "learning_rate": 1.9700965791177986e-05, "loss": 0.2162, "loss_nan_ranks": 0, "loss_rank_avg": 0.22605565190315247, "step": 2395, "valid_targets_mean": 3326.8, "valid_targets_min": 525 }, { "epoch": 3.8897893030794166, "grad_norm": 0.6852974910747845, "learning_rate": 1.9620154419527372e-05, "loss": 0.2692, "loss_nan_ranks": 0, "loss_rank_avg": 0.24458330869674683, "step": 2400, "valid_targets_mean": 3742.1, "valid_targets_min": 531 }, { "epoch": 3.8978930307941653, "grad_norm": 0.8183442535515982, "learning_rate": 1.953934925109641e-05, "loss": 0.2326, "loss_nan_ranks": 0, "loss_rank_avg": 0.3048601746559143, "step": 2405, "valid_targets_mean": 2523.3, "valid_targets_min": 540 }, { "epoch": 3.9059967585089144, "grad_norm": 0.7630671943332308, "learning_rate": 1.945855160550611e-05, "loss": 0.1885, "loss_nan_ranks": 0, "loss_rank_avg": 0.16103631258010864, "step": 2410, "valid_targets_mean": 2636.6, "valid_targets_min": 604 }, { "epoch": 3.914100486223663, "grad_norm": 0.8070470089137307, "learning_rate": 1.937776280225463e-05, "loss": 0.2098, "loss_nan_ranks": 0, "loss_rank_avg": 0.20676636695861816, "step": 2415, "valid_targets_mean": 2609.7, "valid_targets_min": 840 }, { "epoch": 3.9222042139384117, "grad_norm": 0.9463383844932369, "learning_rate": 1.929698416069571e-05, "loss": 0.2172, "loss_nan_ranks": 0, "loss_rank_avg": 0.197508305311203, "step": 2420, "valid_targets_mean": 1525.7, "valid_targets_min": 759 }, { "epoch": 3.9303079416531603, "grad_norm": 0.6974073097875326, "learning_rate": 1.9216217000017182e-05, "loss": 0.2076, "loss_nan_ranks": 0, "loss_rank_avg": 0.21730129420757294, "step": 2425, "valid_targets_mean": 2918.9, "valid_targets_min": 693 }, { "epoch": 3.938411669367909, "grad_norm": 0.6196655766852457, "learning_rate": 1.9135462639219325e-05, "loss": 0.2229, "loss_nan_ranks": 0, "loss_rank_avg": 0.22163273394107819, "step": 2430, "valid_targets_mean": 4302.2, "valid_targets_min": 914 }, { "epoch": 3.946515397082658, "grad_norm": 1.0083387028610686, "learning_rate": 1.905472239709343e-05, "loss": 0.1875, "loss_nan_ranks": 0, "loss_rank_avg": 0.27771952748298645, "step": 2435, "valid_targets_mean": 1752.2, "valid_targets_min": 792 }, { "epoch": 3.9546191247974067, "grad_norm": 0.6436193457753687, "learning_rate": 1.89739975922002e-05, "loss": 0.2059, "loss_nan_ranks": 0, "loss_rank_avg": 0.24347497522830963, "step": 2440, "valid_targets_mean": 3727.1, "valid_targets_min": 731 }, { "epoch": 3.9627228525121554, "grad_norm": 0.7463707250780504, "learning_rate": 1.889328954284823e-05, "loss": 0.1899, "loss_nan_ranks": 0, "loss_rank_avg": 0.21482862532138824, "step": 2445, "valid_targets_mean": 2699.9, "valid_targets_min": 575 }, { "epoch": 3.9708265802269045, "grad_norm": 0.8578748435821815, "learning_rate": 1.8812599567072496e-05, "loss": 0.2208, "loss_nan_ranks": 0, "loss_rank_avg": 0.22225850820541382, "step": 2450, "valid_targets_mean": 2473.5, "valid_targets_min": 781 }, { "epoch": 3.978930307941653, "grad_norm": 0.6000598430860175, "learning_rate": 1.873192898261281e-05, "loss": 0.1742, "loss_nan_ranks": 0, "loss_rank_avg": 0.17323483526706696, "step": 2455, "valid_targets_mean": 3969.9, "valid_targets_min": 501 }, { "epoch": 3.987034035656402, "grad_norm": 0.6411349311068479, "learning_rate": 1.8651279106892317e-05, "loss": 0.2063, "loss_nan_ranks": 0, "loss_rank_avg": 0.22670185565948486, "step": 2460, "valid_targets_mean": 3840.9, "valid_targets_min": 506 }, { "epoch": 3.995137763371151, "grad_norm": 0.8265211359345982, "learning_rate": 1.8570651256995933e-05, "loss": 0.1763, "loss_nan_ranks": 0, "loss_rank_avg": 0.16508886218070984, "step": 2465, "valid_targets_mean": 1857.5, "valid_targets_min": 407 }, { "epoch": 4.003241491085899, "grad_norm": 0.7438519471306131, "learning_rate": 1.849004674964891e-05, "loss": 0.1646, "loss_nan_ranks": 0, "loss_rank_avg": 0.13882270455360413, "step": 2470, "valid_targets_mean": 2407.8, "valid_targets_min": 699 }, { "epoch": 4.011345218800648, "grad_norm": 0.666660079984095, "learning_rate": 1.840946690119528e-05, "loss": 0.1747, "loss_nan_ranks": 0, "loss_rank_avg": 0.18586783111095428, "step": 2475, "valid_targets_mean": 3428.2, "valid_targets_min": 631 }, { "epoch": 4.019448946515397, "grad_norm": 0.6224308701315978, "learning_rate": 1.8328913027576373e-05, "loss": 0.1512, "loss_nan_ranks": 0, "loss_rank_avg": 0.1357424110174179, "step": 2480, "valid_targets_mean": 2990.6, "valid_targets_min": 297 }, { "epoch": 4.0275526742301455, "grad_norm": 0.9706356061146716, "learning_rate": 1.824838644430934e-05, "loss": 0.156, "loss_nan_ranks": 0, "loss_rank_avg": 0.17957650125026703, "step": 2485, "valid_targets_mean": 2300.4, "valid_targets_min": 819 }, { "epoch": 4.035656401944895, "grad_norm": 0.5507038011859006, "learning_rate": 1.8167888466465652e-05, "loss": 0.1543, "loss_nan_ranks": 0, "loss_rank_avg": 0.1574670970439911, "step": 2490, "valid_targets_mean": 6137.8, "valid_targets_min": 269 }, { "epoch": 4.043760129659644, "grad_norm": 0.9201955501879038, "learning_rate": 1.8087420408649596e-05, "loss": 0.1852, "loss_nan_ranks": 0, "loss_rank_avg": 0.1650194525718689, "step": 2495, "valid_targets_mean": 1996.8, "valid_targets_min": 971 }, { "epoch": 4.051863857374392, "grad_norm": 0.7731697108102025, "learning_rate": 1.8006983584976877e-05, "loss": 0.1829, "loss_nan_ranks": 0, "loss_rank_avg": 0.18308573961257935, "step": 2500, "valid_targets_mean": 2703.9, "valid_targets_min": 740 }, { "epoch": 4.059967585089141, "grad_norm": 0.7203113706129127, "learning_rate": 1.7926579309053098e-05, "loss": 0.1584, "loss_nan_ranks": 0, "loss_rank_avg": 0.1433395892381668, "step": 2505, "valid_targets_mean": 2686.1, "valid_targets_min": 601 }, { "epoch": 4.06807131280389, "grad_norm": 0.857648318619981, "learning_rate": 1.7846208893952346e-05, "loss": 0.1733, "loss_nan_ranks": 0, "loss_rank_avg": 0.17913417518138885, "step": 2510, "valid_targets_mean": 2421.8, "valid_targets_min": 216 }, { "epoch": 4.076175040518638, "grad_norm": 0.9249873120711297, "learning_rate": 1.7765873652195713e-05, "loss": 0.1537, "loss_nan_ranks": 0, "loss_rank_avg": 0.19423171877861023, "step": 2515, "valid_targets_mean": 2475.4, "valid_targets_min": 946 }, { "epoch": 4.084278768233387, "grad_norm": 2.311467435227256, "learning_rate": 1.7685574895729886e-05, "loss": 0.2207, "loss_nan_ranks": 0, "loss_rank_avg": 0.4830706715583801, "step": 2520, "valid_targets_mean": 3542.9, "valid_targets_min": 305 }, { "epoch": 4.0923824959481365, "grad_norm": 0.654022585178441, "learning_rate": 1.7605313935905722e-05, "loss": 0.1511, "loss_nan_ranks": 0, "loss_rank_avg": 0.1987391710281372, "step": 2525, "valid_targets_mean": 4264.9, "valid_targets_min": 549 }, { "epoch": 4.100486223662885, "grad_norm": 0.7899542972251363, "learning_rate": 1.7525092083456795e-05, "loss": 0.1646, "loss_nan_ranks": 0, "loss_rank_avg": 0.15167073905467987, "step": 2530, "valid_targets_mean": 2471.2, "valid_targets_min": 544 }, { "epoch": 4.108589951377634, "grad_norm": 0.7446749286045431, "learning_rate": 1.744491064847805e-05, "loss": 0.1731, "loss_nan_ranks": 0, "loss_rank_avg": 0.14512816071510315, "step": 2535, "valid_targets_mean": 3130.6, "valid_targets_min": 828 }, { "epoch": 4.116693679092383, "grad_norm": 0.6706352002553055, "learning_rate": 1.7364770940404375e-05, "loss": 0.1749, "loss_nan_ranks": 0, "loss_rank_avg": 0.18727947771549225, "step": 2540, "valid_targets_mean": 3859.0, "valid_targets_min": 972 }, { "epoch": 4.124797406807131, "grad_norm": 0.7374471536131514, "learning_rate": 1.7284674267989213e-05, "loss": 0.1898, "loss_nan_ranks": 0, "loss_rank_avg": 0.3415883183479309, "step": 2545, "valid_targets_mean": 3796.5, "valid_targets_min": 731 }, { "epoch": 4.13290113452188, "grad_norm": 0.6623719219174707, "learning_rate": 1.72046219392832e-05, "loss": 0.1622, "loss_nan_ranks": 0, "loss_rank_avg": 0.09289093315601349, "step": 2550, "valid_targets_mean": 2261.0, "valid_targets_min": 372 }, { "epoch": 4.1410048622366284, "grad_norm": 0.6819916449930195, "learning_rate": 1.712461526161279e-05, "loss": 0.2122, "loss_nan_ranks": 0, "loss_rank_avg": 0.19168910384178162, "step": 2555, "valid_targets_mean": 3595.6, "valid_targets_min": 431 }, { "epoch": 4.1491085899513775, "grad_norm": 1.006431838006035, "learning_rate": 1.7044655541558934e-05, "loss": 0.1734, "loss_nan_ranks": 0, "loss_rank_avg": 0.19053317606449127, "step": 2560, "valid_targets_mean": 2357.0, "valid_targets_min": 939 }, { "epoch": 4.157212317666127, "grad_norm": 0.7533939089362455, "learning_rate": 1.69647440849357e-05, "loss": 0.1684, "loss_nan_ranks": 0, "loss_rank_avg": 0.2373582273721695, "step": 2565, "valid_targets_mean": 2927.2, "valid_targets_min": 947 }, { "epoch": 4.165316045380875, "grad_norm": 0.890040140849173, "learning_rate": 1.6884882196768985e-05, "loss": 0.1805, "loss_nan_ranks": 0, "loss_rank_avg": 0.188620924949646, "step": 2570, "valid_targets_mean": 2630.1, "valid_targets_min": 734 }, { "epoch": 4.173419773095624, "grad_norm": 0.9465451734827055, "learning_rate": 1.680507118127518e-05, "loss": 0.1876, "loss_nan_ranks": 0, "loss_rank_avg": 0.19093164801597595, "step": 2575, "valid_targets_mean": 1947.6, "valid_targets_min": 594 }, { "epoch": 4.181523500810373, "grad_norm": 0.7658272802842436, "learning_rate": 1.6725312341839895e-05, "loss": 0.1391, "loss_nan_ranks": 0, "loss_rank_avg": 0.14707794785499573, "step": 2580, "valid_targets_mean": 2918.4, "valid_targets_min": 965 }, { "epoch": 4.189627228525121, "grad_norm": 0.6443361980317487, "learning_rate": 1.664560698099664e-05, "loss": 0.1722, "loss_nan_ranks": 0, "loss_rank_avg": 0.15699368715286255, "step": 2585, "valid_targets_mean": 3664.1, "valid_targets_min": 1065 }, { "epoch": 4.19773095623987, "grad_norm": 0.9445201634571403, "learning_rate": 1.6565956400405586e-05, "loss": 0.161, "loss_nan_ranks": 0, "loss_rank_avg": 0.19105768203735352, "step": 2590, "valid_targets_mean": 1996.1, "valid_targets_min": 776 }, { "epoch": 4.2058346839546195, "grad_norm": 1.5563352274482452, "learning_rate": 1.6486361900832284e-05, "loss": 0.142, "loss_nan_ranks": 0, "loss_rank_avg": 0.1398153007030487, "step": 2595, "valid_targets_mean": 1860.5, "valid_targets_min": 741 }, { "epoch": 4.213938411669368, "grad_norm": 0.6946128489566771, "learning_rate": 1.6406824782126428e-05, "loss": 0.2203, "loss_nan_ranks": 0, "loss_rank_avg": 0.22305166721343994, "step": 2600, "valid_targets_mean": 3348.3, "valid_targets_min": 959 }, { "epoch": 4.222042139384117, "grad_norm": 0.6233066610164918, "learning_rate": 1.632734634320064e-05, "loss": 0.2009, "loss_nan_ranks": 0, "loss_rank_avg": 0.22936005890369415, "step": 2605, "valid_targets_mean": 3911.8, "valid_targets_min": 925 }, { "epoch": 4.230145867098866, "grad_norm": 0.6881169895401946, "learning_rate": 1.6247927882009256e-05, "loss": 0.158, "loss_nan_ranks": 0, "loss_rank_avg": 0.13565057516098022, "step": 2610, "valid_targets_mean": 3660.1, "valid_targets_min": 1077 }, { "epoch": 4.238249594813614, "grad_norm": 0.9276168493947143, "learning_rate": 1.6168570695527096e-05, "loss": 0.1619, "loss_nan_ranks": 0, "loss_rank_avg": 0.2158156931400299, "step": 2615, "valid_targets_mean": 2655.6, "valid_targets_min": 909 }, { "epoch": 4.246353322528363, "grad_norm": 1.0419792453131715, "learning_rate": 1.6089276079728334e-05, "loss": 0.1589, "loss_nan_ranks": 0, "loss_rank_avg": 0.12811069190502167, "step": 2620, "valid_targets_mean": 1496.8, "valid_targets_min": 303 }, { "epoch": 4.254457050243111, "grad_norm": 0.5184090018750442, "learning_rate": 1.6010045329565294e-05, "loss": 0.1487, "loss_nan_ranks": 0, "loss_rank_avg": 0.08075259625911713, "step": 2625, "valid_targets_mean": 3308.2, "valid_targets_min": 705 }, { "epoch": 4.2625607779578605, "grad_norm": 1.374064211424771, "learning_rate": 1.5930879738947328e-05, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.14756430685520172, "step": 2630, "valid_targets_mean": 2306.1, "valid_targets_min": 875 }, { "epoch": 4.27066450567261, "grad_norm": 0.7709350033003551, "learning_rate": 1.585178060071966e-05, "loss": 0.1548, "loss_nan_ranks": 0, "loss_rank_avg": 0.16429486870765686, "step": 2635, "valid_targets_mean": 2699.4, "valid_targets_min": 471 }, { "epoch": 4.278768233387358, "grad_norm": 0.7949963216390307, "learning_rate": 1.5772749206642296e-05, "loss": 0.1461, "loss_nan_ranks": 0, "loss_rank_avg": 0.11400672793388367, "step": 2640, "valid_targets_mean": 2194.9, "valid_targets_min": 564 }, { "epoch": 4.286871961102107, "grad_norm": 1.0554910650197593, "learning_rate": 1.5693786847368918e-05, "loss": 0.1554, "loss_nan_ranks": 0, "loss_rank_avg": 0.1564255654811859, "step": 2645, "valid_targets_mean": 1670.0, "valid_targets_min": 742 }, { "epoch": 4.294975688816856, "grad_norm": 0.8555240936332876, "learning_rate": 1.5614894812425806e-05, "loss": 0.1256, "loss_nan_ranks": 0, "loss_rank_avg": 0.1624247133731842, "step": 2650, "valid_targets_mean": 2291.0, "valid_targets_min": 685 }, { "epoch": 4.303079416531604, "grad_norm": 0.7761516523216345, "learning_rate": 1.5536074390190786e-05, "loss": 0.1422, "loss_nan_ranks": 0, "loss_rank_avg": 0.12907105684280396, "step": 2655, "valid_targets_mean": 2245.6, "valid_targets_min": 518 }, { "epoch": 4.311183144246353, "grad_norm": 1.4090587432444437, "learning_rate": 1.5457326867872177e-05, "loss": 0.1745, "loss_nan_ranks": 0, "loss_rank_avg": 0.17307105660438538, "step": 2660, "valid_targets_mean": 2902.2, "valid_targets_min": 757 }, { "epoch": 4.319286871961102, "grad_norm": 0.7599287679035327, "learning_rate": 1.5378653531487784e-05, "loss": 0.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.1532491147518158, "step": 2665, "valid_targets_mean": 2631.6, "valid_targets_min": 539 }, { "epoch": 4.327390599675851, "grad_norm": 0.8485351714572734, "learning_rate": 1.5300055665843875e-05, "loss": 0.1487, "loss_nan_ranks": 0, "loss_rank_avg": 0.14278289675712585, "step": 2670, "valid_targets_mean": 2180.6, "valid_targets_min": 355 }, { "epoch": 4.3354943273906, "grad_norm": 0.7356937932327555, "learning_rate": 1.5221534554514225e-05, "loss": 0.1767, "loss_nan_ranks": 0, "loss_rank_avg": 0.13728389143943787, "step": 2675, "valid_targets_mean": 2713.6, "valid_targets_min": 908 }, { "epoch": 4.343598055105349, "grad_norm": 0.8514962373379015, "learning_rate": 1.5143091479819146e-05, "loss": 0.1627, "loss_nan_ranks": 0, "loss_rank_avg": 0.12912364304065704, "step": 2680, "valid_targets_mean": 2137.4, "valid_targets_min": 636 }, { "epoch": 4.351701782820097, "grad_norm": 0.8511576532571051, "learning_rate": 1.5064727722804531e-05, "loss": 0.1618, "loss_nan_ranks": 0, "loss_rank_avg": 0.20828333497047424, "step": 2685, "valid_targets_mean": 2588.8, "valid_targets_min": 495 }, { "epoch": 4.359805510534846, "grad_norm": 1.0492092151976131, "learning_rate": 1.4986444563220948e-05, "loss": 0.2177, "loss_nan_ranks": 0, "loss_rank_avg": 0.23015139997005463, "step": 2690, "valid_targets_mean": 1931.1, "valid_targets_min": 426 }, { "epoch": 4.367909238249595, "grad_norm": 0.9100981933490145, "learning_rate": 1.4908243279502741e-05, "loss": 0.1704, "loss_nan_ranks": 0, "loss_rank_avg": 0.1979110985994339, "step": 2695, "valid_targets_mean": 2374.7, "valid_targets_min": 1030 }, { "epoch": 4.376012965964343, "grad_norm": 0.7595733722776951, "learning_rate": 1.4830125148747138e-05, "loss": 0.1659, "loss_nan_ranks": 0, "loss_rank_avg": 0.1817144751548767, "step": 2700, "valid_targets_mean": 2891.0, "valid_targets_min": 782 }, { "epoch": 4.3841166936790925, "grad_norm": 0.7794754495340108, "learning_rate": 1.475209144669341e-05, "loss": 0.1891, "loss_nan_ranks": 0, "loss_rank_avg": 0.2341780811548233, "step": 2705, "valid_targets_mean": 3009.4, "valid_targets_min": 915 }, { "epoch": 4.392220421393841, "grad_norm": 0.9584422683500831, "learning_rate": 1.4674143447702036e-05, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.13136430084705353, "step": 2710, "valid_targets_mean": 1982.9, "valid_targets_min": 671 }, { "epoch": 4.40032414910859, "grad_norm": 0.5758324638844335, "learning_rate": 1.4596282424733877e-05, "loss": 0.162, "loss_nan_ranks": 0, "loss_rank_avg": 0.06660260260105133, "step": 2715, "valid_targets_mean": 3760.6, "valid_targets_min": 805 }, { "epoch": 4.408427876823339, "grad_norm": 0.6558036998170294, "learning_rate": 1.4518509649329406e-05, "loss": 0.157, "loss_nan_ranks": 0, "loss_rank_avg": 0.157700315117836, "step": 2720, "valid_targets_mean": 3546.7, "valid_targets_min": 932 }, { "epoch": 4.416531604538087, "grad_norm": 0.8633304546821023, "learning_rate": 1.4440826391587926e-05, "loss": 0.1659, "loss_nan_ranks": 0, "loss_rank_avg": 0.12797395884990692, "step": 2725, "valid_targets_mean": 3217.9, "valid_targets_min": 735 }, { "epoch": 4.424635332252836, "grad_norm": 0.6582694588059188, "learning_rate": 1.4363233920146855e-05, "loss": 0.1792, "loss_nan_ranks": 0, "loss_rank_avg": 0.16166099905967712, "step": 2730, "valid_targets_mean": 4224.6, "valid_targets_min": 801 }, { "epoch": 4.432739059967585, "grad_norm": 0.7022399878776832, "learning_rate": 1.4285733502160955e-05, "loss": 0.1478, "loss_nan_ranks": 0, "loss_rank_avg": 0.1490454524755478, "step": 2735, "valid_targets_mean": 3313.8, "valid_targets_min": 977 }, { "epoch": 4.4408427876823335, "grad_norm": 0.6688054411278289, "learning_rate": 1.4208326403281702e-05, "loss": 0.172, "loss_nan_ranks": 0, "loss_rank_avg": 0.1919623762369156, "step": 2740, "valid_targets_mean": 3607.4, "valid_targets_min": 693 }, { "epoch": 4.448946515397083, "grad_norm": 0.9020567053374119, "learning_rate": 1.4131013887636576e-05, "loss": 0.1863, "loss_nan_ranks": 0, "loss_rank_avg": 0.16687409579753876, "step": 2745, "valid_targets_mean": 2358.4, "valid_targets_min": 801 }, { "epoch": 4.457050243111832, "grad_norm": 0.7645681159215328, "learning_rate": 1.4053797217808432e-05, "loss": 0.1755, "loss_nan_ranks": 0, "loss_rank_avg": 0.2162127047777176, "step": 2750, "valid_targets_mean": 3857.8, "valid_targets_min": 853 }, { "epoch": 4.46515397082658, "grad_norm": 0.867803300126707, "learning_rate": 1.3976677654814866e-05, "loss": 0.1396, "loss_nan_ranks": 0, "loss_rank_avg": 0.11421076953411102, "step": 2755, "valid_targets_mean": 2012.0, "valid_targets_min": 510 }, { "epoch": 4.473257698541329, "grad_norm": 0.8742220073053529, "learning_rate": 1.3899656458087647e-05, "loss": 0.1435, "loss_nan_ranks": 0, "loss_rank_avg": 0.15495306253433228, "step": 2760, "valid_targets_mean": 2445.5, "valid_targets_min": 782 }, { "epoch": 4.481361426256078, "grad_norm": 0.7571940426598677, "learning_rate": 1.3822734885452136e-05, "loss": 0.2069, "loss_nan_ranks": 0, "loss_rank_avg": 0.1919158697128296, "step": 2765, "valid_targets_mean": 3757.5, "valid_targets_min": 824 }, { "epoch": 4.489465153970826, "grad_norm": 0.8691721790493876, "learning_rate": 1.3745914193106715e-05, "loss": 0.1971, "loss_nan_ranks": 0, "loss_rank_avg": 0.14633077383041382, "step": 2770, "valid_targets_mean": 1987.1, "valid_targets_min": 406 }, { "epoch": 4.4975688816855754, "grad_norm": 1.000044264127931, "learning_rate": 1.366919563560233e-05, "loss": 0.1779, "loss_nan_ranks": 0, "loss_rank_avg": 0.3116513788700104, "step": 2775, "valid_targets_mean": 4190.8, "valid_targets_min": 605 }, { "epoch": 4.5056726094003245, "grad_norm": 0.8331745332190477, "learning_rate": 1.3592580465821956e-05, "loss": 0.1926, "loss_nan_ranks": 0, "loss_rank_avg": 0.18027907609939575, "step": 2780, "valid_targets_mean": 2925.8, "valid_targets_min": 809 }, { "epoch": 4.513776337115073, "grad_norm": 0.8471157769543586, "learning_rate": 1.3516069934960174e-05, "loss": 0.1475, "loss_nan_ranks": 0, "loss_rank_avg": 0.18600761890411377, "step": 2785, "valid_targets_mean": 2895.5, "valid_targets_min": 859 }, { "epoch": 4.521880064829822, "grad_norm": 0.8127559212585381, "learning_rate": 1.3439665292502695e-05, "loss": 0.171, "loss_nan_ranks": 0, "loss_rank_avg": 0.16321048140525818, "step": 2790, "valid_targets_mean": 2676.2, "valid_targets_min": 899 }, { "epoch": 4.52998379254457, "grad_norm": 0.8681867438751043, "learning_rate": 1.3363367786205985e-05, "loss": 0.2175, "loss_nan_ranks": 0, "loss_rank_avg": 0.16139662265777588, "step": 2795, "valid_targets_mean": 2765.1, "valid_targets_min": 1075 }, { "epoch": 4.538087520259319, "grad_norm": 0.6147735291418077, "learning_rate": 1.3287178662076893e-05, "loss": 0.1871, "loss_nan_ranks": 0, "loss_rank_avg": 0.2413632571697235, "step": 2800, "valid_targets_mean": 4606.2, "valid_targets_min": 679 }, { "epoch": 4.546191247974068, "grad_norm": 0.7563381558755065, "learning_rate": 1.3211099164352261e-05, "loss": 0.1899, "loss_nan_ranks": 0, "loss_rank_avg": 0.21764537692070007, "step": 2805, "valid_targets_mean": 2891.3, "valid_targets_min": 521 }, { "epoch": 4.5542949756888165, "grad_norm": 0.7369725771049391, "learning_rate": 1.3135130535478655e-05, "loss": 0.1627, "loss_nan_ranks": 0, "loss_rank_avg": 0.15378154814243317, "step": 2810, "valid_targets_mean": 3029.8, "valid_targets_min": 686 }, { "epoch": 4.562398703403566, "grad_norm": 0.8372190818629114, "learning_rate": 1.3059274016092057e-05, "loss": 0.1866, "loss_nan_ranks": 0, "loss_rank_avg": 0.17605245113372803, "step": 2815, "valid_targets_mean": 3103.2, "valid_targets_min": 736 }, { "epoch": 4.570502431118315, "grad_norm": 0.831632617042843, "learning_rate": 1.2983530844997585e-05, "loss": 0.1639, "loss_nan_ranks": 0, "loss_rank_avg": 0.1470744013786316, "step": 2820, "valid_targets_mean": 2123.9, "valid_targets_min": 524 }, { "epoch": 4.578606158833063, "grad_norm": 0.8005009026500092, "learning_rate": 1.2907902259149287e-05, "loss": 0.1649, "loss_nan_ranks": 0, "loss_rank_avg": 0.17905943095684052, "step": 2825, "valid_targets_mean": 2288.1, "valid_targets_min": 669 }, { "epoch": 4.586709886547812, "grad_norm": 0.7146959989523917, "learning_rate": 1.2832389493629928e-05, "loss": 0.1502, "loss_nan_ranks": 0, "loss_rank_avg": 0.18556524813175201, "step": 2830, "valid_targets_mean": 3489.2, "valid_targets_min": 866 }, { "epoch": 4.594813614262561, "grad_norm": 0.982213080774264, "learning_rate": 1.275699378163083e-05, "loss": 0.1722, "loss_nan_ranks": 0, "loss_rank_avg": 0.20789432525634766, "step": 2835, "valid_targets_mean": 2519.7, "valid_targets_min": 328 }, { "epoch": 4.602917341977309, "grad_norm": 0.5100944274599919, "learning_rate": 1.2681716354431704e-05, "loss": 0.1586, "loss_nan_ranks": 0, "loss_rank_avg": 0.09983259439468384, "step": 2840, "valid_targets_mean": 5123.9, "valid_targets_min": 505 }, { "epoch": 4.611021069692058, "grad_norm": 0.9532072125518306, "learning_rate": 1.2606558441380587e-05, "loss": 0.1636, "loss_nan_ranks": 0, "loss_rank_avg": 0.2288963943719864, "step": 2845, "valid_targets_mean": 1986.6, "valid_targets_min": 459 }, { "epoch": 4.6191247974068075, "grad_norm": 0.7215937040297506, "learning_rate": 1.2531521269873736e-05, "loss": 0.1727, "loss_nan_ranks": 0, "loss_rank_avg": 0.18275988101959229, "step": 2850, "valid_targets_mean": 3461.2, "valid_targets_min": 865 }, { "epoch": 4.627228525121556, "grad_norm": 0.7854523287609847, "learning_rate": 1.245660606533559e-05, "loss": 0.1813, "loss_nan_ranks": 0, "loss_rank_avg": 0.2999517619609833, "step": 2855, "valid_targets_mean": 3333.9, "valid_targets_min": 710 }, { "epoch": 4.635332252836305, "grad_norm": 0.9116092627493867, "learning_rate": 1.2381814051198751e-05, "loss": 0.1384, "loss_nan_ranks": 0, "loss_rank_avg": 0.13685894012451172, "step": 2860, "valid_targets_mean": 1892.0, "valid_targets_min": 704 }, { "epoch": 4.643435980551054, "grad_norm": 2.35524174458915, "learning_rate": 1.2307146448884021e-05, "loss": 0.1625, "loss_nan_ranks": 0, "loss_rank_avg": 0.1372871696949005, "step": 2865, "valid_targets_mean": 2473.6, "valid_targets_min": 555 }, { "epoch": 4.651539708265802, "grad_norm": 0.7956965758481088, "learning_rate": 1.2232604477780445e-05, "loss": 0.1706, "loss_nan_ranks": 0, "loss_rank_avg": 0.20719727873802185, "step": 2870, "valid_targets_mean": 4660.5, "valid_targets_min": 1343 }, { "epoch": 4.659643435980551, "grad_norm": 0.7578731157658531, "learning_rate": 1.2158189355225382e-05, "loss": 0.1335, "loss_nan_ranks": 0, "loss_rank_avg": 0.16715043783187866, "step": 2875, "valid_targets_mean": 3336.8, "valid_targets_min": 1080 }, { "epoch": 4.667747163695299, "grad_norm": 0.5455735164703488, "learning_rate": 1.2083902296484659e-05, "loss": 0.164, "loss_nan_ranks": 0, "loss_rank_avg": 0.1390770971775055, "step": 2880, "valid_targets_mean": 5098.4, "valid_targets_min": 741 }, { "epoch": 4.6758508914100485, "grad_norm": 0.8754352764073323, "learning_rate": 1.2009744514732698e-05, "loss": 0.1251, "loss_nan_ranks": 0, "loss_rank_avg": 0.1272560954093933, "step": 2885, "valid_targets_mean": 1902.8, "valid_targets_min": 856 }, { "epoch": 4.683954619124798, "grad_norm": 0.7125376899744773, "learning_rate": 1.1935717221032707e-05, "loss": 0.173, "loss_nan_ranks": 0, "loss_rank_avg": 0.12357346713542938, "step": 2890, "valid_targets_mean": 3547.1, "valid_targets_min": 686 }, { "epoch": 4.692058346839546, "grad_norm": 0.9406847214639302, "learning_rate": 1.1861821624316916e-05, "loss": 0.1687, "loss_nan_ranks": 0, "loss_rank_avg": 0.1456756889820099, "step": 2895, "valid_targets_mean": 2065.8, "valid_targets_min": 974 }, { "epoch": 4.700162074554295, "grad_norm": 0.6883619788971869, "learning_rate": 1.1788058931366822e-05, "loss": 0.1541, "loss_nan_ranks": 0, "loss_rank_avg": 0.2756902575492859, "step": 2900, "valid_targets_mean": 4024.9, "valid_targets_min": 880 }, { "epoch": 4.708265802269044, "grad_norm": 0.7882633472589065, "learning_rate": 1.1714430346793479e-05, "loss": 0.1834, "loss_nan_ranks": 0, "loss_rank_avg": 0.13730135560035706, "step": 2905, "valid_targets_mean": 2645.8, "valid_targets_min": 928 }, { "epoch": 4.716369529983792, "grad_norm": 0.8885552000120186, "learning_rate": 1.1640937073017837e-05, "loss": 0.1522, "loss_nan_ranks": 0, "loss_rank_avg": 0.11991922557353973, "step": 2910, "valid_targets_mean": 2493.4, "valid_targets_min": 918 }, { "epoch": 4.724473257698541, "grad_norm": 0.9089134585480407, "learning_rate": 1.1567580310251097e-05, "loss": 0.1675, "loss_nan_ranks": 0, "loss_rank_avg": 0.16488614678382874, "step": 2915, "valid_targets_mean": 2730.6, "valid_targets_min": 571 }, { "epoch": 4.73257698541329, "grad_norm": 0.9805367472588664, "learning_rate": 1.1494361256475105e-05, "loss": 0.1403, "loss_nan_ranks": 0, "loss_rank_avg": 0.1491793394088745, "step": 2920, "valid_targets_mean": 1666.0, "valid_targets_min": 363 }, { "epoch": 4.740680713128039, "grad_norm": 0.9415315025271603, "learning_rate": 1.1421281107422804e-05, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.2649831473827362, "step": 2925, "valid_targets_mean": 2495.4, "valid_targets_min": 334 }, { "epoch": 4.748784440842788, "grad_norm": 0.7579993458608958, "learning_rate": 1.1348341056558709e-05, "loss": 0.1862, "loss_nan_ranks": 0, "loss_rank_avg": 0.21222791075706482, "step": 2930, "valid_targets_mean": 3278.5, "valid_targets_min": 807 }, { "epoch": 4.756888168557537, "grad_norm": 0.8752970421825866, "learning_rate": 1.1275542295059384e-05, "loss": 0.1518, "loss_nan_ranks": 0, "loss_rank_avg": 0.11920589953660965, "step": 2935, "valid_targets_mean": 2097.3, "valid_targets_min": 701 }, { "epoch": 4.764991896272285, "grad_norm": 0.9284513357192202, "learning_rate": 1.1202886011794023e-05, "loss": 0.1714, "loss_nan_ranks": 0, "loss_rank_avg": 0.2457813024520874, "step": 2940, "valid_targets_mean": 2385.9, "valid_targets_min": 782 }, { "epoch": 4.773095623987034, "grad_norm": 0.9398075096458122, "learning_rate": 1.1130373393305004e-05, "loss": 0.1541, "loss_nan_ranks": 0, "loss_rank_avg": 0.12277652323246002, "step": 2945, "valid_targets_mean": 2361.6, "valid_targets_min": 741 }, { "epoch": 4.781199351701783, "grad_norm": 1.1737385550719055, "learning_rate": 1.1058005623788564e-05, "loss": 0.184, "loss_nan_ranks": 0, "loss_rank_avg": 0.140442356467247, "step": 2950, "valid_targets_mean": 1775.1, "valid_targets_min": 1008 }, { "epoch": 4.789303079416531, "grad_norm": 0.8063596837128346, "learning_rate": 1.0985783885075407e-05, "loss": 0.189, "loss_nan_ranks": 0, "loss_rank_avg": 0.18340390920639038, "step": 2955, "valid_targets_mean": 2692.0, "valid_targets_min": 697 }, { "epoch": 4.7974068071312805, "grad_norm": 0.8609461611073953, "learning_rate": 1.0913709356611411e-05, "loss": 0.1328, "loss_nan_ranks": 0, "loss_rank_avg": 0.14733055233955383, "step": 2960, "valid_targets_mean": 2302.0, "valid_targets_min": 860 }, { "epoch": 4.805510534846029, "grad_norm": 0.5940642190543134, "learning_rate": 1.0841783215438406e-05, "loss": 0.1554, "loss_nan_ranks": 0, "loss_rank_avg": 0.19221073389053345, "step": 2965, "valid_targets_mean": 5023.8, "valid_targets_min": 807 }, { "epoch": 4.813614262560778, "grad_norm": 1.0256200972517306, "learning_rate": 1.07700066361749e-05, "loss": 0.1923, "loss_nan_ranks": 0, "loss_rank_avg": 0.23758450150489807, "step": 2970, "valid_targets_mean": 2783.9, "valid_targets_min": 633 }, { "epoch": 4.821717990275527, "grad_norm": 0.8057695967861453, "learning_rate": 1.0698380790996921e-05, "loss": 0.1476, "loss_nan_ranks": 0, "loss_rank_avg": 0.15349268913269043, "step": 2975, "valid_targets_mean": 3128.6, "valid_targets_min": 1141 }, { "epoch": 4.829821717990275, "grad_norm": 0.7274055955361053, "learning_rate": 1.0626906849618903e-05, "loss": 0.1469, "loss_nan_ranks": 0, "loss_rank_avg": 0.16329367458820343, "step": 2980, "valid_targets_mean": 3118.8, "valid_targets_min": 761 }, { "epoch": 4.837925445705024, "grad_norm": 0.8346294549363144, "learning_rate": 1.0555585979274513e-05, "loss": 0.2442, "loss_nan_ranks": 0, "loss_rank_avg": 0.2559146285057068, "step": 2985, "valid_targets_mean": 3082.2, "valid_targets_min": 522 }, { "epoch": 4.846029173419773, "grad_norm": 1.3240258810633323, "learning_rate": 1.0484419344697667e-05, "loss": 0.181, "loss_nan_ranks": 0, "loss_rank_avg": 0.13262823224067688, "step": 2990, "valid_targets_mean": 1733.1, "valid_targets_min": 564 }, { "epoch": 4.854132901134522, "grad_norm": 0.995006362928102, "learning_rate": 1.0413408108103445e-05, "loss": 0.1576, "loss_nan_ranks": 0, "loss_rank_avg": 0.20635709166526794, "step": 2995, "valid_targets_mean": 3296.1, "valid_targets_min": 562 }, { "epoch": 4.862236628849271, "grad_norm": 0.8460865973678914, "learning_rate": 1.0342553429169163e-05, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.11528654396533966, "step": 3000, "valid_targets_mean": 1933.8, "valid_targets_min": 607 }, { "epoch": 4.87034035656402, "grad_norm": 1.147006877758278, "learning_rate": 1.0271856465015388e-05, "loss": 0.1749, "loss_nan_ranks": 0, "loss_rank_avg": 0.18788880109786987, "step": 3005, "valid_targets_mean": 1968.5, "valid_targets_min": 626 }, { "epoch": 4.878444084278768, "grad_norm": 0.8479478722559892, "learning_rate": 1.0201318370187065e-05, "loss": 0.1495, "loss_nan_ranks": 0, "loss_rank_avg": 0.13283419609069824, "step": 3010, "valid_targets_mean": 2158.6, "valid_targets_min": 496 }, { "epoch": 4.886547811993517, "grad_norm": 0.7961067473066475, "learning_rate": 1.0130940296634683e-05, "loss": 0.148, "loss_nan_ranks": 0, "loss_rank_avg": 0.18867862224578857, "step": 3015, "valid_targets_mean": 2611.9, "valid_targets_min": 514 }, { "epoch": 4.894651539708266, "grad_norm": 1.0151300176784335, "learning_rate": 1.0060723393695411e-05, "loss": 0.1832, "loss_nan_ranks": 0, "loss_rank_avg": 0.23992988467216492, "step": 3020, "valid_targets_mean": 2529.1, "valid_targets_min": 525 }, { "epoch": 4.902755267423014, "grad_norm": 0.9733399168762327, "learning_rate": 9.990668808074378e-06, "loss": 0.1738, "loss_nan_ranks": 0, "loss_rank_avg": 0.14787709712982178, "step": 3025, "valid_targets_mean": 1709.7, "valid_targets_min": 781 }, { "epoch": 4.9108589951377635, "grad_norm": 0.72365986298008, "learning_rate": 9.920777683825906e-06, "loss": 0.1701, "loss_nan_ranks": 0, "loss_rank_avg": 0.19551479816436768, "step": 3030, "valid_targets_mean": 2936.8, "valid_targets_min": 371 }, { "epoch": 4.918962722852513, "grad_norm": 0.8027516059720535, "learning_rate": 9.851051162334871e-06, "loss": 0.1566, "loss_nan_ranks": 0, "loss_rank_avg": 0.1954280436038971, "step": 3035, "valid_targets_mean": 2570.2, "valid_targets_min": 761 }, { "epoch": 4.927066450567261, "grad_norm": 0.762963457517037, "learning_rate": 9.781490382298018e-06, "loss": 0.1348, "loss_nan_ranks": 0, "loss_rank_avg": 0.15942156314849854, "step": 3040, "valid_targets_mean": 3299.4, "valid_targets_min": 943 }, { "epoch": 4.93517017828201, "grad_norm": 0.8720989205317229, "learning_rate": 9.712096479705382e-06, "loss": 0.1447, "loss_nan_ranks": 0, "loss_rank_avg": 0.11061131954193115, "step": 3045, "valid_targets_mean": 2380.6, "valid_targets_min": 733 }, { "epoch": 4.943273905996758, "grad_norm": 0.6183829564964957, "learning_rate": 9.642870587821761e-06, "loss": 0.1486, "loss_nan_ranks": 0, "loss_rank_avg": 0.13789555430412292, "step": 3050, "valid_targets_mean": 3705.7, "valid_targets_min": 722 }, { "epoch": 4.951377633711507, "grad_norm": 0.9202251472551713, "learning_rate": 9.573813837168166e-06, "loss": 0.1666, "loss_nan_ranks": 0, "loss_rank_avg": 0.16328653693199158, "step": 3055, "valid_targets_mean": 2631.2, "valid_targets_min": 461 }, { "epoch": 4.959481361426256, "grad_norm": 0.6337283642064705, "learning_rate": 9.504927355503399e-06, "loss": 0.1594, "loss_nan_ranks": 0, "loss_rank_avg": 0.0957586020231247, "step": 3060, "valid_targets_mean": 3474.9, "valid_targets_min": 715 }, { "epoch": 4.9675850891410045, "grad_norm": 0.9004406261162295, "learning_rate": 9.436212267805591e-06, "loss": 0.1495, "loss_nan_ranks": 0, "loss_rank_avg": 0.12372364848852158, "step": 3065, "valid_targets_mean": 1903.6, "valid_targets_min": 656 }, { "epoch": 4.975688816855754, "grad_norm": 0.5981555247573468, "learning_rate": 9.367669696253885e-06, "loss": 0.2001, "loss_nan_ranks": 0, "loss_rank_avg": 0.10008936375379562, "step": 3070, "valid_targets_mean": 3947.9, "valid_targets_min": 910 }, { "epoch": 4.983792544570503, "grad_norm": 0.7429447660340368, "learning_rate": 9.299300760210059e-06, "loss": 0.1805, "loss_nan_ranks": 0, "loss_rank_avg": 0.2495230734348297, "step": 3075, "valid_targets_mean": 3267.3, "valid_targets_min": 613 }, { "epoch": 4.991896272285251, "grad_norm": 0.8545859108818904, "learning_rate": 9.231106576200268e-06, "loss": 0.1939, "loss_nan_ranks": 0, "loss_rank_avg": 0.1375666856765747, "step": 3080, "valid_targets_mean": 2512.9, "valid_targets_min": 1033 }, { "epoch": 5.0, "grad_norm": 1.0000828363963175, "learning_rate": 9.163088257896825e-06, "loss": 0.153, "loss_nan_ranks": 0, "loss_rank_avg": 0.12231343239545822, "step": 3085, "valid_targets_mean": 1496.2, "valid_targets_min": 692 }, { "epoch": 5.008103727714749, "grad_norm": 1.283136207413487, "learning_rate": 9.095246916099978e-06, "loss": 0.165, "loss_nan_ranks": 0, "loss_rank_avg": 0.16958777606487274, "step": 3090, "valid_targets_mean": 2647.4, "valid_targets_min": 582 }, { "epoch": 5.016207455429497, "grad_norm": 0.943279239764171, "learning_rate": 9.027583658719812e-06, "loss": 0.1412, "loss_nan_ranks": 0, "loss_rank_avg": 0.12485413998365402, "step": 3095, "valid_targets_mean": 1937.0, "valid_targets_min": 484 }, { "epoch": 5.024311183144246, "grad_norm": 0.8436158526907404, "learning_rate": 8.960099590758104e-06, "loss": 0.1453, "loss_nan_ranks": 0, "loss_rank_avg": 0.1455596685409546, "step": 3100, "valid_targets_mean": 2281.4, "valid_targets_min": 820 }, { "epoch": 5.0324149108589955, "grad_norm": 0.9944315406392032, "learning_rate": 8.892795814290342e-06, "loss": 0.1553, "loss_nan_ranks": 0, "loss_rank_avg": 0.19890674948692322, "step": 3105, "valid_targets_mean": 2202.4, "valid_targets_min": 754 }, { "epoch": 5.040518638573744, "grad_norm": 0.6387733217996346, "learning_rate": 8.825673428447668e-06, "loss": 0.1279, "loss_nan_ranks": 0, "loss_rank_avg": 0.13640737533569336, "step": 3110, "valid_targets_mean": 4190.6, "valid_targets_min": 698 }, { "epoch": 5.048622366288493, "grad_norm": 0.7019234673750581, "learning_rate": 8.758733529398945e-06, "loss": 0.1425, "loss_nan_ranks": 0, "loss_rank_avg": 0.09768907725811005, "step": 3115, "valid_targets_mean": 2849.2, "valid_targets_min": 862 }, { "epoch": 5.056726094003242, "grad_norm": 1.384661286889182, "learning_rate": 8.691977210332892e-06, "loss": 0.1274, "loss_nan_ranks": 0, "loss_rank_avg": 0.13747167587280273, "step": 3120, "valid_targets_mean": 2221.4, "valid_targets_min": 670 }, { "epoch": 5.06482982171799, "grad_norm": 0.930073668995111, "learning_rate": 8.625405561440172e-06, "loss": 0.1412, "loss_nan_ranks": 0, "loss_rank_avg": 0.11428385972976685, "step": 3125, "valid_targets_mean": 1706.4, "valid_targets_min": 628 }, { "epoch": 5.072933549432739, "grad_norm": 0.7331543719322425, "learning_rate": 8.559019669895648e-06, "loss": 0.1846, "loss_nan_ranks": 0, "loss_rank_avg": 0.22601112723350525, "step": 3130, "valid_targets_mean": 3574.3, "valid_targets_min": 398 }, { "epoch": 5.081037277147487, "grad_norm": 0.9113971174023665, "learning_rate": 8.492820619840563e-06, "loss": 0.1639, "loss_nan_ranks": 0, "loss_rank_avg": 0.287741094827652, "step": 3135, "valid_targets_mean": 2638.6, "valid_targets_min": 341 }, { "epoch": 5.0891410048622365, "grad_norm": 0.8833049318176625, "learning_rate": 8.426809492364907e-06, "loss": 0.1215, "loss_nan_ranks": 0, "loss_rank_avg": 0.11894373595714569, "step": 3140, "valid_targets_mean": 2332.4, "valid_targets_min": 822 }, { "epoch": 5.097244732576986, "grad_norm": 0.5946354001150366, "learning_rate": 8.360987365489698e-06, "loss": 0.1223, "loss_nan_ranks": 0, "loss_rank_avg": 0.1098465770483017, "step": 3145, "valid_targets_mean": 3904.6, "valid_targets_min": 1072 }, { "epoch": 5.105348460291734, "grad_norm": 0.8044122587163143, "learning_rate": 8.295355314149413e-06, "loss": 0.1779, "loss_nan_ranks": 0, "loss_rank_avg": 0.13747110962867737, "step": 3150, "valid_targets_mean": 2310.0, "valid_targets_min": 337 }, { "epoch": 5.113452188006483, "grad_norm": 0.5980128769879898, "learning_rate": 8.229914410174435e-06, "loss": 0.1099, "loss_nan_ranks": 0, "loss_rank_avg": 0.08813309669494629, "step": 3155, "valid_targets_mean": 3792.1, "valid_targets_min": 993 }, { "epoch": 5.121555915721232, "grad_norm": 0.622312258802971, "learning_rate": 8.16466572227352e-06, "loss": 0.1068, "loss_nan_ranks": 0, "loss_rank_avg": 0.0873100534081459, "step": 3160, "valid_targets_mean": 3185.2, "valid_targets_min": 554 }, { "epoch": 5.12965964343598, "grad_norm": 0.8954975866967348, "learning_rate": 8.099610316016373e-06, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.13367177546024323, "step": 3165, "valid_targets_mean": 2045.3, "valid_targets_min": 501 }, { "epoch": 5.137763371150729, "grad_norm": 0.8258936353394385, "learning_rate": 8.03474925381625e-06, "loss": 0.1564, "loss_nan_ranks": 0, "loss_rank_avg": 0.16128379106521606, "step": 3170, "valid_targets_mean": 3819.5, "valid_targets_min": 883 }, { "epoch": 5.145867098865478, "grad_norm": 0.9892899982440995, "learning_rate": 7.97008359491257e-06, "loss": 0.1427, "loss_nan_ranks": 0, "loss_rank_avg": 0.1371055245399475, "step": 3175, "valid_targets_mean": 1996.4, "valid_targets_min": 902 }, { "epoch": 5.153970826580227, "grad_norm": 0.9178033916752635, "learning_rate": 7.905614395353649e-06, "loss": 0.1424, "loss_nan_ranks": 0, "loss_rank_avg": 0.13662882149219513, "step": 3180, "valid_targets_mean": 2094.7, "valid_targets_min": 269 }, { "epoch": 5.162074554294976, "grad_norm": 0.9445719514300331, "learning_rate": 7.841342707979442e-06, "loss": 0.1703, "loss_nan_ranks": 0, "loss_rank_avg": 0.30393123626708984, "step": 3185, "valid_targets_mean": 3291.1, "valid_targets_min": 862 }, { "epoch": 5.170178282009725, "grad_norm": 0.7306623592816158, "learning_rate": 7.77726958240437e-06, "loss": 0.1444, "loss_nan_ranks": 0, "loss_rank_avg": 0.100005142390728, "step": 3190, "valid_targets_mean": 2373.6, "valid_targets_min": 1047 }, { "epoch": 5.178282009724473, "grad_norm": 0.5681715595432818, "learning_rate": 7.713396065000133e-06, "loss": 0.1664, "loss_nan_ranks": 0, "loss_rank_avg": 0.16320055723190308, "step": 3195, "valid_targets_mean": 5024.4, "valid_targets_min": 936 }, { "epoch": 5.186385737439222, "grad_norm": 0.9141392131056238, "learning_rate": 7.649723198878676e-06, "loss": 0.13, "loss_nan_ranks": 0, "loss_rank_avg": 0.17028486728668213, "step": 3200, "valid_targets_mean": 2462.1, "valid_targets_min": 855 }, { "epoch": 5.194489465153971, "grad_norm": 1.0211463763575084, "learning_rate": 7.586252023875125e-06, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.13707610964775085, "step": 3205, "valid_targets_mean": 1633.6, "valid_targets_min": 501 }, { "epoch": 5.2025931928687195, "grad_norm": 0.9857389473887078, "learning_rate": 7.522983576530791e-06, "loss": 0.1549, "loss_nan_ranks": 0, "loss_rank_avg": 0.1323859989643097, "step": 3210, "valid_targets_mean": 1957.2, "valid_targets_min": 550 }, { "epoch": 5.210696920583469, "grad_norm": 1.0143771026388138, "learning_rate": 7.459918890076272e-06, "loss": 0.1464, "loss_nan_ranks": 0, "loss_rank_avg": 0.16915765404701233, "step": 3215, "valid_targets_mean": 3357.4, "valid_targets_min": 689 }, { "epoch": 5.218800648298217, "grad_norm": 0.8291361309836706, "learning_rate": 7.397058994414563e-06, "loss": 0.1304, "loss_nan_ranks": 0, "loss_rank_avg": 0.18082496523857117, "step": 3220, "valid_targets_mean": 2756.2, "valid_targets_min": 1082 }, { "epoch": 5.226904376012966, "grad_norm": 0.6737718264710545, "learning_rate": 7.3344049161042495e-06, "loss": 0.1324, "loss_nan_ranks": 0, "loss_rank_avg": 0.14597007632255554, "step": 3225, "valid_targets_mean": 4198.1, "valid_targets_min": 1181 }, { "epoch": 5.235008103727715, "grad_norm": 0.6961828666596263, "learning_rate": 7.271957678342738e-06, "loss": 0.1605, "loss_nan_ranks": 0, "loss_rank_avg": 0.07819020748138428, "step": 3230, "valid_targets_mean": 2952.6, "valid_targets_min": 601 }, { "epoch": 5.243111831442463, "grad_norm": 1.2860828286107657, "learning_rate": 7.209718300949519e-06, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.11555998027324677, "step": 3235, "valid_targets_mean": 2056.3, "valid_targets_min": 974 }, { "epoch": 5.251215559157212, "grad_norm": 0.6896094917138008, "learning_rate": 7.14768780034957e-06, "loss": 0.1518, "loss_nan_ranks": 0, "loss_rank_avg": 0.18422646820545197, "step": 3240, "valid_targets_mean": 3863.6, "valid_targets_min": 954 }, { "epoch": 5.259319286871961, "grad_norm": 0.8253153069121804, "learning_rate": 7.085867189556697e-06, "loss": 0.2144, "loss_nan_ranks": 0, "loss_rank_avg": 0.20815926790237427, "step": 3245, "valid_targets_mean": 3034.3, "valid_targets_min": 786 }, { "epoch": 5.26742301458671, "grad_norm": 0.7086894492399584, "learning_rate": 7.024257478157015e-06, "loss": 0.1555, "loss_nan_ranks": 0, "loss_rank_avg": 0.10221417248249054, "step": 3250, "valid_targets_mean": 3288.2, "valid_targets_min": 1042 }, { "epoch": 5.275526742301459, "grad_norm": 0.5798277120600573, "learning_rate": 6.96285967229249e-06, "loss": 0.1591, "loss_nan_ranks": 0, "loss_rank_avg": 0.14061783254146576, "step": 3255, "valid_targets_mean": 5321.4, "valid_targets_min": 632 }, { "epoch": 5.283630470016208, "grad_norm": 0.6297473245719093, "learning_rate": 6.901674774644449e-06, "loss": 0.1113, "loss_nan_ranks": 0, "loss_rank_avg": 0.09192270785570145, "step": 3260, "valid_targets_mean": 3162.9, "valid_targets_min": 722 }, { "epoch": 5.291734197730956, "grad_norm": 0.655326604774191, "learning_rate": 6.840703784417262e-06, "loss": 0.1477, "loss_nan_ranks": 0, "loss_rank_avg": 0.1667039543390274, "step": 3265, "valid_targets_mean": 3882.1, "valid_targets_min": 910 }, { "epoch": 5.299837925445705, "grad_norm": 0.9464717792115727, "learning_rate": 6.779947697321974e-06, "loss": 0.1328, "loss_nan_ranks": 0, "loss_rank_avg": 0.11113858968019485, "step": 3270, "valid_targets_mean": 2199.8, "valid_targets_min": 342 }, { "epoch": 5.307941653160454, "grad_norm": 0.8508764069285351, "learning_rate": 6.719407505560094e-06, "loss": 0.1571, "loss_nan_ranks": 0, "loss_rank_avg": 0.14729882776737213, "step": 3275, "valid_targets_mean": 2665.4, "valid_targets_min": 1089 }, { "epoch": 5.316045380875202, "grad_norm": 1.03542912623809, "learning_rate": 6.659084197807348e-06, "loss": 0.1997, "loss_nan_ranks": 0, "loss_rank_avg": 0.4161680340766907, "step": 3280, "valid_targets_mean": 4139.7, "valid_targets_min": 656 }, { "epoch": 5.3241491085899515, "grad_norm": 0.8555285929048103, "learning_rate": 6.598978759197554e-06, "loss": 0.119, "loss_nan_ranks": 0, "loss_rank_avg": 0.19164308905601501, "step": 3285, "valid_targets_mean": 2472.9, "valid_targets_min": 488 }, { "epoch": 5.332252836304701, "grad_norm": 0.7884153355344533, "learning_rate": 6.539092171306541e-06, "loss": 0.1166, "loss_nan_ranks": 0, "loss_rank_avg": 0.13263387978076935, "step": 3290, "valid_targets_mean": 2924.2, "valid_targets_min": 873 }, { "epoch": 5.340356564019449, "grad_norm": 0.7139375465777716, "learning_rate": 6.479425412136093e-06, "loss": 0.1412, "loss_nan_ranks": 0, "loss_rank_avg": 0.08301765471696854, "step": 3295, "valid_targets_mean": 3015.2, "valid_targets_min": 456 }, { "epoch": 5.348460291734198, "grad_norm": 0.8136742499601274, "learning_rate": 6.419979456098016e-06, "loss": 0.1349, "loss_nan_ranks": 0, "loss_rank_avg": 0.0914689153432846, "step": 3300, "valid_targets_mean": 2395.7, "valid_targets_min": 471 }, { "epoch": 5.356564019448946, "grad_norm": 0.8426989185718268, "learning_rate": 6.360755273998174e-06, "loss": 0.1761, "loss_nan_ranks": 0, "loss_rank_avg": 0.18558555841445923, "step": 3305, "valid_targets_mean": 3175.8, "valid_targets_min": 426 }, { "epoch": 5.364667747163695, "grad_norm": 0.7043825571960722, "learning_rate": 6.301753833020691e-06, "loss": 0.1404, "loss_nan_ranks": 0, "loss_rank_avg": 0.185553640127182, "step": 3310, "valid_targets_mean": 3304.7, "valid_targets_min": 863 }, { "epoch": 5.372771474878444, "grad_norm": 0.9549981037856647, "learning_rate": 6.242976096712112e-06, "loss": 0.1597, "loss_nan_ranks": 0, "loss_rank_avg": 0.22695674002170563, "step": 3315, "valid_targets_mean": 2425.8, "valid_targets_min": 334 }, { "epoch": 5.3808752025931925, "grad_norm": 0.8195898613602235, "learning_rate": 6.18442302496568e-06, "loss": 0.1695, "loss_nan_ranks": 0, "loss_rank_avg": 0.13929906487464905, "step": 3320, "valid_targets_mean": 2468.8, "valid_targets_min": 524 }, { "epoch": 5.388978930307942, "grad_norm": 1.029682002666224, "learning_rate": 6.1260955740056835e-06, "loss": 0.1347, "loss_nan_ranks": 0, "loss_rank_avg": 0.1550445258617401, "step": 3325, "valid_targets_mean": 2025.9, "valid_targets_min": 1103 }, { "epoch": 5.397082658022691, "grad_norm": 1.1169106309979446, "learning_rate": 6.067994696371797e-06, "loss": 0.1246, "loss_nan_ranks": 0, "loss_rank_avg": 0.15255971252918243, "step": 3330, "valid_targets_mean": 2080.6, "valid_targets_min": 1215 }, { "epoch": 5.405186385737439, "grad_norm": 0.8850686193118384, "learning_rate": 6.010121340903574e-06, "loss": 0.1224, "loss_nan_ranks": 0, "loss_rank_avg": 0.1398320496082306, "step": 3335, "valid_targets_mean": 2204.1, "valid_targets_min": 882 }, { "epoch": 5.413290113452188, "grad_norm": 0.6189940261103392, "learning_rate": 5.952476452724898e-06, "loss": 0.1416, "loss_nan_ranks": 0, "loss_rank_avg": 0.10511147975921631, "step": 3340, "valid_targets_mean": 3397.1, "valid_targets_min": 536 }, { "epoch": 5.421393841166937, "grad_norm": 0.7869848129875665, "learning_rate": 5.895060973228606e-06, "loss": 0.1406, "loss_nan_ranks": 0, "loss_rank_avg": 0.17136400938034058, "step": 3345, "valid_targets_mean": 3590.9, "valid_targets_min": 216 }, { "epoch": 5.429497568881685, "grad_norm": 0.9786557729553311, "learning_rate": 5.837875840061064e-06, "loss": 0.1352, "loss_nan_ranks": 0, "loss_rank_avg": 0.12982967495918274, "step": 3350, "valid_targets_mean": 1677.5, "valid_targets_min": 514 }, { "epoch": 5.437601296596434, "grad_norm": 0.8317312217862712, "learning_rate": 5.780921987106878e-06, "loss": 0.136, "loss_nan_ranks": 0, "loss_rank_avg": 0.12355664372444153, "step": 3355, "valid_targets_mean": 2306.0, "valid_targets_min": 950 }, { "epoch": 5.4457050243111835, "grad_norm": 0.7338499031126493, "learning_rate": 5.724200344473651e-06, "loss": 0.1584, "loss_nan_ranks": 0, "loss_rank_avg": 0.19103437662124634, "step": 3360, "valid_targets_mean": 3675.8, "valid_targets_min": 949 }, { "epoch": 5.453808752025932, "grad_norm": 0.6656448002153311, "learning_rate": 5.66771183847677e-06, "loss": 0.1301, "loss_nan_ranks": 0, "loss_rank_avg": 0.09611663967370987, "step": 3365, "valid_targets_mean": 2633.0, "valid_targets_min": 612 }, { "epoch": 5.461912479740681, "grad_norm": 1.0874356250956578, "learning_rate": 5.611457391624309e-06, "loss": 0.1322, "loss_nan_ranks": 0, "loss_rank_avg": 0.15315888822078705, "step": 3370, "valid_targets_mean": 3031.9, "valid_targets_min": 472 }, { "epoch": 5.47001620745543, "grad_norm": 1.0445039076091298, "learning_rate": 5.555437922601918e-06, "loss": 0.1829, "loss_nan_ranks": 0, "loss_rank_avg": 0.16164973378181458, "step": 3375, "valid_targets_mean": 1917.6, "valid_targets_min": 514 }, { "epoch": 5.478119935170178, "grad_norm": 0.8104164724449195, "learning_rate": 5.499654346257879e-06, "loss": 0.1359, "loss_nan_ranks": 0, "loss_rank_avg": 0.12006053328514099, "step": 3380, "valid_targets_mean": 2426.0, "valid_targets_min": 901 }, { "epoch": 5.486223662884927, "grad_norm": 0.7493612429318233, "learning_rate": 5.444107573588116e-06, "loss": 0.1917, "loss_nan_ranks": 0, "loss_rank_avg": 0.1710258424282074, "step": 3385, "valid_targets_mean": 3943.8, "valid_targets_min": 594 }, { "epoch": 5.4943273905996755, "grad_norm": 0.893693814456575, "learning_rate": 5.388798511721329e-06, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.19235970079898834, "step": 3390, "valid_targets_mean": 2304.8, "valid_targets_min": 487 }, { "epoch": 5.5024311183144246, "grad_norm": 0.9281024443148513, "learning_rate": 5.333728063904213e-06, "loss": 0.139, "loss_nan_ranks": 0, "loss_rank_avg": 0.13582965731620789, "step": 3395, "valid_targets_mean": 3602.9, "valid_targets_min": 754 }, { "epoch": 5.510534846029174, "grad_norm": 0.7276815688419767, "learning_rate": 5.278897129486656e-06, "loss": 0.1885, "loss_nan_ranks": 0, "loss_rank_avg": 0.13215868175029755, "step": 3400, "valid_targets_mean": 3562.9, "valid_targets_min": 945 }, { "epoch": 5.518638573743922, "grad_norm": 0.8662128457006715, "learning_rate": 5.224306603907095e-06, "loss": 0.1703, "loss_nan_ranks": 0, "loss_rank_avg": 0.12716642022132874, "step": 3405, "valid_targets_mean": 2820.1, "valid_targets_min": 929 }, { "epoch": 5.526742301458671, "grad_norm": 0.7807235589640765, "learning_rate": 5.169957378677859e-06, "loss": 0.1258, "loss_nan_ranks": 0, "loss_rank_avg": 0.1254601776599884, "step": 3410, "valid_targets_mean": 2691.8, "valid_targets_min": 978 }, { "epoch": 5.53484602917342, "grad_norm": 0.7560906227588559, "learning_rate": 5.11585034137064e-06, "loss": 0.1318, "loss_nan_ranks": 0, "loss_rank_avg": 0.23728054761886597, "step": 3415, "valid_targets_mean": 3586.0, "valid_targets_min": 656 }, { "epoch": 5.542949756888168, "grad_norm": 1.102731743141789, "learning_rate": 5.061986375601977e-06, "loss": 0.1495, "loss_nan_ranks": 0, "loss_rank_avg": 0.13842478394508362, "step": 3420, "valid_targets_mean": 1943.7, "valid_targets_min": 645 }, { "epoch": 5.551053484602917, "grad_norm": 0.7825513713620168, "learning_rate": 5.0083663610188215e-06, "loss": 0.1298, "loss_nan_ranks": 0, "loss_rank_avg": 0.11432783305644989, "step": 3425, "valid_targets_mean": 2848.9, "valid_targets_min": 740 }, { "epoch": 5.5591572123176665, "grad_norm": 0.9134357132489729, "learning_rate": 4.954991173284207e-06, "loss": 0.1461, "loss_nan_ranks": 0, "loss_rank_avg": 0.16197806596755981, "step": 3430, "valid_targets_mean": 2609.7, "valid_targets_min": 677 }, { "epoch": 5.567260940032415, "grad_norm": 0.9586959035897938, "learning_rate": 4.901861684062899e-06, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.11932115256786346, "step": 3435, "valid_targets_mean": 2300.0, "valid_targets_min": 652 }, { "epoch": 5.575364667747164, "grad_norm": 0.9077572994362951, "learning_rate": 4.848978761007206e-06, "loss": 0.1211, "loss_nan_ranks": 0, "loss_rank_avg": 0.15258963406085968, "step": 3440, "valid_targets_mean": 2265.6, "valid_targets_min": 932 }, { "epoch": 5.583468395461912, "grad_norm": 1.1023316942136527, "learning_rate": 4.796343267742782e-06, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.14780212938785553, "step": 3445, "valid_targets_mean": 1948.9, "valid_targets_min": 841 }, { "epoch": 5.591572123176661, "grad_norm": 0.7251051495316837, "learning_rate": 4.743956063854529e-06, "loss": 0.1311, "loss_nan_ranks": 0, "loss_rank_avg": 0.09377004206180573, "step": 3450, "valid_targets_mean": 2942.9, "valid_targets_min": 811 }, { "epoch": 5.59967585089141, "grad_norm": 0.8488916792785556, "learning_rate": 4.691818004872557e-06, "loss": 0.1671, "loss_nan_ranks": 0, "loss_rank_avg": 0.12640199065208435, "step": 3455, "valid_targets_mean": 2410.6, "valid_targets_min": 972 }, { "epoch": 5.607779578606159, "grad_norm": 0.8737493446227516, "learning_rate": 4.639929942258217e-06, "loss": 0.1383, "loss_nan_ranks": 0, "loss_rank_avg": 0.11130397021770477, "step": 3460, "valid_targets_mean": 1994.3, "valid_targets_min": 742 }, { "epoch": 5.6158833063209075, "grad_norm": 0.8723045293450462, "learning_rate": 4.588292723390204e-06, "loss": 0.1462, "loss_nan_ranks": 0, "loss_rank_avg": 0.18794122338294983, "step": 3465, "valid_targets_mean": 2340.5, "valid_targets_min": 626 }, { "epoch": 5.623987034035657, "grad_norm": 0.9131558045501164, "learning_rate": 4.536907191550694e-06, "loss": 0.1385, "loss_nan_ranks": 0, "loss_rank_avg": 0.18654656410217285, "step": 3470, "valid_targets_mean": 3264.6, "valid_targets_min": 940 }, { "epoch": 5.632090761750405, "grad_norm": 0.7832447854160407, "learning_rate": 4.4857741859116024e-06, "loss": 0.1428, "loss_nan_ranks": 0, "loss_rank_avg": 0.10856875032186508, "step": 3475, "valid_targets_mean": 4026.0, "valid_targets_min": 828 }, { "epoch": 5.640194489465154, "grad_norm": 0.9603685340587842, "learning_rate": 4.434894541520862e-06, "loss": 0.1285, "loss_nan_ranks": 0, "loss_rank_avg": 0.12167471647262573, "step": 3480, "valid_targets_mean": 2858.6, "valid_targets_min": 681 }, { "epoch": 5.648298217179903, "grad_norm": 0.8143816562047289, "learning_rate": 4.3842690892887795e-06, "loss": 0.1283, "loss_nan_ranks": 0, "loss_rank_avg": 0.11910448223352432, "step": 3485, "valid_targets_mean": 2518.2, "valid_targets_min": 883 }, { "epoch": 5.656401944894651, "grad_norm": 1.0269959031972293, "learning_rate": 4.333898655974484e-06, "loss": 0.1366, "loss_nan_ranks": 0, "loss_rank_avg": 0.13059552013874054, "step": 3490, "valid_targets_mean": 2272.3, "valid_targets_min": 565 }, { "epoch": 5.6645056726094, "grad_norm": 0.8493579524196188, "learning_rate": 4.283784064172405e-06, "loss": 0.147, "loss_nan_ranks": 0, "loss_rank_avg": 0.23569592833518982, "step": 3495, "valid_targets_mean": 2847.4, "valid_targets_min": 549 }, { "epoch": 5.672609400324149, "grad_norm": 1.0045947500475891, "learning_rate": 4.233926132298867e-06, "loss": 0.1636, "loss_nan_ranks": 0, "loss_rank_avg": 0.12646427750587463, "step": 3500, "valid_targets_mean": 1906.7, "valid_targets_min": 724 }, { "epoch": 5.680713128038898, "grad_norm": 1.4216952442247126, "learning_rate": 4.1843256745787e-06, "loss": 0.1444, "loss_nan_ranks": 0, "loss_rank_avg": 0.18572121858596802, "step": 3505, "valid_targets_mean": 1459.9, "valid_targets_min": 544 }, { "epoch": 5.688816855753647, "grad_norm": 0.9002937899719397, "learning_rate": 4.134983501031942e-06, "loss": 0.1033, "loss_nan_ranks": 0, "loss_rank_avg": 0.11701390147209167, "step": 3510, "valid_targets_mean": 2314.2, "valid_targets_min": 776 }, { "epoch": 5.696920583468396, "grad_norm": 0.8596504160989296, "learning_rate": 4.085900417460633e-06, "loss": 0.1749, "loss_nan_ranks": 0, "loss_rank_avg": 0.15798306465148926, "step": 3515, "valid_targets_mean": 2459.4, "valid_targets_min": 1225 }, { "epoch": 5.705024311183144, "grad_norm": 1.0572710496515947, "learning_rate": 4.037077225435628e-06, "loss": 0.1485, "loss_nan_ranks": 0, "loss_rank_avg": 0.14602217078208923, "step": 3520, "valid_targets_mean": 1989.2, "valid_targets_min": 645 }, { "epoch": 5.713128038897893, "grad_norm": 0.5224530736412875, "learning_rate": 3.988514722283523e-06, "loss": 0.1553, "loss_nan_ranks": 0, "loss_rank_avg": 0.0725245401263237, "step": 3525, "valid_targets_mean": 3406.3, "valid_targets_min": 553 }, { "epoch": 5.721231766612641, "grad_norm": 0.9644662300746688, "learning_rate": 3.940213701073636e-06, "loss": 0.1119, "loss_nan_ranks": 0, "loss_rank_avg": 0.10431959480047226, "step": 3530, "valid_targets_mean": 1862.7, "valid_targets_min": 1094 }, { "epoch": 5.72933549432739, "grad_norm": 0.6423940525393956, "learning_rate": 3.892174950605039e-06, "loss": 0.1221, "loss_nan_ranks": 0, "loss_rank_avg": 0.0762447863817215, "step": 3535, "valid_targets_mean": 2733.1, "valid_targets_min": 737 }, { "epoch": 5.7374392220421395, "grad_norm": 1.0504974617543583, "learning_rate": 3.844399255393705e-06, "loss": 0.1272, "loss_nan_ranks": 0, "loss_rank_avg": 0.12259531021118164, "step": 3540, "valid_targets_mean": 2066.3, "valid_targets_min": 509 }, { "epoch": 5.745542949756889, "grad_norm": 1.0177720813084683, "learning_rate": 3.7968873956596563e-06, "loss": 0.1244, "loss_nan_ranks": 0, "loss_rank_avg": 0.18689052760601044, "step": 3545, "valid_targets_mean": 2081.0, "valid_targets_min": 812 }, { "epoch": 5.753646677471637, "grad_norm": 1.081526403816516, "learning_rate": 3.749640147314264e-06, "loss": 0.1412, "loss_nan_ranks": 0, "loss_rank_avg": 0.15227672457695007, "step": 3550, "valid_targets_mean": 1617.8, "valid_targets_min": 450 }, { "epoch": 5.761750405186386, "grad_norm": 1.281386145306865, "learning_rate": 3.7026582819475443e-06, "loss": 0.1336, "loss_nan_ranks": 0, "loss_rank_avg": 0.1037423312664032, "step": 3555, "valid_targets_mean": 1829.5, "valid_targets_min": 694 }, { "epoch": 5.769854132901134, "grad_norm": 1.166110176855929, "learning_rate": 3.6559425668155733e-06, "loss": 0.1227, "loss_nan_ranks": 0, "loss_rank_avg": 0.11849828064441681, "step": 3560, "valid_targets_mean": 2195.3, "valid_targets_min": 759 }, { "epoch": 5.777957860615883, "grad_norm": 0.5899092092985859, "learning_rate": 3.6094937648279647e-06, "loss": 0.162, "loss_nan_ranks": 0, "loss_rank_avg": 0.10452926158905029, "step": 3565, "valid_targets_mean": 3788.1, "valid_targets_min": 778 }, { "epoch": 5.786061588330632, "grad_norm": 0.6076238022877796, "learning_rate": 3.563312634535383e-06, "loss": 0.1428, "loss_nan_ranks": 0, "loss_rank_avg": 0.09219780564308167, "step": 3570, "valid_targets_mean": 4160.1, "valid_targets_min": 893 }, { "epoch": 5.7941653160453805, "grad_norm": 0.9424647522354361, "learning_rate": 3.517399930117196e-06, "loss": 0.1605, "loss_nan_ranks": 0, "loss_rank_avg": 0.13615809381008148, "step": 3575, "valid_targets_mean": 2198.9, "valid_targets_min": 866 }, { "epoch": 5.80226904376013, "grad_norm": 0.5696560681892507, "learning_rate": 3.4717564013691087e-06, "loss": 0.1521, "loss_nan_ranks": 0, "loss_rank_avg": 0.11359340697526932, "step": 3580, "valid_targets_mean": 5013.9, "valid_targets_min": 968 }, { "epoch": 5.810372771474879, "grad_norm": 0.8141064051451715, "learning_rate": 3.4263827936909744e-06, "loss": 0.1713, "loss_nan_ranks": 0, "loss_rank_avg": 0.12475259602069855, "step": 3585, "valid_targets_mean": 2504.2, "valid_targets_min": 806 }, { "epoch": 5.818476499189627, "grad_norm": 0.5674431699647517, "learning_rate": 3.38127984807457e-06, "loss": 0.112, "loss_nan_ranks": 0, "loss_rank_avg": 0.09661044925451279, "step": 3590, "valid_targets_mean": 4857.5, "valid_targets_min": 834 }, { "epoch": 5.826580226904376, "grad_norm": 0.7103962514018813, "learning_rate": 3.3364483010915237e-06, "loss": 0.1581, "loss_nan_ranks": 0, "loss_rank_avg": 0.12006492912769318, "step": 3595, "valid_targets_mean": 3394.4, "valid_targets_min": 644 }, { "epoch": 5.834683954619125, "grad_norm": 0.9765118903364278, "learning_rate": 3.2918888848812913e-06, "loss": 0.1362, "loss_nan_ranks": 0, "loss_rank_avg": 0.18907558917999268, "step": 3600, "valid_targets_mean": 2537.3, "valid_targets_min": 232 }, { "epoch": 5.842787682333873, "grad_norm": 0.6452405236633486, "learning_rate": 3.2476023271391698e-06, "loss": 0.1265, "loss_nan_ranks": 0, "loss_rank_avg": 0.10429327189922333, "step": 3605, "valid_targets_mean": 3199.5, "valid_targets_min": 912 }, { "epoch": 5.8508914100486225, "grad_norm": 0.9704787354907897, "learning_rate": 3.2035893511044524e-06, "loss": 0.1271, "loss_nan_ranks": 0, "loss_rank_avg": 0.12537583708763123, "step": 3610, "valid_targets_mean": 2012.1, "valid_targets_min": 505 }, { "epoch": 5.858995137763371, "grad_norm": 1.0125575644527998, "learning_rate": 3.159850675548577e-06, "loss": 0.1254, "loss_nan_ranks": 0, "loss_rank_avg": 0.13451366126537323, "step": 3615, "valid_targets_mean": 2137.6, "valid_targets_min": 844 }, { "epoch": 5.86709886547812, "grad_norm": 0.5958492150298547, "learning_rate": 3.116387014763429e-06, "loss": 0.1595, "loss_nan_ranks": 0, "loss_rank_avg": 0.18298457562923431, "step": 3620, "valid_targets_mean": 4842.6, "valid_targets_min": 1062 }, { "epoch": 5.875202593192869, "grad_norm": 0.9194613793350569, "learning_rate": 3.073199078549638e-06, "loss": 0.1568, "loss_nan_ranks": 0, "loss_rank_avg": 0.14356893301010132, "step": 3625, "valid_targets_mean": 2403.4, "valid_targets_min": 769 }, { "epoch": 5.883306320907618, "grad_norm": 0.7587379022022571, "learning_rate": 3.0302875722050064e-06, "loss": 0.1568, "loss_nan_ranks": 0, "loss_rank_avg": 0.19144773483276367, "step": 3630, "valid_targets_mean": 3720.6, "valid_targets_min": 742 }, { "epoch": 5.891410048622366, "grad_norm": 0.757032598883858, "learning_rate": 2.987653196513003e-06, "loss": 0.1683, "loss_nan_ranks": 0, "loss_rank_avg": 0.10905779898166656, "step": 3635, "valid_targets_mean": 2983.9, "valid_targets_min": 404 }, { "epoch": 5.899513776337115, "grad_norm": 0.84410146266729, "learning_rate": 2.9452966477312815e-06, "loss": 0.1393, "loss_nan_ranks": 0, "loss_rank_avg": 0.12055391073226929, "step": 3640, "valid_targets_mean": 2604.8, "valid_targets_min": 953 }, { "epoch": 5.9076175040518635, "grad_norm": 0.6912606615140152, "learning_rate": 2.9032186175803545e-06, "loss": 0.147, "loss_nan_ranks": 0, "loss_rank_avg": 0.231064572930336, "step": 3645, "valid_targets_mean": 4160.1, "valid_targets_min": 589 }, { "epoch": 5.915721231766613, "grad_norm": 0.9150252191276331, "learning_rate": 2.8614197932322585e-06, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.14955416321754456, "step": 3650, "valid_targets_mean": 2538.5, "valid_targets_min": 1130 }, { "epoch": 5.923824959481362, "grad_norm": 1.0537159718577105, "learning_rate": 2.819900857299358e-06, "loss": 0.1196, "loss_nan_ranks": 0, "loss_rank_avg": 0.12648676335811615, "step": 3655, "valid_targets_mean": 1749.5, "valid_targets_min": 551 }, { "epoch": 5.93192868719611, "grad_norm": 0.9562074384683694, "learning_rate": 2.778662487823187e-06, "loss": 0.1226, "loss_nan_ranks": 0, "loss_rank_avg": 0.11901277303695679, "step": 3660, "valid_targets_mean": 3005.4, "valid_targets_min": 885 }, { "epoch": 5.940032414910859, "grad_norm": 0.9786475511741156, "learning_rate": 2.7377053582633652e-06, "loss": 0.1559, "loss_nan_ranks": 0, "loss_rank_avg": 0.1406671404838562, "step": 3665, "valid_targets_mean": 2011.9, "valid_targets_min": 746 }, { "epoch": 5.948136142625608, "grad_norm": 0.780480994666007, "learning_rate": 2.6970301374866337e-06, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.15554064512252808, "step": 3670, "valid_targets_mean": 2561.8, "valid_targets_min": 697 }, { "epoch": 5.956239870340356, "grad_norm": 0.6847569982772912, "learning_rate": 2.656637489755889e-06, "loss": 0.107, "loss_nan_ranks": 0, "loss_rank_avg": 0.08473924547433853, "step": 3675, "valid_targets_mean": 2566.4, "valid_targets_min": 617 }, { "epoch": 5.964343598055105, "grad_norm": 1.1663803129546406, "learning_rate": 2.616528074719371e-06, "loss": 0.148, "loss_nan_ranks": 0, "loss_rank_avg": 0.16240835189819336, "step": 3680, "valid_targets_mean": 1863.8, "valid_targets_min": 735 }, { "epoch": 5.9724473257698545, "grad_norm": 1.0505470362211855, "learning_rate": 2.576702547399863e-06, "loss": 0.1137, "loss_nan_ranks": 0, "loss_rank_avg": 0.11963564902544022, "step": 3685, "valid_targets_mean": 2972.6, "valid_targets_min": 924 }, { "epoch": 5.980551053484603, "grad_norm": 0.6153132292802707, "learning_rate": 2.53716155818402e-06, "loss": 0.1199, "loss_nan_ranks": 0, "loss_rank_avg": 0.10222367942333221, "step": 3690, "valid_targets_mean": 3769.6, "valid_targets_min": 496 }, { "epoch": 5.988654781199352, "grad_norm": 0.7706022269958611, "learning_rate": 2.49790575281172e-06, "loss": 0.1483, "loss_nan_ranks": 0, "loss_rank_avg": 0.10004860907793045, "step": 3695, "valid_targets_mean": 4118.3, "valid_targets_min": 461 }, { "epoch": 5.9967585089141, "grad_norm": 1.1497778298396315, "learning_rate": 2.4589357723655405e-06, "loss": 0.1159, "loss_nan_ranks": 0, "loss_rank_avg": 0.12909851968288422, "step": 3700, "valid_targets_mean": 1985.4, "valid_targets_min": 912 }, { "epoch": 6.004862236628849, "grad_norm": 0.8065263620717076, "learning_rate": 2.4202522532602846e-06, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.12583133578300476, "step": 3705, "valid_targets_mean": 2561.8, "valid_targets_min": 706 }, { "epoch": 6.012965964343598, "grad_norm": 0.47440335088604885, "learning_rate": 2.381855827232571e-06, "loss": 0.1023, "loss_nan_ranks": 0, "loss_rank_avg": 0.08017963171005249, "step": 3710, "valid_targets_mean": 4353.3, "valid_targets_min": 232 }, { "epoch": 6.021069692058346, "grad_norm": 0.8208816345120449, "learning_rate": 2.343747121330544e-06, "loss": 0.1576, "loss_nan_ranks": 0, "loss_rank_avg": 0.12535922229290009, "step": 3715, "valid_targets_mean": 2856.1, "valid_targets_min": 941 }, { "epoch": 6.0291734197730955, "grad_norm": 0.7429830314090826, "learning_rate": 2.3059267579036183e-06, "loss": 0.1217, "loss_nan_ranks": 0, "loss_rank_avg": 0.10140064358711243, "step": 3720, "valid_targets_mean": 3342.2, "valid_targets_min": 1157 }, { "epoch": 6.037277147487845, "grad_norm": 0.5938762525392249, "learning_rate": 2.268395354592312e-06, "loss": 0.1442, "loss_nan_ranks": 0, "loss_rank_avg": 0.11517813801765442, "step": 3725, "valid_targets_mean": 5581.0, "valid_targets_min": 232 }, { "epoch": 6.045380875202593, "grad_norm": 0.8583542985755236, "learning_rate": 2.2311535243181637e-06, "loss": 0.1634, "loss_nan_ranks": 0, "loss_rank_avg": 0.2661886513233185, "step": 3730, "valid_targets_mean": 3863.1, "valid_targets_min": 443 }, { "epoch": 6.053484602917342, "grad_norm": 0.8438682223939366, "learning_rate": 2.1942018752737227e-06, "loss": 0.121, "loss_nan_ranks": 0, "loss_rank_avg": 0.08933848142623901, "step": 3735, "valid_targets_mean": 2379.1, "valid_targets_min": 929 }, { "epoch": 6.061588330632091, "grad_norm": 0.4750345988672662, "learning_rate": 2.1575410109126293e-06, "loss": 0.1062, "loss_nan_ranks": 0, "loss_rank_avg": 0.07867272198200226, "step": 3740, "valid_targets_mean": 5703.2, "valid_targets_min": 767 }, { "epoch": 6.069692058346839, "grad_norm": 0.7820914107075465, "learning_rate": 2.121171529939734e-06, "loss": 0.1316, "loss_nan_ranks": 0, "loss_rank_avg": 0.15075111389160156, "step": 3745, "valid_targets_mean": 3570.4, "valid_targets_min": 763 }, { "epoch": 6.077795786061588, "grad_norm": 0.7594471532290356, "learning_rate": 2.085094026301349e-06, "loss": 0.1173, "loss_nan_ranks": 0, "loss_rank_avg": 0.20603245496749878, "step": 3750, "valid_targets_mean": 3489.7, "valid_targets_min": 968 }, { "epoch": 6.085899513776337, "grad_norm": 0.6047064426773207, "learning_rate": 2.0493090891755262e-06, "loss": 0.1361, "loss_nan_ranks": 0, "loss_rank_avg": 0.07911926507949829, "step": 3755, "valid_targets_mean": 3143.4, "valid_targets_min": 973 }, { "epoch": 6.094003241491086, "grad_norm": 0.5079708101672858, "learning_rate": 2.013817302962444e-06, "loss": 0.1252, "loss_nan_ranks": 0, "loss_rank_avg": 0.17122353613376617, "step": 3760, "valid_targets_mean": 6064.8, "valid_targets_min": 1526 }, { "epoch": 6.102106969205835, "grad_norm": 0.8625230922660629, "learning_rate": 1.9786192472748643e-06, "loss": 0.1475, "loss_nan_ranks": 0, "loss_rank_avg": 0.10119368880987167, "step": 3765, "valid_targets_mean": 2206.5, "valid_targets_min": 924 }, { "epoch": 6.110210696920584, "grad_norm": 1.0935738204994028, "learning_rate": 1.9437154969286577e-06, "loss": 0.1485, "loss_nan_ranks": 0, "loss_rank_avg": 0.12805625796318054, "step": 3770, "valid_targets_mean": 1756.6, "valid_targets_min": 534 }, { "epoch": 6.118314424635332, "grad_norm": 0.7094021347408048, "learning_rate": 1.9091066219334365e-06, "loss": 0.1246, "loss_nan_ranks": 0, "loss_rank_avg": 0.09319410473108292, "step": 3775, "valid_targets_mean": 3571.6, "valid_targets_min": 600 }, { "epoch": 6.126418152350081, "grad_norm": 0.8810616245799291, "learning_rate": 1.8747931874832325e-06, "loss": 0.13, "loss_nan_ranks": 0, "loss_rank_avg": 0.06927265226840973, "step": 3780, "valid_targets_mean": 3894.1, "valid_targets_min": 954 }, { "epoch": 6.13452188006483, "grad_norm": 0.7966465543664667, "learning_rate": 1.8407757539472548e-06, "loss": 0.1291, "loss_nan_ranks": 0, "loss_rank_avg": 0.1974271982908249, "step": 3785, "valid_targets_mean": 3178.2, "valid_targets_min": 450 }, { "epoch": 6.1426256077795784, "grad_norm": 0.5378695627769883, "learning_rate": 1.8070548768607744e-06, "loss": 0.1343, "loss_nan_ranks": 0, "loss_rank_avg": 0.10642120242118835, "step": 3790, "valid_targets_mean": 4619.8, "valid_targets_min": 850 }, { "epoch": 6.1507293354943275, "grad_norm": 1.0147575200870909, "learning_rate": 1.773631106915996e-06, "loss": 0.1432, "loss_nan_ranks": 0, "loss_rank_avg": 0.09471525251865387, "step": 3795, "valid_targets_mean": 2203.6, "valid_targets_min": 1137 }, { "epoch": 6.158833063209076, "grad_norm": 0.7484970018269975, "learning_rate": 1.740504989953129e-06, "loss": 0.1485, "loss_nan_ranks": 0, "loss_rank_avg": 0.11913225054740906, "step": 3800, "valid_targets_mean": 2594.4, "valid_targets_min": 907 }, { "epoch": 6.166936790923825, "grad_norm": 0.8241935721612473, "learning_rate": 1.707677066951432e-06, "loss": 0.1437, "loss_nan_ranks": 0, "loss_rank_avg": 0.21923650801181793, "step": 3805, "valid_targets_mean": 3371.1, "valid_targets_min": 644 }, { "epoch": 6.175040518638574, "grad_norm": 0.7791725998755106, "learning_rate": 1.6751478740203776e-06, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.14890174567699432, "step": 3810, "valid_targets_mean": 3476.3, "valid_targets_min": 800 }, { "epoch": 6.183144246353322, "grad_norm": 0.9316060672966924, "learning_rate": 1.6429179423909248e-06, "loss": 0.1066, "loss_nan_ranks": 0, "loss_rank_avg": 0.09502556920051575, "step": 3815, "valid_targets_mean": 1851.6, "valid_targets_min": 319 }, { "epoch": 6.191247974068071, "grad_norm": 0.6681121617992075, "learning_rate": 1.6109877984068089e-06, "loss": 0.1265, "loss_nan_ranks": 0, "loss_rank_avg": 0.10410622507333755, "step": 3820, "valid_targets_mean": 3242.0, "valid_targets_min": 645 }, { "epoch": 6.19935170178282, "grad_norm": 0.7966050962281183, "learning_rate": 1.5793579635159883e-06, "loss": 0.1652, "loss_nan_ranks": 0, "loss_rank_avg": 0.12778472900390625, "step": 3825, "valid_targets_mean": 2881.1, "valid_targets_min": 1181 }, { "epoch": 6.207455429497569, "grad_norm": 1.0811104704970367, "learning_rate": 1.5480289542620686e-06, "loss": 0.1234, "loss_nan_ranks": 0, "loss_rank_avg": 0.14305716753005981, "step": 3830, "valid_targets_mean": 1729.1, "valid_targets_min": 505 }, { "epoch": 6.215559157212318, "grad_norm": 0.8218570136420974, "learning_rate": 1.517001282275936e-06, "loss": 0.1119, "loss_nan_ranks": 0, "loss_rank_avg": 0.19680121541023254, "step": 3835, "valid_targets_mean": 3000.9, "valid_targets_min": 776 }, { "epoch": 6.223662884927067, "grad_norm": 1.3444875208456322, "learning_rate": 1.486275454267354e-06, "loss": 0.1256, "loss_nan_ranks": 0, "loss_rank_avg": 0.1285068839788437, "step": 3840, "valid_targets_mean": 2764.1, "valid_targets_min": 604 }, { "epoch": 6.231766612641815, "grad_norm": 0.8944598377852021, "learning_rate": 1.4558519720166975e-06, "loss": 0.1422, "loss_nan_ranks": 0, "loss_rank_avg": 0.16025900840759277, "step": 3845, "valid_targets_mean": 2910.8, "valid_targets_min": 906 }, { "epoch": 6.239870340356564, "grad_norm": 0.651296867676762, "learning_rate": 1.4257313323667798e-06, "loss": 0.1298, "loss_nan_ranks": 0, "loss_rank_avg": 0.08879795670509338, "step": 3850, "valid_targets_mean": 3112.5, "valid_targets_min": 400 }, { "epoch": 6.247974068071313, "grad_norm": 0.5999610443428787, "learning_rate": 1.3959140272146998e-06, "loss": 0.1602, "loss_nan_ranks": 0, "loss_rank_avg": 0.11679062247276306, "step": 3855, "valid_targets_mean": 3881.8, "valid_targets_min": 853 }, { "epoch": 6.256077795786061, "grad_norm": 0.9636049482804864, "learning_rate": 1.366400543503854e-06, "loss": 0.1349, "loss_nan_ranks": 0, "loss_rank_avg": 0.18295209109783173, "step": 3860, "valid_targets_mean": 2168.9, "valid_targets_min": 607 }, { "epoch": 6.2641815235008105, "grad_norm": 0.78397490864793, "learning_rate": 1.3371913632159506e-06, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.089485764503479, "step": 3865, "valid_targets_mean": 2398.6, "valid_targets_min": 871 }, { "epoch": 6.272285251215559, "grad_norm": 0.7820564283288564, "learning_rate": 1.3082869633631413e-06, "loss": 0.1407, "loss_nan_ranks": 0, "loss_rank_avg": 0.1150301992893219, "step": 3870, "valid_targets_mean": 2335.1, "valid_targets_min": 927 }, { "epoch": 6.280388978930308, "grad_norm": 1.027079175401604, "learning_rate": 1.2796878159802595e-06, "loss": 0.1642, "loss_nan_ranks": 0, "loss_rank_avg": 0.15304911136627197, "step": 3875, "valid_targets_mean": 2105.1, "valid_targets_min": 954 }, { "epoch": 6.288492706645057, "grad_norm": 0.6199836306967389, "learning_rate": 1.2513943881170754e-06, "loss": 0.137, "loss_nan_ranks": 0, "loss_rank_avg": 0.13365209102630615, "step": 3880, "valid_targets_mean": 4391.9, "valid_targets_min": 1005 }, { "epoch": 6.296596434359805, "grad_norm": 0.7727236218240091, "learning_rate": 1.2234071418306903e-06, "loss": 0.1351, "loss_nan_ranks": 0, "loss_rank_avg": 0.10507519543170929, "step": 3885, "valid_targets_mean": 2839.7, "valid_targets_min": 671 }, { "epoch": 6.304700162074554, "grad_norm": 0.8259960625219598, "learning_rate": 1.1957265341779855e-06, "loss": 0.1128, "loss_nan_ranks": 0, "loss_rank_avg": 0.06842942535877228, "step": 3890, "valid_targets_mean": 2111.8, "valid_targets_min": 509 }, { "epoch": 6.312803889789303, "grad_norm": 1.3006108319686243, "learning_rate": 1.1683530172081592e-06, "loss": 0.1423, "loss_nan_ranks": 0, "loss_rank_avg": 0.16923511028289795, "step": 3895, "valid_targets_mean": 2721.0, "valid_targets_min": 318 }, { "epoch": 6.3209076175040515, "grad_norm": 0.9212042910130562, "learning_rate": 1.1412870379553387e-06, "loss": 0.1455, "loss_nan_ranks": 0, "loss_rank_avg": 0.11085739731788635, "step": 3900, "valid_targets_mean": 2037.5, "valid_targets_min": 928 }, { "epoch": 6.329011345218801, "grad_norm": 0.7484624073581349, "learning_rate": 1.1145290384312846e-06, "loss": 0.1312, "loss_nan_ranks": 0, "loss_rank_avg": 0.10903692245483398, "step": 3905, "valid_targets_mean": 2927.1, "valid_targets_min": 662 }, { "epoch": 6.33711507293355, "grad_norm": 0.7780860184446243, "learning_rate": 1.0880794556181762e-06, "loss": 0.1465, "loss_nan_ranks": 0, "loss_rank_avg": 0.13929596543312073, "step": 3910, "valid_targets_mean": 3093.2, "valid_targets_min": 844 }, { "epoch": 6.345218800648298, "grad_norm": 0.857143392794329, "learning_rate": 1.0619387214614662e-06, "loss": 0.1038, "loss_nan_ranks": 0, "loss_rank_avg": 0.08489274978637695, "step": 3915, "valid_targets_mean": 2249.3, "valid_targets_min": 754 }, { "epoch": 6.353322528363047, "grad_norm": 0.7892887000224863, "learning_rate": 1.0361072628628354e-06, "loss": 0.1487, "loss_nan_ranks": 0, "loss_rank_avg": 0.1285485327243805, "step": 3920, "valid_targets_mean": 3397.4, "valid_targets_min": 759 }, { "epoch": 6.361426256077796, "grad_norm": 0.8963361991084041, "learning_rate": 1.0105855016732113e-06, "loss": 0.1328, "loss_nan_ranks": 0, "loss_rank_avg": 0.15654143691062927, "step": 3925, "valid_targets_mean": 2594.8, "valid_targets_min": 347 }, { "epoch": 6.369529983792544, "grad_norm": 0.9164724545517589, "learning_rate": 9.853738546858893e-07, "loss": 0.1476, "loss_nan_ranks": 0, "loss_rank_avg": 0.09162580966949463, "step": 3930, "valid_targets_mean": 2038.8, "valid_targets_min": 704 }, { "epoch": 6.377633711507293, "grad_norm": 0.6269508433513853, "learning_rate": 9.604727336297203e-07, "loss": 0.1511, "loss_nan_ranks": 0, "loss_rank_avg": 0.10261643677949905, "step": 3935, "valid_targets_mean": 3776.9, "valid_targets_min": 518 }, { "epoch": 6.3857374392220425, "grad_norm": 0.7267537967221318, "learning_rate": 9.358825451623832e-07, "loss": 0.1693, "loss_nan_ranks": 0, "loss_rank_avg": 0.16209650039672852, "step": 3940, "valid_targets_mean": 3149.4, "valid_targets_min": 484 }, { "epoch": 6.393841166936791, "grad_norm": 0.8819007736794746, "learning_rate": 9.116036908637582e-07, "loss": 0.1257, "loss_nan_ranks": 0, "loss_rank_avg": 0.13063153624534607, "step": 3945, "valid_targets_mean": 2710.8, "valid_targets_min": 918 }, { "epoch": 6.40194489465154, "grad_norm": 0.6745885226985678, "learning_rate": 8.876365672293441e-07, "loss": 0.091, "loss_nan_ranks": 0, "loss_rank_avg": 0.08468009531497955, "step": 3950, "valid_targets_mean": 3238.0, "valid_targets_min": 967 }, { "epoch": 6.410048622366288, "grad_norm": 0.8819209149898708, "learning_rate": 8.639815656638162e-07, "loss": 0.1247, "loss_nan_ranks": 0, "loss_rank_avg": 0.15380942821502686, "step": 3955, "valid_targets_mean": 2853.2, "valid_targets_min": 873 }, { "epoch": 6.418152350081037, "grad_norm": 0.8845074945045972, "learning_rate": 8.406390724745961e-07, "loss": 0.1411, "loss_nan_ranks": 0, "loss_rank_avg": 0.1663370132446289, "step": 3960, "valid_targets_mean": 2657.0, "valid_targets_min": 277 }, { "epoch": 6.426256077795786, "grad_norm": 0.7576749630747052, "learning_rate": 8.176094688655789e-07, "loss": 0.1185, "loss_nan_ranks": 0, "loss_rank_avg": 0.1374589502811432, "step": 3965, "valid_targets_mean": 3111.9, "valid_targets_min": 501 }, { "epoch": 6.434359805510534, "grad_norm": 0.8629454796074068, "learning_rate": 7.948931309308872e-07, "loss": 0.1229, "loss_nan_ranks": 0, "loss_rank_avg": 0.13856954872608185, "step": 3970, "valid_targets_mean": 3491.9, "valid_targets_min": 314 }, { "epoch": 6.4424635332252835, "grad_norm": 1.0231777837569396, "learning_rate": 7.724904296487246e-07, "loss": 0.1405, "loss_nan_ranks": 0, "loss_rank_avg": 0.11940930783748627, "step": 3975, "valid_targets_mean": 1845.0, "valid_targets_min": 870 }, { "epoch": 6.450567260940033, "grad_norm": 0.8238449493780197, "learning_rate": 7.504017308753386e-07, "loss": 0.1506, "loss_nan_ranks": 0, "loss_rank_avg": 0.18350258469581604, "step": 3980, "valid_targets_mean": 4485.2, "valid_targets_min": 217 }, { "epoch": 6.458670988654781, "grad_norm": 0.8464204623046769, "learning_rate": 7.286273953390278e-07, "loss": 0.2092, "loss_nan_ranks": 0, "loss_rank_avg": 0.258614182472229, "step": 3985, "valid_targets_mean": 3313.9, "valid_targets_min": 810 }, { "epoch": 6.46677471636953, "grad_norm": 0.8918238849564315, "learning_rate": 7.071677786342568e-07, "loss": 0.1237, "loss_nan_ranks": 0, "loss_rank_avg": 0.1031871885061264, "step": 3990, "valid_targets_mean": 2293.3, "valid_targets_min": 864 }, { "epoch": 6.474878444084279, "grad_norm": 0.8528535194867968, "learning_rate": 6.860232312158554e-07, "loss": 0.1423, "loss_nan_ranks": 0, "loss_rank_avg": 0.15150435268878937, "step": 3995, "valid_targets_mean": 2968.9, "valid_targets_min": 747 }, { "epoch": 6.482982171799027, "grad_norm": 0.7636360851041402, "learning_rate": 6.651940983932737e-07, "loss": 0.1478, "loss_nan_ranks": 0, "loss_rank_avg": 0.19292369484901428, "step": 4000, "valid_targets_mean": 3176.4, "valid_targets_min": 1041 }, { "epoch": 6.491085899513776, "grad_norm": 1.0126383046774314, "learning_rate": 6.44680720324975e-07, "loss": 0.156, "loss_nan_ranks": 0, "loss_rank_avg": 0.12578508257865906, "step": 4005, "valid_targets_mean": 1690.8, "valid_targets_min": 828 }, { "epoch": 6.4991896272285254, "grad_norm": 0.7355254192324758, "learning_rate": 6.244834320128501e-07, "loss": 0.1175, "loss_nan_ranks": 0, "loss_rank_avg": 0.10512825846672058, "step": 4010, "valid_targets_mean": 2727.1, "valid_targets_min": 835 }, { "epoch": 6.507293354943274, "grad_norm": 0.8817717410341444, "learning_rate": 6.0460256329677e-07, "loss": 0.1362, "loss_nan_ranks": 0, "loss_rank_avg": 0.0961059033870697, "step": 4015, "valid_targets_mean": 1961.8, "valid_targets_min": 851 }, { "epoch": 6.515397082658023, "grad_norm": 0.9530199455424444, "learning_rate": 5.850384388491814e-07, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.11027082055807114, "step": 4020, "valid_targets_mean": 2610.9, "valid_targets_min": 726 }, { "epoch": 6.523500810372772, "grad_norm": 1.1973587173189302, "learning_rate": 5.657913781698221e-07, "loss": 0.1467, "loss_nan_ranks": 0, "loss_rank_avg": 0.15702632069587708, "step": 4025, "valid_targets_mean": 2178.3, "valid_targets_min": 735 }, { "epoch": 6.53160453808752, "grad_norm": 0.9362106839228681, "learning_rate": 5.468616955804873e-07, "loss": 0.1169, "loss_nan_ranks": 0, "loss_rank_avg": 0.1587480902671814, "step": 4030, "valid_targets_mean": 2364.8, "valid_targets_min": 402 }, { "epoch": 6.539708265802269, "grad_norm": 0.8971025729416715, "learning_rate": 5.282497002198983e-07, "loss": 0.1034, "loss_nan_ranks": 0, "loss_rank_avg": 0.10483712702989578, "step": 4035, "valid_targets_mean": 2060.6, "valid_targets_min": 906 }, { "epoch": 6.547811993517017, "grad_norm": 2.337830249158839, "learning_rate": 5.099556960386686e-07, "loss": 0.119, "loss_nan_ranks": 0, "loss_rank_avg": 0.114591583609581, "step": 4040, "valid_targets_mean": 1819.8, "valid_targets_min": 589 }, { "epoch": 6.5559157212317665, "grad_norm": 0.9163559690136783, "learning_rate": 4.919799817943238e-07, "loss": 0.1064, "loss_nan_ranks": 0, "loss_rank_avg": 0.1364617496728897, "step": 4045, "valid_targets_mean": 2475.9, "valid_targets_min": 328 }, { "epoch": 6.564019448946516, "grad_norm": 1.0530486479633936, "learning_rate": 4.7432285104642703e-07, "loss": 0.1509, "loss_nan_ranks": 0, "loss_rank_avg": 0.1412011682987213, "step": 4050, "valid_targets_mean": 1812.3, "valid_targets_min": 495 }, { "epoch": 6.572123176661265, "grad_norm": 1.0490371458755887, "learning_rate": 4.569845921517968e-07, "loss": 0.1427, "loss_nan_ranks": 0, "loss_rank_avg": 0.1328582465648651, "step": 4055, "valid_targets_mean": 2563.8, "valid_targets_min": 968 }, { "epoch": 6.580226904376013, "grad_norm": 0.8827517020820953, "learning_rate": 4.399654882597726e-07, "loss": 0.1839, "loss_nan_ranks": 0, "loss_rank_avg": 0.09797355532646179, "step": 4060, "valid_targets_mean": 1908.7, "valid_targets_min": 734 }, { "epoch": 6.588330632090762, "grad_norm": 0.5796761962828608, "learning_rate": 4.232658173076232e-07, "loss": 0.1306, "loss_nan_ranks": 0, "loss_rank_avg": 0.08027474582195282, "step": 4065, "valid_targets_mean": 4144.1, "valid_targets_min": 872 }, { "epoch": 6.59643435980551, "grad_norm": 1.0909407783873655, "learning_rate": 4.068858520159724e-07, "loss": 0.1757, "loss_nan_ranks": 0, "loss_rank_avg": 0.11777451634407043, "step": 4070, "valid_targets_mean": 2117.9, "valid_targets_min": 292 }, { "epoch": 6.604538087520259, "grad_norm": 0.6833254490640153, "learning_rate": 3.9082585988437617e-07, "loss": 0.1341, "loss_nan_ranks": 0, "loss_rank_avg": 0.1639232188463211, "step": 4075, "valid_targets_mean": 3476.4, "valid_targets_min": 822 }, { "epoch": 6.612641815235008, "grad_norm": 0.9742355762056493, "learning_rate": 3.7508610318693684e-07, "loss": 0.1605, "loss_nan_ranks": 0, "loss_rank_avg": 0.1798877716064453, "step": 4080, "valid_targets_mean": 2434.2, "valid_targets_min": 782 }, { "epoch": 6.620745542949757, "grad_norm": 0.7781187724054021, "learning_rate": 3.596668389680247e-07, "loss": 0.1188, "loss_nan_ranks": 0, "loss_rank_avg": 0.09959834814071655, "step": 4085, "valid_targets_mean": 2723.8, "valid_targets_min": 529 }, { "epoch": 6.628849270664506, "grad_norm": 0.8466343867882937, "learning_rate": 3.445683190380833e-07, "loss": 0.1141, "loss_nan_ranks": 0, "loss_rank_avg": 0.08893650770187378, "step": 4090, "valid_targets_mean": 1926.0, "valid_targets_min": 568 }, { "epoch": 6.636952998379255, "grad_norm": 0.7908915562547193, "learning_rate": 3.297907899695019e-07, "loss": 0.1474, "loss_nan_ranks": 0, "loss_rank_avg": 0.09306427836418152, "step": 4095, "valid_targets_mean": 2579.3, "valid_targets_min": 939 }, { "epoch": 6.645056726094003, "grad_norm": 0.6540049138105144, "learning_rate": 3.1533449309262056e-07, "loss": 0.1347, "loss_nan_ranks": 0, "loss_rank_avg": 0.12161879241466522, "step": 4100, "valid_targets_mean": 3311.7, "valid_targets_min": 817 }, { "epoch": 6.653160453808752, "grad_norm": 0.8462221047782975, "learning_rate": 3.0119966449174474e-07, "loss": 0.1398, "loss_nan_ranks": 0, "loss_rank_avg": 0.0935630202293396, "step": 4105, "valid_targets_mean": 1882.8, "valid_targets_min": 840 }, { "epoch": 6.661264181523501, "grad_norm": 0.81490063291204, "learning_rate": 2.8738653500133494e-07, "loss": 0.1271, "loss_nan_ranks": 0, "loss_rank_avg": 0.10476881265640259, "step": 4110, "valid_targets_mean": 2528.9, "valid_targets_min": 984 }, { "epoch": 6.669367909238249, "grad_norm": 0.6366928478749754, "learning_rate": 2.738953302022096e-07, "loss": 0.1103, "loss_nan_ranks": 0, "loss_rank_avg": 0.08438228070735931, "step": 4115, "valid_targets_mean": 3672.2, "valid_targets_min": 930 }, { "epoch": 6.6774716369529985, "grad_norm": 0.5680139767437395, "learning_rate": 2.6072627041785925e-07, "loss": 0.1178, "loss_nan_ranks": 0, "loss_rank_avg": 0.05923807621002197, "step": 4120, "valid_targets_mean": 3334.2, "valid_targets_min": 913 }, { "epoch": 6.685575364667747, "grad_norm": 3.566418268679015, "learning_rate": 2.478795707108672e-07, "loss": 0.1124, "loss_nan_ranks": 0, "loss_rank_avg": 0.0984240397810936, "step": 4125, "valid_targets_mean": 3397.5, "valid_targets_min": 518 }, { "epoch": 6.693679092382496, "grad_norm": 0.8102395858284243, "learning_rate": 2.3535544087938345e-07, "loss": 0.15, "loss_nan_ranks": 0, "loss_rank_avg": 0.1713753342628479, "step": 4130, "valid_targets_mean": 2797.9, "valid_targets_min": 731 }, { "epoch": 6.701782820097245, "grad_norm": 0.9439721686588282, "learning_rate": 2.2315408545370288e-07, "loss": 0.1177, "loss_nan_ranks": 0, "loss_rank_avg": 0.15056179463863373, "step": 4135, "valid_targets_mean": 2218.5, "valid_targets_min": 624 }, { "epoch": 6.709886547811994, "grad_norm": 0.9719771412362007, "learning_rate": 2.1127570369292361e-07, "loss": 0.1266, "loss_nan_ranks": 0, "loss_rank_avg": 0.1161581426858902, "step": 4140, "valid_targets_mean": 2372.7, "valid_targets_min": 560 }, { "epoch": 6.717990275526742, "grad_norm": 0.7885505138738974, "learning_rate": 1.9972048958168954e-07, "loss": 0.1297, "loss_nan_ranks": 0, "loss_rank_avg": 0.08716851472854614, "step": 4145, "valid_targets_mean": 2679.0, "valid_targets_min": 727 }, { "epoch": 6.726094003241491, "grad_norm": 0.7564261208584763, "learning_rate": 1.8848863182703513e-07, "loss": 0.1293, "loss_nan_ranks": 0, "loss_rank_avg": 0.14512531459331512, "step": 4150, "valid_targets_mean": 3178.8, "valid_targets_min": 836 }, { "epoch": 6.7341977309562395, "grad_norm": 0.8230943188429811, "learning_rate": 1.7758031385528784e-07, "loss": 0.1683, "loss_nan_ranks": 0, "loss_rank_avg": 0.19820144772529602, "step": 4155, "valid_targets_mean": 2705.9, "valid_targets_min": 904 }, { "epoch": 6.742301458670989, "grad_norm": 0.7304895753350193, "learning_rate": 1.6699571380908385e-07, "loss": 0.1375, "loss_nan_ranks": 0, "loss_rank_avg": 0.1148165911436081, "step": 4160, "valid_targets_mean": 2799.2, "valid_targets_min": 740 }, { "epoch": 6.750405186385738, "grad_norm": 0.8783884446179141, "learning_rate": 1.5673500454445046e-07, "loss": 0.1137, "loss_nan_ranks": 0, "loss_rank_avg": 0.1160724088549614, "step": 4165, "valid_targets_mean": 1911.4, "valid_targets_min": 757 }, { "epoch": 6.758508914100486, "grad_norm": 0.8452843386698703, "learning_rate": 1.4679835362799266e-07, "loss": 0.1405, "loss_nan_ranks": 0, "loss_rank_avg": 0.17844310402870178, "step": 4170, "valid_targets_mean": 2903.6, "valid_targets_min": 717 }, { "epoch": 6.766612641815235, "grad_norm": 0.9641957278215031, "learning_rate": 1.3718592333414881e-07, "loss": 0.1378, "loss_nan_ranks": 0, "loss_rank_avg": 0.1178508773446083, "step": 4175, "valid_targets_mean": 1679.4, "valid_targets_min": 456 }, { "epoch": 6.774716369529984, "grad_norm": 0.6732633682506574, "learning_rate": 1.2789787064253934e-07, "loss": 0.1513, "loss_nan_ranks": 0, "loss_rank_avg": 0.12225890159606934, "step": 4180, "valid_targets_mean": 3461.0, "valid_targets_min": 695 }, { "epoch": 6.782820097244732, "grad_norm": 0.9548675664452392, "learning_rate": 1.1893434723541542e-07, "loss": 0.1272, "loss_nan_ranks": 0, "loss_rank_avg": 0.12099964916706085, "step": 4185, "valid_targets_mean": 1765.4, "valid_targets_min": 348 }, { "epoch": 6.790923824959481, "grad_norm": 0.7229822657096528, "learning_rate": 1.1029549949516549e-07, "loss": 0.1312, "loss_nan_ranks": 0, "loss_rank_avg": 0.16705356538295746, "step": 4190, "valid_targets_mean": 4125.2, "valid_targets_min": 562 }, { "epoch": 6.7990275526742305, "grad_norm": 1.0053755294682665, "learning_rate": 1.0198146850193935e-07, "loss": 0.1376, "loss_nan_ranks": 0, "loss_rank_avg": 0.10085690766572952, "step": 4195, "valid_targets_mean": 1957.5, "valid_targets_min": 464 }, { "epoch": 6.807131280388979, "grad_norm": 1.335653057078746, "learning_rate": 9.399239003132999e-08, "loss": 0.138, "loss_nan_ranks": 0, "loss_rank_avg": 0.09673996269702911, "step": 4200, "valid_targets_mean": 1523.4, "valid_targets_min": 705 }, { "epoch": 6.815235008103728, "grad_norm": 0.8800015171398834, "learning_rate": 8.632839455216869e-08, "loss": 0.1388, "loss_nan_ranks": 0, "loss_rank_avg": 0.11644886434078217, "step": 4205, "valid_targets_mean": 2234.9, "valid_targets_min": 650 }, { "epoch": 6.823338735818476, "grad_norm": 0.782216107013055, "learning_rate": 7.89896072243912e-08, "loss": 0.1221, "loss_nan_ranks": 0, "loss_rank_avg": 0.10838295519351959, "step": 4210, "valid_targets_mean": 2606.8, "valid_targets_min": 1066 }, { "epoch": 6.831442463533225, "grad_norm": 0.7331468581917359, "learning_rate": 7.197614789698604e-08, "loss": 0.1571, "loss_nan_ranks": 0, "loss_rank_avg": 0.27159422636032104, "step": 4215, "valid_targets_mean": 4613.2, "valid_targets_min": 1164 }, { "epoch": 6.839546191247974, "grad_norm": 0.7847565716440916, "learning_rate": 6.528813110604714e-08, "loss": 0.1195, "loss_nan_ranks": 0, "loss_rank_avg": 0.10585910081863403, "step": 4220, "valid_targets_mean": 2765.0, "valid_targets_min": 632 }, { "epoch": 6.847649918962723, "grad_norm": 0.8253246012683277, "learning_rate": 5.8925666072899845e-08, "loss": 0.1249, "loss_nan_ranks": 0, "loss_rank_avg": 0.14212317764759064, "step": 4225, "valid_targets_mean": 2604.4, "valid_targets_min": 583 }, { "epoch": 6.855753646677472, "grad_norm": 0.798983689706256, "learning_rate": 5.288885670231336e-08, "loss": 0.1315, "loss_nan_ranks": 0, "loss_rank_avg": 0.10902281105518341, "step": 4230, "valid_targets_mean": 2613.6, "valid_targets_min": 461 }, { "epoch": 6.863857374392221, "grad_norm": 0.8467915925619014, "learning_rate": 4.717780158080887e-08, "loss": 0.1119, "loss_nan_ranks": 0, "loss_rank_avg": 0.1464867889881134, "step": 4235, "valid_targets_mean": 2088.5, "valid_targets_min": 522 }, { "epoch": 6.871961102106969, "grad_norm": 1.0029490169977413, "learning_rate": 4.1792593975049644e-08, "loss": 0.1264, "loss_nan_ranks": 0, "loss_rank_avg": 0.12026522308588028, "step": 4240, "valid_targets_mean": 1802.7, "valid_targets_min": 819 }, { "epoch": 6.880064829821718, "grad_norm": 0.9011238391462046, "learning_rate": 3.6733321830315636e-08, "loss": 0.1337, "loss_nan_ranks": 0, "loss_rank_avg": 0.11811887472867966, "step": 4245, "valid_targets_mean": 2323.1, "valid_targets_min": 949 }, { "epoch": 6.888168557536467, "grad_norm": 0.7165823854167281, "learning_rate": 3.200006776906461e-08, "loss": 0.1129, "loss_nan_ranks": 0, "loss_rank_avg": 0.09492816030979156, "step": 4250, "valid_targets_mean": 2960.4, "valid_targets_min": 814 }, { "epoch": 6.896272285251215, "grad_norm": 0.9450518017052805, "learning_rate": 2.7592909089593224e-08, "loss": 0.1455, "loss_nan_ranks": 0, "loss_rank_avg": 0.14789974689483643, "step": 4255, "valid_targets_mean": 2218.0, "valid_targets_min": 761 }, { "epoch": 6.904376012965964, "grad_norm": 0.7311474778057845, "learning_rate": 2.351191776475581e-08, "loss": 0.1319, "loss_nan_ranks": 0, "loss_rank_avg": 0.1463954895734787, "step": 4260, "valid_targets_mean": 3855.9, "valid_targets_min": 1393 }, { "epoch": 6.9124797406807135, "grad_norm": 0.6301982317715115, "learning_rate": 1.9757160440814217e-08, "loss": 0.1343, "loss_nan_ranks": 0, "loss_rank_avg": 0.10000479966402054, "step": 4265, "valid_targets_mean": 3855.6, "valid_targets_min": 809 }, { "epoch": 6.920583468395462, "grad_norm": 0.9798344906644698, "learning_rate": 1.6328698436327562e-08, "loss": 0.1597, "loss_nan_ranks": 0, "loss_rank_avg": 0.16356664896011353, "step": 4270, "valid_targets_mean": 2240.9, "valid_targets_min": 622 }, { "epoch": 6.928687196110211, "grad_norm": 0.8892538533790851, "learning_rate": 1.3226587741159702e-08, "loss": 0.1134, "loss_nan_ranks": 0, "loss_rank_avg": 0.13213740289211273, "step": 4275, "valid_targets_mean": 2755.2, "valid_targets_min": 736 }, { "epoch": 6.93679092382496, "grad_norm": 0.8637275559260358, "learning_rate": 1.0450879015566629e-08, "loss": 0.1239, "loss_nan_ranks": 0, "loss_rank_avg": 0.10389816761016846, "step": 4280, "valid_targets_mean": 2268.2, "valid_targets_min": 302 }, { "epoch": 6.944894651539708, "grad_norm": 0.7857182787493622, "learning_rate": 8.001617589368238e-09, "loss": 0.1201, "loss_nan_ranks": 0, "loss_rank_avg": 0.09846210479736328, "step": 4285, "valid_targets_mean": 2556.7, "valid_targets_min": 883 }, { "epoch": 6.952998379254457, "grad_norm": 0.5942319504605537, "learning_rate": 5.878843461200046e-09, "loss": 0.122, "loss_nan_ranks": 0, "loss_rank_avg": 0.08767960220575333, "step": 4290, "valid_targets_mean": 4519.6, "valid_targets_min": 783 }, { "epoch": 6.961102106969205, "grad_norm": 0.8250059679447841, "learning_rate": 4.082591297873695e-09, "loss": 0.155, "loss_nan_ranks": 0, "loss_rank_avg": 0.17609858512878418, "step": 4295, "valid_targets_mean": 3104.8, "valid_targets_min": 398 }, { "epoch": 6.9692058346839545, "grad_norm": 0.7499567331158492, "learning_rate": 2.6128904338018624e-09, "loss": 0.1151, "loss_nan_ranks": 0, "loss_rank_avg": 0.08152391016483307, "step": 4300, "valid_targets_mean": 2886.6, "valid_targets_min": 342 }, { "epoch": 6.977309562398704, "grad_norm": 0.9718691223278781, "learning_rate": 1.4697648705186417e-09, "loss": 0.1302, "loss_nan_ranks": 0, "loss_rank_avg": 0.15906545519828796, "step": 4305, "valid_targets_mean": 2148.2, "valid_targets_min": 565 }, { "epoch": 6.985413290113452, "grad_norm": 0.7283394841772546, "learning_rate": 6.532332762931859e-10, "loss": 0.0901, "loss_nan_ranks": 0, "loss_rank_avg": 0.12135720252990723, "step": 4310, "valid_targets_mean": 3223.2, "valid_targets_min": 741 }, { "epoch": 6.993517017828201, "grad_norm": 0.7328657780903466, "learning_rate": 1.6330898581884414e-10, "loss": 0.1321, "loss_nan_ranks": 0, "loss_rank_avg": 0.09660885483026505, "step": 4315, "valid_targets_mean": 2950.4, "valid_targets_min": 780 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.20906896889209747, "step": 4319, "total_flos": 702151473364992.0, "train_loss": 0.11156423039722288, "train_runtime": 12711.7053, "train_samples_per_second": 5.432, "train_steps_per_second": 0.34, "valid_targets_mean": 3750.0, "valid_targets_min": 750 } ], "logging_steps": 5, "max_steps": 4319, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 1500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 702151473364992.0, "train_batch_size": 1, "trial_name": null, "trial_params": null }