{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 7161, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.004887585532746823, "grad_norm": 12.44376256794233, "learning_rate": 2.2315202231520225e-07, "loss": 0.775, "loss_nan_ranks": 0, "loss_rank_avg": 0.7660703063011169, "step": 5, "valid_targets_mean": 2759.7, "valid_targets_min": 789 }, { "epoch": 0.009775171065493646, "grad_norm": 13.083127751453706, "learning_rate": 5.020920502092051e-07, "loss": 0.7585, "loss_nan_ranks": 0, "loss_rank_avg": 0.7838925123214722, "step": 10, "valid_targets_mean": 2175.1, "valid_targets_min": 647 }, { "epoch": 0.01466275659824047, "grad_norm": 10.557856263973706, "learning_rate": 7.810320781032078e-07, "loss": 0.7713, "loss_nan_ranks": 0, "loss_rank_avg": 0.7736507654190063, "step": 15, "valid_targets_mean": 2148.8, "valid_targets_min": 803 }, { "epoch": 0.019550342130987292, "grad_norm": 9.4146088353884, "learning_rate": 1.0599721059972108e-06, "loss": 0.7562, "loss_nan_ranks": 0, "loss_rank_avg": 0.7820156812667847, "step": 20, "valid_targets_mean": 2958.0, "valid_targets_min": 945 }, { "epoch": 0.024437927663734114, "grad_norm": 8.510426871763977, "learning_rate": 1.3389121338912134e-06, "loss": 0.7276, "loss_nan_ranks": 0, "loss_rank_avg": 0.7074830532073975, "step": 25, "valid_targets_mean": 2418.9, "valid_targets_min": 734 }, { "epoch": 0.02932551319648094, "grad_norm": 5.967061937258563, "learning_rate": 1.6178521617852163e-06, "loss": 0.6946, "loss_nan_ranks": 0, "loss_rank_avg": 0.7003393769264221, "step": 30, "valid_targets_mean": 2274.1, "valid_targets_min": 724 }, { "epoch": 0.03421309872922776, "grad_norm": 5.128418930959132, "learning_rate": 1.8967921896792191e-06, "loss": 0.6951, "loss_nan_ranks": 0, "loss_rank_avg": 0.6412136554718018, "step": 35, "valid_targets_mean": 2286.8, "valid_targets_min": 1077 }, { "epoch": 0.039100684261974585, "grad_norm": 3.685105984706391, "learning_rate": 2.175732217573222e-06, "loss": 0.622, "loss_nan_ranks": 0, "loss_rank_avg": 0.6155872344970703, "step": 40, "valid_targets_mean": 2433.9, "valid_targets_min": 635 }, { "epoch": 0.04398826979472141, "grad_norm": 3.552082634936528, "learning_rate": 2.4546722454672246e-06, "loss": 0.6131, "loss_nan_ranks": 0, "loss_rank_avg": 0.622800350189209, "step": 45, "valid_targets_mean": 2232.9, "valid_targets_min": 914 }, { "epoch": 0.04887585532746823, "grad_norm": 2.6301835879043747, "learning_rate": 2.7336122733612273e-06, "loss": 0.5903, "loss_nan_ranks": 0, "loss_rank_avg": 0.57831209897995, "step": 50, "valid_targets_mean": 2736.5, "valid_targets_min": 1194 }, { "epoch": 0.053763440860215055, "grad_norm": 1.939146654771752, "learning_rate": 3.0125523012552303e-06, "loss": 0.566, "loss_nan_ranks": 0, "loss_rank_avg": 0.5587443113327026, "step": 55, "valid_targets_mean": 2471.7, "valid_targets_min": 753 }, { "epoch": 0.05865102639296188, "grad_norm": 1.3923623066674402, "learning_rate": 3.2914923291492334e-06, "loss": 0.5091, "loss_nan_ranks": 0, "loss_rank_avg": 0.5293725728988647, "step": 60, "valid_targets_mean": 3486.3, "valid_targets_min": 1205 }, { "epoch": 0.0635386119257087, "grad_norm": 1.2847016539983112, "learning_rate": 3.570432357043236e-06, "loss": 0.5174, "loss_nan_ranks": 0, "loss_rank_avg": 0.48333871364593506, "step": 65, "valid_targets_mean": 2133.9, "valid_targets_min": 639 }, { "epoch": 0.06842619745845552, "grad_norm": 1.1703945643061187, "learning_rate": 3.849372384937239e-06, "loss": 0.4767, "loss_nan_ranks": 0, "loss_rank_avg": 0.47202277183532715, "step": 70, "valid_targets_mean": 2432.9, "valid_targets_min": 820 }, { "epoch": 0.07331378299120235, "grad_norm": 1.1061255401631531, "learning_rate": 4.128312412831242e-06, "loss": 0.5054, "loss_nan_ranks": 0, "loss_rank_avg": 0.5339841842651367, "step": 75, "valid_targets_mean": 2277.9, "valid_targets_min": 741 }, { "epoch": 0.07820136852394917, "grad_norm": 1.1039585723531486, "learning_rate": 4.407252440725244e-06, "loss": 0.4741, "loss_nan_ranks": 0, "loss_rank_avg": 0.49983298778533936, "step": 80, "valid_targets_mean": 2021.4, "valid_targets_min": 855 }, { "epoch": 0.08308895405669599, "grad_norm": 0.9865369304789178, "learning_rate": 4.6861924686192475e-06, "loss": 0.4612, "loss_nan_ranks": 0, "loss_rank_avg": 0.42603811621665955, "step": 85, "valid_targets_mean": 2219.6, "valid_targets_min": 734 }, { "epoch": 0.08797653958944282, "grad_norm": 1.071853710354841, "learning_rate": 4.9651324965132506e-06, "loss": 0.4694, "loss_nan_ranks": 0, "loss_rank_avg": 0.45195892453193665, "step": 90, "valid_targets_mean": 2383.9, "valid_targets_min": 1015 }, { "epoch": 0.09286412512218964, "grad_norm": 0.9176728913117824, "learning_rate": 5.244072524407254e-06, "loss": 0.4449, "loss_nan_ranks": 0, "loss_rank_avg": 0.42296427488327026, "step": 95, "valid_targets_mean": 2121.6, "valid_targets_min": 967 }, { "epoch": 0.09775171065493646, "grad_norm": 0.9296613279197797, "learning_rate": 5.523012552301256e-06, "loss": 0.4326, "loss_nan_ranks": 0, "loss_rank_avg": 0.4197250008583069, "step": 100, "valid_targets_mean": 2173.2, "valid_targets_min": 895 }, { "epoch": 0.10263929618768329, "grad_norm": 0.9405388278402095, "learning_rate": 5.801952580195258e-06, "loss": 0.4436, "loss_nan_ranks": 0, "loss_rank_avg": 0.4366050362586975, "step": 105, "valid_targets_mean": 2097.8, "valid_targets_min": 816 }, { "epoch": 0.10752688172043011, "grad_norm": 0.7924545346293838, "learning_rate": 6.080892608089262e-06, "loss": 0.4115, "loss_nan_ranks": 0, "loss_rank_avg": 0.4147997796535492, "step": 110, "valid_targets_mean": 2730.9, "valid_targets_min": 955 }, { "epoch": 0.11241446725317693, "grad_norm": 0.789932617535872, "learning_rate": 6.359832635983264e-06, "loss": 0.4256, "loss_nan_ranks": 0, "loss_rank_avg": 0.4059978723526001, "step": 115, "valid_targets_mean": 2887.8, "valid_targets_min": 1001 }, { "epoch": 0.11730205278592376, "grad_norm": 0.8095583193686153, "learning_rate": 6.6387726638772664e-06, "loss": 0.4145, "loss_nan_ranks": 0, "loss_rank_avg": 0.4052962064743042, "step": 120, "valid_targets_mean": 2514.8, "valid_targets_min": 847 }, { "epoch": 0.12218963831867058, "grad_norm": 0.7949836362164371, "learning_rate": 6.91771269177127e-06, "loss": 0.4196, "loss_nan_ranks": 0, "loss_rank_avg": 0.4143103063106537, "step": 125, "valid_targets_mean": 2648.2, "valid_targets_min": 826 }, { "epoch": 0.1270772238514174, "grad_norm": 0.799726720099262, "learning_rate": 7.1966527196652726e-06, "loss": 0.4221, "loss_nan_ranks": 0, "loss_rank_avg": 0.4228057265281677, "step": 130, "valid_targets_mean": 2594.8, "valid_targets_min": 698 }, { "epoch": 0.13196480938416422, "grad_norm": 0.9617534138420096, "learning_rate": 7.475592747559275e-06, "loss": 0.4009, "loss_nan_ranks": 0, "loss_rank_avg": 0.42820626497268677, "step": 135, "valid_targets_mean": 2055.6, "valid_targets_min": 632 }, { "epoch": 0.13685239491691104, "grad_norm": 0.8348186060833679, "learning_rate": 7.754532775453279e-06, "loss": 0.4162, "loss_nan_ranks": 0, "loss_rank_avg": 0.4349338114261627, "step": 140, "valid_targets_mean": 2389.0, "valid_targets_min": 1020 }, { "epoch": 0.14173998044965788, "grad_norm": 0.8157340380976558, "learning_rate": 8.033472803347281e-06, "loss": 0.4207, "loss_nan_ranks": 0, "loss_rank_avg": 0.42874521017074585, "step": 145, "valid_targets_mean": 2644.0, "valid_targets_min": 684 }, { "epoch": 0.1466275659824047, "grad_norm": 0.8180117684614197, "learning_rate": 8.312412831241283e-06, "loss": 0.3971, "loss_nan_ranks": 0, "loss_rank_avg": 0.4317898452281952, "step": 150, "valid_targets_mean": 2665.6, "valid_targets_min": 869 }, { "epoch": 0.15151515151515152, "grad_norm": 0.8885682855346618, "learning_rate": 8.591352859135287e-06, "loss": 0.3854, "loss_nan_ranks": 0, "loss_rank_avg": 0.4081709384918213, "step": 155, "valid_targets_mean": 2359.7, "valid_targets_min": 872 }, { "epoch": 0.15640273704789834, "grad_norm": 0.8080583509361516, "learning_rate": 8.87029288702929e-06, "loss": 0.3982, "loss_nan_ranks": 0, "loss_rank_avg": 0.410560667514801, "step": 160, "valid_targets_mean": 2443.3, "valid_targets_min": 650 }, { "epoch": 0.16129032258064516, "grad_norm": 1.0075730249123667, "learning_rate": 9.149232914923292e-06, "loss": 0.3827, "loss_nan_ranks": 0, "loss_rank_avg": 0.3756175637245178, "step": 165, "valid_targets_mean": 2445.9, "valid_targets_min": 729 }, { "epoch": 0.16617790811339198, "grad_norm": 0.7988923971464764, "learning_rate": 9.428172942817295e-06, "loss": 0.3902, "loss_nan_ranks": 0, "loss_rank_avg": 0.3763277530670166, "step": 170, "valid_targets_mean": 2335.2, "valid_targets_min": 754 }, { "epoch": 0.1710654936461388, "grad_norm": 0.8801234974461333, "learning_rate": 9.707112970711298e-06, "loss": 0.4039, "loss_nan_ranks": 0, "loss_rank_avg": 0.4362441897392273, "step": 175, "valid_targets_mean": 2604.2, "valid_targets_min": 722 }, { "epoch": 0.17595307917888564, "grad_norm": 1.0573428481191474, "learning_rate": 9.986052998605302e-06, "loss": 0.3815, "loss_nan_ranks": 0, "loss_rank_avg": 0.3826301395893097, "step": 180, "valid_targets_mean": 1948.0, "valid_targets_min": 718 }, { "epoch": 0.18084066471163246, "grad_norm": 0.8244047729823328, "learning_rate": 1.0264993026499304e-05, "loss": 0.3677, "loss_nan_ranks": 0, "loss_rank_avg": 0.3717021346092224, "step": 185, "valid_targets_mean": 2318.2, "valid_targets_min": 868 }, { "epoch": 0.18572825024437928, "grad_norm": 0.8733754607654697, "learning_rate": 1.0543933054393308e-05, "loss": 0.3875, "loss_nan_ranks": 0, "loss_rank_avg": 0.41147416830062866, "step": 190, "valid_targets_mean": 2373.2, "valid_targets_min": 855 }, { "epoch": 0.1906158357771261, "grad_norm": 0.8971397713788575, "learning_rate": 1.0822873082287308e-05, "loss": 0.399, "loss_nan_ranks": 0, "loss_rank_avg": 0.4053829312324524, "step": 195, "valid_targets_mean": 2233.9, "valid_targets_min": 731 }, { "epoch": 0.19550342130987292, "grad_norm": 1.0257634454527333, "learning_rate": 1.1101813110181312e-05, "loss": 0.3825, "loss_nan_ranks": 0, "loss_rank_avg": 0.34646230936050415, "step": 200, "valid_targets_mean": 1661.8, "valid_targets_min": 652 }, { "epoch": 0.20039100684261973, "grad_norm": 0.8750695251551033, "learning_rate": 1.1380753138075316e-05, "loss": 0.3884, "loss_nan_ranks": 0, "loss_rank_avg": 0.39979293942451477, "step": 205, "valid_targets_mean": 2502.0, "valid_targets_min": 749 }, { "epoch": 0.20527859237536658, "grad_norm": 0.8985663536980157, "learning_rate": 1.1659693165969317e-05, "loss": 0.3715, "loss_nan_ranks": 0, "loss_rank_avg": 0.3521466553211212, "step": 210, "valid_targets_mean": 2193.1, "valid_targets_min": 1185 }, { "epoch": 0.2101661779081134, "grad_norm": 0.8690020156723633, "learning_rate": 1.193863319386332e-05, "loss": 0.3906, "loss_nan_ranks": 0, "loss_rank_avg": 0.39606279134750366, "step": 215, "valid_targets_mean": 2162.5, "valid_targets_min": 791 }, { "epoch": 0.21505376344086022, "grad_norm": 0.7851411691827029, "learning_rate": 1.2217573221757324e-05, "loss": 0.3534, "loss_nan_ranks": 0, "loss_rank_avg": 0.3474773168563843, "step": 220, "valid_targets_mean": 2564.4, "valid_targets_min": 754 }, { "epoch": 0.21994134897360704, "grad_norm": 0.8708152091406828, "learning_rate": 1.2496513249651325e-05, "loss": 0.3652, "loss_nan_ranks": 0, "loss_rank_avg": 0.3648437261581421, "step": 225, "valid_targets_mean": 2014.6, "valid_targets_min": 544 }, { "epoch": 0.22482893450635386, "grad_norm": 0.8997257441861602, "learning_rate": 1.2775453277545329e-05, "loss": 0.3817, "loss_nan_ranks": 0, "loss_rank_avg": 0.3548926115036011, "step": 230, "valid_targets_mean": 1954.0, "valid_targets_min": 627 }, { "epoch": 0.22971652003910067, "grad_norm": 0.7622734239422039, "learning_rate": 1.3054393305439333e-05, "loss": 0.3576, "loss_nan_ranks": 0, "loss_rank_avg": 0.3857002854347229, "step": 235, "valid_targets_mean": 2903.6, "valid_targets_min": 964 }, { "epoch": 0.23460410557184752, "grad_norm": 0.8137819570309708, "learning_rate": 1.3333333333333333e-05, "loss": 0.367, "loss_nan_ranks": 0, "loss_rank_avg": 0.3650803864002228, "step": 240, "valid_targets_mean": 2334.2, "valid_targets_min": 746 }, { "epoch": 0.23949169110459434, "grad_norm": 0.9062648393789453, "learning_rate": 1.3612273361227337e-05, "loss": 0.3859, "loss_nan_ranks": 0, "loss_rank_avg": 0.38647863268852234, "step": 245, "valid_targets_mean": 2119.2, "valid_targets_min": 933 }, { "epoch": 0.24437927663734116, "grad_norm": 0.8593102670864973, "learning_rate": 1.3891213389121341e-05, "loss": 0.3547, "loss_nan_ranks": 0, "loss_rank_avg": 0.32468748092651367, "step": 250, "valid_targets_mean": 2219.7, "valid_targets_min": 807 }, { "epoch": 0.24926686217008798, "grad_norm": 1.6459054094057368, "learning_rate": 1.4170153417015342e-05, "loss": 0.3763, "loss_nan_ranks": 0, "loss_rank_avg": 0.3920065760612488, "step": 255, "valid_targets_mean": 3263.6, "valid_targets_min": 886 }, { "epoch": 0.2541544477028348, "grad_norm": 0.8244627390914492, "learning_rate": 1.4449093444909346e-05, "loss": 0.3478, "loss_nan_ranks": 0, "loss_rank_avg": 0.3641440272331238, "step": 260, "valid_targets_mean": 2413.2, "valid_targets_min": 819 }, { "epoch": 0.2590420332355816, "grad_norm": 0.947648955580425, "learning_rate": 1.472803347280335e-05, "loss": 0.3644, "loss_nan_ranks": 0, "loss_rank_avg": 0.3710935413837433, "step": 265, "valid_targets_mean": 1834.6, "valid_targets_min": 668 }, { "epoch": 0.26392961876832843, "grad_norm": 0.7479773006623937, "learning_rate": 1.500697350069735e-05, "loss": 0.3868, "loss_nan_ranks": 0, "loss_rank_avg": 0.3943009376525879, "step": 270, "valid_targets_mean": 2967.0, "valid_targets_min": 712 }, { "epoch": 0.26881720430107525, "grad_norm": 0.6850159478077383, "learning_rate": 1.5285913528591356e-05, "loss": 0.357, "loss_nan_ranks": 0, "loss_rank_avg": 0.33576327562332153, "step": 275, "valid_targets_mean": 3043.9, "valid_targets_min": 648 }, { "epoch": 0.27370478983382207, "grad_norm": 0.8054999780008923, "learning_rate": 1.5564853556485358e-05, "loss": 0.3544, "loss_nan_ranks": 0, "loss_rank_avg": 0.36960098147392273, "step": 280, "valid_targets_mean": 2678.3, "valid_targets_min": 1027 }, { "epoch": 0.2785923753665689, "grad_norm": 0.9675054347484953, "learning_rate": 1.584379358437936e-05, "loss": 0.378, "loss_nan_ranks": 0, "loss_rank_avg": 0.3982788324356079, "step": 285, "valid_targets_mean": 1821.8, "valid_targets_min": 701 }, { "epoch": 0.28347996089931576, "grad_norm": 0.9860609488043531, "learning_rate": 1.6122733612273362e-05, "loss": 0.3773, "loss_nan_ranks": 0, "loss_rank_avg": 0.3843904137611389, "step": 290, "valid_targets_mean": 2513.7, "valid_targets_min": 881 }, { "epoch": 0.2883675464320626, "grad_norm": 0.991847663374839, "learning_rate": 1.6401673640167365e-05, "loss": 0.379, "loss_nan_ranks": 0, "loss_rank_avg": 0.4282916784286499, "step": 295, "valid_targets_mean": 2874.1, "valid_targets_min": 1072 }, { "epoch": 0.2932551319648094, "grad_norm": 0.8307727140975414, "learning_rate": 1.6680613668061367e-05, "loss": 0.3548, "loss_nan_ranks": 0, "loss_rank_avg": 0.34740254282951355, "step": 300, "valid_targets_mean": 2016.8, "valid_targets_min": 681 }, { "epoch": 0.2981427174975562, "grad_norm": 0.7143528489591171, "learning_rate": 1.6959553695955372e-05, "loss": 0.3636, "loss_nan_ranks": 0, "loss_rank_avg": 0.359591007232666, "step": 305, "valid_targets_mean": 3070.4, "valid_targets_min": 774 }, { "epoch": 0.30303030303030304, "grad_norm": 0.9089966300203021, "learning_rate": 1.7238493723849375e-05, "loss": 0.3498, "loss_nan_ranks": 0, "loss_rank_avg": 0.33375781774520874, "step": 310, "valid_targets_mean": 1869.1, "valid_targets_min": 780 }, { "epoch": 0.30791788856304986, "grad_norm": 0.8634809970221224, "learning_rate": 1.7517433751743377e-05, "loss": 0.3555, "loss_nan_ranks": 0, "loss_rank_avg": 0.37010622024536133, "step": 315, "valid_targets_mean": 2224.5, "valid_targets_min": 754 }, { "epoch": 0.3128054740957967, "grad_norm": 0.8540663264632482, "learning_rate": 1.779637377963738e-05, "loss": 0.3515, "loss_nan_ranks": 0, "loss_rank_avg": 0.3211752772331238, "step": 320, "valid_targets_mean": 2225.6, "valid_targets_min": 777 }, { "epoch": 0.3176930596285435, "grad_norm": 0.8804814214418613, "learning_rate": 1.807531380753138e-05, "loss": 0.3376, "loss_nan_ranks": 0, "loss_rank_avg": 0.35791587829589844, "step": 325, "valid_targets_mean": 2065.7, "valid_targets_min": 548 }, { "epoch": 0.3225806451612903, "grad_norm": 0.7640563487552252, "learning_rate": 1.8354253835425383e-05, "loss": 0.3332, "loss_nan_ranks": 0, "loss_rank_avg": 0.3520016074180603, "step": 330, "valid_targets_mean": 2701.5, "valid_targets_min": 944 }, { "epoch": 0.32746823069403713, "grad_norm": 0.7296882324617866, "learning_rate": 1.863319386331939e-05, "loss": 0.3399, "loss_nan_ranks": 0, "loss_rank_avg": 0.31554561853408813, "step": 335, "valid_targets_mean": 3010.9, "valid_targets_min": 1211 }, { "epoch": 0.33235581622678395, "grad_norm": 0.7271443111223936, "learning_rate": 1.891213389121339e-05, "loss": 0.3478, "loss_nan_ranks": 0, "loss_rank_avg": 0.3308175802230835, "step": 340, "valid_targets_mean": 2877.0, "valid_targets_min": 1375 }, { "epoch": 0.33724340175953077, "grad_norm": 0.8360036681979609, "learning_rate": 1.9191073919107393e-05, "loss": 0.3671, "loss_nan_ranks": 0, "loss_rank_avg": 0.34241533279418945, "step": 345, "valid_targets_mean": 2568.8, "valid_targets_min": 656 }, { "epoch": 0.3421309872922776, "grad_norm": 0.8550409656130434, "learning_rate": 1.9470013947001396e-05, "loss": 0.352, "loss_nan_ranks": 0, "loss_rank_avg": 0.3601570427417755, "step": 350, "valid_targets_mean": 2331.7, "valid_targets_min": 679 }, { "epoch": 0.34701857282502446, "grad_norm": 0.9155877630691556, "learning_rate": 1.9748953974895398e-05, "loss": 0.3635, "loss_nan_ranks": 0, "loss_rank_avg": 0.38951539993286133, "step": 355, "valid_targets_mean": 2071.4, "valid_targets_min": 760 }, { "epoch": 0.3519061583577713, "grad_norm": 0.883435595055635, "learning_rate": 2.0027894002789404e-05, "loss": 0.36, "loss_nan_ranks": 0, "loss_rank_avg": 0.3670802414417267, "step": 360, "valid_targets_mean": 1985.2, "valid_targets_min": 592 }, { "epoch": 0.3567937438905181, "grad_norm": 0.9206852695774652, "learning_rate": 2.0306834030683406e-05, "loss": 0.3377, "loss_nan_ranks": 0, "loss_rank_avg": 0.3370826840400696, "step": 365, "valid_targets_mean": 2055.2, "valid_targets_min": 799 }, { "epoch": 0.3616813294232649, "grad_norm": 0.7244221713153408, "learning_rate": 2.0585774058577405e-05, "loss": 0.3354, "loss_nan_ranks": 0, "loss_rank_avg": 0.36608511209487915, "step": 370, "valid_targets_mean": 3176.6, "valid_targets_min": 1237 }, { "epoch": 0.36656891495601174, "grad_norm": 0.8515795547939923, "learning_rate": 2.086471408647141e-05, "loss": 0.3533, "loss_nan_ranks": 0, "loss_rank_avg": 0.3597974181175232, "step": 375, "valid_targets_mean": 2919.8, "valid_targets_min": 1215 }, { "epoch": 0.37145650048875856, "grad_norm": 0.8264921304378712, "learning_rate": 2.1143654114365412e-05, "loss": 0.3603, "loss_nan_ranks": 0, "loss_rank_avg": 0.364242821931839, "step": 380, "valid_targets_mean": 2541.9, "valid_targets_min": 763 }, { "epoch": 0.3763440860215054, "grad_norm": 0.907898110015603, "learning_rate": 2.1422594142259415e-05, "loss": 0.341, "loss_nan_ranks": 0, "loss_rank_avg": 0.32725921273231506, "step": 385, "valid_targets_mean": 1902.6, "valid_targets_min": 464 }, { "epoch": 0.3812316715542522, "grad_norm": 0.938573710378532, "learning_rate": 2.170153417015342e-05, "loss": 0.3244, "loss_nan_ranks": 0, "loss_rank_avg": 0.34030425548553467, "step": 390, "valid_targets_mean": 2139.0, "valid_targets_min": 627 }, { "epoch": 0.386119257086999, "grad_norm": 0.9348906560243034, "learning_rate": 2.1980474198047422e-05, "loss": 0.3436, "loss_nan_ranks": 0, "loss_rank_avg": 0.3462354838848114, "step": 395, "valid_targets_mean": 2194.8, "valid_targets_min": 738 }, { "epoch": 0.39100684261974583, "grad_norm": 0.6752427727321951, "learning_rate": 2.225941422594142e-05, "loss": 0.3381, "loss_nan_ranks": 0, "loss_rank_avg": 0.33034390211105347, "step": 400, "valid_targets_mean": 3065.8, "valid_targets_min": 796 }, { "epoch": 0.39589442815249265, "grad_norm": 0.8105931491656845, "learning_rate": 2.2538354253835427e-05, "loss": 0.3508, "loss_nan_ranks": 0, "loss_rank_avg": 0.3310199975967407, "step": 405, "valid_targets_mean": 2525.2, "valid_targets_min": 900 }, { "epoch": 0.40078201368523947, "grad_norm": 0.8829736004010716, "learning_rate": 2.281729428172943e-05, "loss": 0.3529, "loss_nan_ranks": 0, "loss_rank_avg": 0.3105641305446625, "step": 410, "valid_targets_mean": 2156.9, "valid_targets_min": 805 }, { "epoch": 0.4056695992179863, "grad_norm": 1.053696655919182, "learning_rate": 2.309623430962343e-05, "loss": 0.3361, "loss_nan_ranks": 0, "loss_rank_avg": 0.3739250898361206, "step": 415, "valid_targets_mean": 2282.6, "valid_targets_min": 1170 }, { "epoch": 0.41055718475073316, "grad_norm": 0.809739823282899, "learning_rate": 2.3375174337517437e-05, "loss": 0.3311, "loss_nan_ranks": 0, "loss_rank_avg": 0.35403841733932495, "step": 420, "valid_targets_mean": 2249.1, "valid_targets_min": 698 }, { "epoch": 0.41544477028348, "grad_norm": 0.8114625727115713, "learning_rate": 2.365411436541144e-05, "loss": 0.3432, "loss_nan_ranks": 0, "loss_rank_avg": 0.3622049391269684, "step": 425, "valid_targets_mean": 2313.3, "valid_targets_min": 766 }, { "epoch": 0.4203323558162268, "grad_norm": 0.7569678066302454, "learning_rate": 2.3933054393305438e-05, "loss": 0.3358, "loss_nan_ranks": 0, "loss_rank_avg": 0.33777353167533875, "step": 430, "valid_targets_mean": 2816.7, "valid_targets_min": 859 }, { "epoch": 0.4252199413489736, "grad_norm": 0.7327933630295097, "learning_rate": 2.4211994421199444e-05, "loss": 0.3466, "loss_nan_ranks": 0, "loss_rank_avg": 0.3273935317993164, "step": 435, "valid_targets_mean": 2645.7, "valid_targets_min": 1098 }, { "epoch": 0.43010752688172044, "grad_norm": 0.8665670559962085, "learning_rate": 2.4490934449093446e-05, "loss": 0.3425, "loss_nan_ranks": 0, "loss_rank_avg": 0.3423697054386139, "step": 440, "valid_targets_mean": 2181.8, "valid_targets_min": 604 }, { "epoch": 0.43499511241446726, "grad_norm": 0.8580346981985594, "learning_rate": 2.4769874476987448e-05, "loss": 0.3384, "loss_nan_ranks": 0, "loss_rank_avg": 0.34883952140808105, "step": 445, "valid_targets_mean": 2146.7, "valid_targets_min": 638 }, { "epoch": 0.4398826979472141, "grad_norm": 0.8238090290163292, "learning_rate": 2.5048814504881454e-05, "loss": 0.3507, "loss_nan_ranks": 0, "loss_rank_avg": 0.31056028604507446, "step": 450, "valid_targets_mean": 2293.9, "valid_targets_min": 943 }, { "epoch": 0.4447702834799609, "grad_norm": 0.6463651486346894, "learning_rate": 2.5327754532775456e-05, "loss": 0.3203, "loss_nan_ranks": 0, "loss_rank_avg": 0.2803493142127991, "step": 455, "valid_targets_mean": 2967.7, "valid_targets_min": 865 }, { "epoch": 0.4496578690127077, "grad_norm": 0.941311131272596, "learning_rate": 2.5606694560669455e-05, "loss": 0.3452, "loss_nan_ranks": 0, "loss_rank_avg": 0.3155880570411682, "step": 460, "valid_targets_mean": 1743.8, "valid_targets_min": 764 }, { "epoch": 0.45454545454545453, "grad_norm": 0.736803043029875, "learning_rate": 2.588563458856346e-05, "loss": 0.3442, "loss_nan_ranks": 0, "loss_rank_avg": 0.36394965648651123, "step": 465, "valid_targets_mean": 2932.3, "valid_targets_min": 763 }, { "epoch": 0.45943304007820135, "grad_norm": 0.7921374525507471, "learning_rate": 2.6164574616457463e-05, "loss": 0.328, "loss_nan_ranks": 0, "loss_rank_avg": 0.3570030927658081, "step": 470, "valid_targets_mean": 3040.9, "valid_targets_min": 796 }, { "epoch": 0.46432062561094817, "grad_norm": 0.7900857884761241, "learning_rate": 2.6443514644351465e-05, "loss": 0.342, "loss_nan_ranks": 0, "loss_rank_avg": 0.37542372941970825, "step": 475, "valid_targets_mean": 3116.3, "valid_targets_min": 926 }, { "epoch": 0.46920821114369504, "grad_norm": 1.159582734344674, "learning_rate": 2.672245467224547e-05, "loss": 0.3439, "loss_nan_ranks": 0, "loss_rank_avg": 0.36254942417144775, "step": 480, "valid_targets_mean": 2185.8, "valid_targets_min": 713 }, { "epoch": 0.47409579667644186, "grad_norm": 0.7897072764788433, "learning_rate": 2.7001394700139473e-05, "loss": 0.3372, "loss_nan_ranks": 0, "loss_rank_avg": 0.33607053756713867, "step": 485, "valid_targets_mean": 2364.0, "valid_targets_min": 1086 }, { "epoch": 0.4789833822091887, "grad_norm": 0.8400859552438328, "learning_rate": 2.728033472803347e-05, "loss": 0.3359, "loss_nan_ranks": 0, "loss_rank_avg": 0.3387121856212616, "step": 490, "valid_targets_mean": 2131.7, "valid_targets_min": 640 }, { "epoch": 0.4838709677419355, "grad_norm": 0.7446625512121486, "learning_rate": 2.7559274755927477e-05, "loss": 0.334, "loss_nan_ranks": 0, "loss_rank_avg": 0.3753664493560791, "step": 495, "valid_targets_mean": 2741.8, "valid_targets_min": 548 }, { "epoch": 0.4887585532746823, "grad_norm": 0.7424189633962999, "learning_rate": 2.783821478382148e-05, "loss": 0.3449, "loss_nan_ranks": 0, "loss_rank_avg": 0.35922667384147644, "step": 500, "valid_targets_mean": 3106.8, "valid_targets_min": 668 }, { "epoch": 0.49364613880742914, "grad_norm": 0.8398560921552762, "learning_rate": 2.811715481171548e-05, "loss": 0.3178, "loss_nan_ranks": 0, "loss_rank_avg": 0.27231159806251526, "step": 505, "valid_targets_mean": 2408.9, "valid_targets_min": 742 }, { "epoch": 0.49853372434017595, "grad_norm": 0.8650127139587513, "learning_rate": 2.8396094839609487e-05, "loss": 0.3244, "loss_nan_ranks": 0, "loss_rank_avg": 0.31993523240089417, "step": 510, "valid_targets_mean": 2272.2, "valid_targets_min": 672 }, { "epoch": 0.5034213098729228, "grad_norm": 0.8145474264636156, "learning_rate": 2.867503486750349e-05, "loss": 0.3321, "loss_nan_ranks": 0, "loss_rank_avg": 0.3184545040130615, "step": 515, "valid_targets_mean": 2181.7, "valid_targets_min": 676 }, { "epoch": 0.5083088954056696, "grad_norm": 0.8995961884293948, "learning_rate": 2.8953974895397488e-05, "loss": 0.3233, "loss_nan_ranks": 0, "loss_rank_avg": 0.34413954615592957, "step": 520, "valid_targets_mean": 2101.1, "valid_targets_min": 1055 }, { "epoch": 0.5131964809384164, "grad_norm": 0.7980166217846976, "learning_rate": 2.9232914923291494e-05, "loss": 0.3308, "loss_nan_ranks": 0, "loss_rank_avg": 0.3372722864151001, "step": 525, "valid_targets_mean": 2395.6, "valid_targets_min": 1282 }, { "epoch": 0.5180840664711632, "grad_norm": 1.1201293160921861, "learning_rate": 2.9511854951185496e-05, "loss": 0.323, "loss_nan_ranks": 0, "loss_rank_avg": 0.31446385383605957, "step": 530, "valid_targets_mean": 2134.9, "valid_targets_min": 922 }, { "epoch": 0.52297165200391, "grad_norm": 0.7342360486498539, "learning_rate": 2.9790794979079498e-05, "loss": 0.3321, "loss_nan_ranks": 0, "loss_rank_avg": 0.30906954407691956, "step": 535, "valid_targets_mean": 2658.1, "valid_targets_min": 1076 }, { "epoch": 0.5278592375366569, "grad_norm": 0.7267057803106786, "learning_rate": 3.0069735006973504e-05, "loss": 0.32, "loss_nan_ranks": 0, "loss_rank_avg": 0.3381599187850952, "step": 540, "valid_targets_mean": 2644.8, "valid_targets_min": 814 }, { "epoch": 0.5327468230694037, "grad_norm": 0.8500045196292703, "learning_rate": 3.0348675034867506e-05, "loss": 0.3205, "loss_nan_ranks": 0, "loss_rank_avg": 0.29569292068481445, "step": 545, "valid_targets_mean": 1866.9, "valid_targets_min": 530 }, { "epoch": 0.5376344086021505, "grad_norm": 0.7412443952817233, "learning_rate": 3.062761506276151e-05, "loss": 0.3355, "loss_nan_ranks": 0, "loss_rank_avg": 0.345531165599823, "step": 550, "valid_targets_mean": 2880.6, "valid_targets_min": 905 }, { "epoch": 0.5425219941348973, "grad_norm": 0.6993041939598253, "learning_rate": 3.0906555090655514e-05, "loss": 0.3124, "loss_nan_ranks": 0, "loss_rank_avg": 0.3102779984474182, "step": 555, "valid_targets_mean": 2846.2, "valid_targets_min": 790 }, { "epoch": 0.5474095796676441, "grad_norm": 0.7359314473756243, "learning_rate": 3.118549511854951e-05, "loss": 0.3203, "loss_nan_ranks": 0, "loss_rank_avg": 0.32391446828842163, "step": 560, "valid_targets_mean": 2719.4, "valid_targets_min": 816 }, { "epoch": 0.552297165200391, "grad_norm": 0.8113820976460382, "learning_rate": 3.146443514644352e-05, "loss": 0.3409, "loss_nan_ranks": 0, "loss_rank_avg": 0.30669841170310974, "step": 565, "valid_targets_mean": 2390.4, "valid_targets_min": 669 }, { "epoch": 0.5571847507331378, "grad_norm": 0.8096140445105596, "learning_rate": 3.1743375174337524e-05, "loss": 0.2977, "loss_nan_ranks": 0, "loss_rank_avg": 0.3120150566101074, "step": 570, "valid_targets_mean": 2190.9, "valid_targets_min": 739 }, { "epoch": 0.5620723362658846, "grad_norm": 0.9110568245840788, "learning_rate": 3.202231520223152e-05, "loss": 0.314, "loss_nan_ranks": 0, "loss_rank_avg": 0.3165706992149353, "step": 575, "valid_targets_mean": 1853.4, "valid_targets_min": 722 }, { "epoch": 0.5669599217986315, "grad_norm": 0.7684538091148991, "learning_rate": 3.230125523012553e-05, "loss": 0.3162, "loss_nan_ranks": 0, "loss_rank_avg": 0.2956627607345581, "step": 580, "valid_targets_mean": 2559.9, "valid_targets_min": 987 }, { "epoch": 0.5718475073313783, "grad_norm": 0.7441624896883247, "learning_rate": 3.258019525801953e-05, "loss": 0.3292, "loss_nan_ranks": 0, "loss_rank_avg": 0.3297075033187866, "step": 585, "valid_targets_mean": 2662.0, "valid_targets_min": 711 }, { "epoch": 0.5767350928641252, "grad_norm": 0.8719735596323135, "learning_rate": 3.285913528591353e-05, "loss": 0.3205, "loss_nan_ranks": 0, "loss_rank_avg": 0.3282514214515686, "step": 590, "valid_targets_mean": 2034.2, "valid_targets_min": 851 }, { "epoch": 0.581622678396872, "grad_norm": 0.8090870634352967, "learning_rate": 3.313807531380754e-05, "loss": 0.3329, "loss_nan_ranks": 0, "loss_rank_avg": 0.31386953592300415, "step": 595, "valid_targets_mean": 2551.9, "valid_targets_min": 914 }, { "epoch": 0.5865102639296188, "grad_norm": 0.7207352022007785, "learning_rate": 3.341701534170154e-05, "loss": 0.3237, "loss_nan_ranks": 0, "loss_rank_avg": 0.3386681079864502, "step": 600, "valid_targets_mean": 2835.5, "valid_targets_min": 661 }, { "epoch": 0.5913978494623656, "grad_norm": 0.7584008460860305, "learning_rate": 3.3695955369595536e-05, "loss": 0.3284, "loss_nan_ranks": 0, "loss_rank_avg": 0.28931134939193726, "step": 605, "valid_targets_mean": 2277.4, "valid_targets_min": 1014 }, { "epoch": 0.5962854349951124, "grad_norm": 0.792721139679117, "learning_rate": 3.397489539748954e-05, "loss": 0.3312, "loss_nan_ranks": 0, "loss_rank_avg": 0.33046597242355347, "step": 610, "valid_targets_mean": 2322.7, "valid_targets_min": 704 }, { "epoch": 0.6011730205278593, "grad_norm": 0.7784271949093392, "learning_rate": 3.425383542538355e-05, "loss": 0.3356, "loss_nan_ranks": 0, "loss_rank_avg": 0.3591078519821167, "step": 615, "valid_targets_mean": 2750.8, "valid_targets_min": 929 }, { "epoch": 0.6060606060606061, "grad_norm": 0.8776498743873912, "learning_rate": 3.4532775453277546e-05, "loss": 0.3143, "loss_nan_ranks": 0, "loss_rank_avg": 0.33385688066482544, "step": 620, "valid_targets_mean": 2140.5, "valid_targets_min": 642 }, { "epoch": 0.6109481915933529, "grad_norm": 0.746820447052271, "learning_rate": 3.481171548117155e-05, "loss": 0.3296, "loss_nan_ranks": 0, "loss_rank_avg": 0.33402806520462036, "step": 625, "valid_targets_mean": 2436.4, "valid_targets_min": 895 }, { "epoch": 0.6158357771260997, "grad_norm": 0.7897960735140778, "learning_rate": 3.509065550906556e-05, "loss": 0.3214, "loss_nan_ranks": 0, "loss_rank_avg": 0.31994372606277466, "step": 630, "valid_targets_mean": 2388.4, "valid_targets_min": 915 }, { "epoch": 0.6207233626588465, "grad_norm": 0.7255296236144402, "learning_rate": 3.5369595536959556e-05, "loss": 0.32, "loss_nan_ranks": 0, "loss_rank_avg": 0.3037095069885254, "step": 635, "valid_targets_mean": 2603.6, "valid_targets_min": 635 }, { "epoch": 0.6256109481915934, "grad_norm": 0.8068527468176921, "learning_rate": 3.564853556485356e-05, "loss": 0.3123, "loss_nan_ranks": 0, "loss_rank_avg": 0.31424158811569214, "step": 640, "valid_targets_mean": 2459.6, "valid_targets_min": 636 }, { "epoch": 0.6304985337243402, "grad_norm": 0.7702625587232006, "learning_rate": 3.592747559274756e-05, "loss": 0.3358, "loss_nan_ranks": 0, "loss_rank_avg": 0.3524268567562103, "step": 645, "valid_targets_mean": 2649.3, "valid_targets_min": 1140 }, { "epoch": 0.635386119257087, "grad_norm": 0.7714466133072925, "learning_rate": 3.6206415620641566e-05, "loss": 0.3286, "loss_nan_ranks": 0, "loss_rank_avg": 0.31589627265930176, "step": 650, "valid_targets_mean": 2330.5, "valid_targets_min": 657 }, { "epoch": 0.6402737047898338, "grad_norm": 0.7977408416406456, "learning_rate": 3.648535564853557e-05, "loss": 0.3244, "loss_nan_ranks": 0, "loss_rank_avg": 0.29703885316848755, "step": 655, "valid_targets_mean": 2082.4, "valid_targets_min": 725 }, { "epoch": 0.6451612903225806, "grad_norm": 0.897859600419085, "learning_rate": 3.676429567642957e-05, "loss": 0.3072, "loss_nan_ranks": 0, "loss_rank_avg": 0.32600027322769165, "step": 660, "valid_targets_mean": 2019.0, "valid_targets_min": 740 }, { "epoch": 0.6500488758553274, "grad_norm": 0.8217894407117475, "learning_rate": 3.704323570432357e-05, "loss": 0.3197, "loss_nan_ranks": 0, "loss_rank_avg": 0.2989169955253601, "step": 665, "valid_targets_mean": 2451.2, "valid_targets_min": 1105 }, { "epoch": 0.6549364613880743, "grad_norm": 0.6967345052464025, "learning_rate": 3.7322175732217575e-05, "loss": 0.298, "loss_nan_ranks": 0, "loss_rank_avg": 0.28789329528808594, "step": 670, "valid_targets_mean": 2827.7, "valid_targets_min": 692 }, { "epoch": 0.6598240469208211, "grad_norm": 0.730001904109528, "learning_rate": 3.760111576011158e-05, "loss": 0.3068, "loss_nan_ranks": 0, "loss_rank_avg": 0.31676405668258667, "step": 675, "valid_targets_mean": 2389.0, "valid_targets_min": 660 }, { "epoch": 0.6647116324535679, "grad_norm": 0.7898161538858068, "learning_rate": 3.788005578800558e-05, "loss": 0.3168, "loss_nan_ranks": 0, "loss_rank_avg": 0.29914867877960205, "step": 680, "valid_targets_mean": 2101.6, "valid_targets_min": 894 }, { "epoch": 0.6695992179863147, "grad_norm": 0.7857150534119379, "learning_rate": 3.8158995815899585e-05, "loss": 0.3295, "loss_nan_ranks": 0, "loss_rank_avg": 0.3327745199203491, "step": 685, "valid_targets_mean": 2511.1, "valid_targets_min": 744 }, { "epoch": 0.6744868035190615, "grad_norm": 0.6691932395126847, "learning_rate": 3.843793584379359e-05, "loss": 0.3211, "loss_nan_ranks": 0, "loss_rank_avg": 0.3309377431869507, "step": 690, "valid_targets_mean": 2951.6, "valid_targets_min": 644 }, { "epoch": 0.6793743890518084, "grad_norm": 1.1193866441330809, "learning_rate": 3.871687587168759e-05, "loss": 0.3372, "loss_nan_ranks": 0, "loss_rank_avg": 0.36905205249786377, "step": 695, "valid_targets_mean": 2194.1, "valid_targets_min": 818 }, { "epoch": 0.6842619745845552, "grad_norm": 0.7857310721423778, "learning_rate": 3.8995815899581595e-05, "loss": 0.3273, "loss_nan_ranks": 0, "loss_rank_avg": 0.30003082752227783, "step": 700, "valid_targets_mean": 2174.9, "valid_targets_min": 557 }, { "epoch": 0.6891495601173021, "grad_norm": 0.7397963727859, "learning_rate": 3.9274755927475594e-05, "loss": 0.3207, "loss_nan_ranks": 0, "loss_rank_avg": 0.2808341383934021, "step": 705, "valid_targets_mean": 2378.6, "valid_targets_min": 794 }, { "epoch": 0.6940371456500489, "grad_norm": 1.068416619253061, "learning_rate": 3.95536959553696e-05, "loss": 0.3241, "loss_nan_ranks": 0, "loss_rank_avg": 0.32398268580436707, "step": 710, "valid_targets_mean": 1853.6, "valid_targets_min": 791 }, { "epoch": 0.6989247311827957, "grad_norm": 0.7883949750339846, "learning_rate": 3.9832635983263605e-05, "loss": 0.307, "loss_nan_ranks": 0, "loss_rank_avg": 0.3216050863265991, "step": 715, "valid_targets_mean": 2201.4, "valid_targets_min": 661 }, { "epoch": 0.7038123167155426, "grad_norm": 0.7210396481396164, "learning_rate": 3.999999049288738e-05, "loss": 0.3086, "loss_nan_ranks": 0, "loss_rank_avg": 0.32969582080841064, "step": 720, "valid_targets_mean": 2724.2, "valid_targets_min": 572 }, { "epoch": 0.7086999022482894, "grad_norm": 0.6780724521617006, "learning_rate": 3.9999883537974135e-05, "loss": 0.3123, "loss_nan_ranks": 0, "loss_rank_avg": 0.3392641842365265, "step": 725, "valid_targets_mean": 2957.1, "valid_targets_min": 856 }, { "epoch": 0.7135874877810362, "grad_norm": 1.4001056248209713, "learning_rate": 3.999965774489451e-05, "loss": 0.3241, "loss_nan_ranks": 0, "loss_rank_avg": 0.31240707635879517, "step": 730, "valid_targets_mean": 2448.2, "valid_targets_min": 740 }, { "epoch": 0.718475073313783, "grad_norm": 0.7066267173981833, "learning_rate": 3.999931311499014e-05, "loss": 0.2993, "loss_nan_ranks": 0, "loss_rank_avg": 0.2746642827987671, "step": 735, "valid_targets_mean": 2677.8, "valid_targets_min": 1280 }, { "epoch": 0.7233626588465298, "grad_norm": 0.9463337394740791, "learning_rate": 3.999884965030881e-05, "loss": 0.3138, "loss_nan_ranks": 0, "loss_rank_avg": 0.34243521094322205, "step": 740, "valid_targets_mean": 1775.4, "valid_targets_min": 679 }, { "epoch": 0.7282502443792767, "grad_norm": 0.7034930040606712, "learning_rate": 3.9998267353604396e-05, "loss": 0.3083, "loss_nan_ranks": 0, "loss_rank_avg": 0.3177798390388489, "step": 745, "valid_targets_mean": 2800.6, "valid_targets_min": 920 }, { "epoch": 0.7331378299120235, "grad_norm": 0.6916689022053226, "learning_rate": 3.9997566228336865e-05, "loss": 0.3207, "loss_nan_ranks": 0, "loss_rank_avg": 0.289054274559021, "step": 750, "valid_targets_mean": 2406.8, "valid_targets_min": 856 }, { "epoch": 0.7380254154447703, "grad_norm": 0.7430166452541812, "learning_rate": 3.999674627867228e-05, "loss": 0.3008, "loss_nan_ranks": 0, "loss_rank_avg": 0.29457688331604004, "step": 755, "valid_targets_mean": 2496.6, "valid_targets_min": 804 }, { "epoch": 0.7429130009775171, "grad_norm": 0.7604153844606187, "learning_rate": 3.9995807509482715e-05, "loss": 0.3298, "loss_nan_ranks": 0, "loss_rank_avg": 0.37004536390304565, "step": 760, "valid_targets_mean": 2459.6, "valid_targets_min": 910 }, { "epoch": 0.7478005865102639, "grad_norm": 0.7783050791408205, "learning_rate": 3.99947499263463e-05, "loss": 0.3071, "loss_nan_ranks": 0, "loss_rank_avg": 0.26048505306243896, "step": 765, "valid_targets_mean": 1702.1, "valid_targets_min": 641 }, { "epoch": 0.7526881720430108, "grad_norm": 0.6842291009472856, "learning_rate": 3.999357353554712e-05, "loss": 0.2899, "loss_nan_ranks": 0, "loss_rank_avg": 0.2890620529651642, "step": 770, "valid_targets_mean": 2460.7, "valid_targets_min": 741 }, { "epoch": 0.7575757575757576, "grad_norm": 0.7667053941772743, "learning_rate": 3.999227834407523e-05, "loss": 0.3122, "loss_nan_ranks": 0, "loss_rank_avg": 0.3236725330352783, "step": 775, "valid_targets_mean": 2326.1, "valid_targets_min": 1024 }, { "epoch": 0.7624633431085044, "grad_norm": 0.9459473272945332, "learning_rate": 3.9990864359626586e-05, "loss": 0.2866, "loss_nan_ranks": 0, "loss_rank_avg": 0.2749725580215454, "step": 780, "valid_targets_mean": 2354.9, "valid_targets_min": 914 }, { "epoch": 0.7673509286412512, "grad_norm": 0.7184999480991484, "learning_rate": 3.9989331590603e-05, "loss": 0.3203, "loss_nan_ranks": 0, "loss_rank_avg": 0.3461282253265381, "step": 785, "valid_targets_mean": 2811.2, "valid_targets_min": 725 }, { "epoch": 0.772238514173998, "grad_norm": 0.6593556008310089, "learning_rate": 3.998768004611209e-05, "loss": 0.3225, "loss_nan_ranks": 0, "loss_rank_avg": 0.35281455516815186, "step": 790, "valid_targets_mean": 3194.9, "valid_targets_min": 1180 }, { "epoch": 0.7771260997067448, "grad_norm": 0.7230785157141715, "learning_rate": 3.998590973596725e-05, "loss": 0.3356, "loss_nan_ranks": 0, "loss_rank_avg": 0.3064287304878235, "step": 795, "valid_targets_mean": 2452.0, "valid_targets_min": 786 }, { "epoch": 0.7820136852394917, "grad_norm": 0.6934289312826055, "learning_rate": 3.998402067068755e-05, "loss": 0.3336, "loss_nan_ranks": 0, "loss_rank_avg": 0.3232996165752411, "step": 800, "valid_targets_mean": 2586.8, "valid_targets_min": 1015 }, { "epoch": 0.7869012707722385, "grad_norm": 0.6558930070169424, "learning_rate": 3.998201286149772e-05, "loss": 0.3206, "loss_nan_ranks": 0, "loss_rank_avg": 0.33236560225486755, "step": 805, "valid_targets_mean": 3404.1, "valid_targets_min": 660 }, { "epoch": 0.7917888563049853, "grad_norm": 0.7295217695663251, "learning_rate": 3.997988632032805e-05, "loss": 0.3012, "loss_nan_ranks": 0, "loss_rank_avg": 0.3009946346282959, "step": 810, "valid_targets_mean": 2459.5, "valid_targets_min": 970 }, { "epoch": 0.7966764418377321, "grad_norm": 0.8584536403730917, "learning_rate": 3.99776410598143e-05, "loss": 0.3159, "loss_nan_ranks": 0, "loss_rank_avg": 0.32543686032295227, "step": 815, "valid_targets_mean": 2278.4, "valid_targets_min": 852 }, { "epoch": 0.8015640273704789, "grad_norm": 0.7449337414001902, "learning_rate": 3.997527709329772e-05, "loss": 0.317, "loss_nan_ranks": 0, "loss_rank_avg": 0.3691062927246094, "step": 820, "valid_targets_mean": 2001.3, "valid_targets_min": 625 }, { "epoch": 0.8064516129032258, "grad_norm": 0.7287752989474822, "learning_rate": 3.997279443482484e-05, "loss": 0.3146, "loss_nan_ranks": 0, "loss_rank_avg": 0.3165518045425415, "step": 825, "valid_targets_mean": 2824.4, "valid_targets_min": 1123 }, { "epoch": 0.8113391984359726, "grad_norm": 0.7414141117963199, "learning_rate": 3.997019309914747e-05, "loss": 0.3146, "loss_nan_ranks": 0, "loss_rank_avg": 0.3582077622413635, "step": 830, "valid_targets_mean": 2533.0, "valid_targets_min": 922 }, { "epoch": 0.8162267839687195, "grad_norm": 0.6604646667995736, "learning_rate": 3.996747310172261e-05, "loss": 0.2997, "loss_nan_ranks": 0, "loss_rank_avg": 0.3009747266769409, "step": 835, "valid_targets_mean": 2743.4, "valid_targets_min": 815 }, { "epoch": 0.8211143695014663, "grad_norm": 0.7869481152483848, "learning_rate": 3.996463445871233e-05, "loss": 0.3012, "loss_nan_ranks": 0, "loss_rank_avg": 0.28774186968803406, "step": 840, "valid_targets_mean": 2012.9, "valid_targets_min": 1019 }, { "epoch": 0.8260019550342131, "grad_norm": 0.7796967007238236, "learning_rate": 3.996167718698368e-05, "loss": 0.2991, "loss_nan_ranks": 0, "loss_rank_avg": 0.28823673725128174, "step": 845, "valid_targets_mean": 1971.4, "valid_targets_min": 858 }, { "epoch": 0.83088954056696, "grad_norm": 0.7921234290446715, "learning_rate": 3.9958601304108596e-05, "loss": 0.3121, "loss_nan_ranks": 0, "loss_rank_avg": 0.29436832666397095, "step": 850, "valid_targets_mean": 2040.2, "valid_targets_min": 780 }, { "epoch": 0.8357771260997068, "grad_norm": 0.7773209045309674, "learning_rate": 3.995540682836381e-05, "loss": 0.3047, "loss_nan_ranks": 0, "loss_rank_avg": 0.320604145526886, "step": 855, "valid_targets_mean": 2100.3, "valid_targets_min": 635 }, { "epoch": 0.8406647116324536, "grad_norm": 0.7068147985901192, "learning_rate": 3.99520937787307e-05, "loss": 0.3111, "loss_nan_ranks": 0, "loss_rank_avg": 0.2897074818611145, "step": 860, "valid_targets_mean": 2451.1, "valid_targets_min": 781 }, { "epoch": 0.8455522971652004, "grad_norm": 0.6227835458943253, "learning_rate": 3.994866217489523e-05, "loss": 0.3086, "loss_nan_ranks": 0, "loss_rank_avg": 0.2862326502799988, "step": 865, "valid_targets_mean": 3045.1, "valid_targets_min": 892 }, { "epoch": 0.8504398826979472, "grad_norm": 0.8510089182055716, "learning_rate": 3.994511203724779e-05, "loss": 0.2996, "loss_nan_ranks": 0, "loss_rank_avg": 0.31772327423095703, "step": 870, "valid_targets_mean": 2259.7, "valid_targets_min": 900 }, { "epoch": 0.855327468230694, "grad_norm": 0.7031577446655919, "learning_rate": 3.9941443386883086e-05, "loss": 0.3074, "loss_nan_ranks": 0, "loss_rank_avg": 0.3305051922798157, "step": 875, "valid_targets_mean": 2753.0, "valid_targets_min": 976 }, { "epoch": 0.8602150537634409, "grad_norm": 0.7949638614035321, "learning_rate": 3.9937656245600044e-05, "loss": 0.3089, "loss_nan_ranks": 0, "loss_rank_avg": 0.3418285846710205, "step": 880, "valid_targets_mean": 2385.2, "valid_targets_min": 804 }, { "epoch": 0.8651026392961877, "grad_norm": 0.7305187723607021, "learning_rate": 3.993375063590164e-05, "loss": 0.3138, "loss_nan_ranks": 0, "loss_rank_avg": 0.3128136992454529, "step": 885, "valid_targets_mean": 2648.4, "valid_targets_min": 1208 }, { "epoch": 0.8699902248289345, "grad_norm": 1.1746959130401167, "learning_rate": 3.9929726580994775e-05, "loss": 0.306, "loss_nan_ranks": 0, "loss_rank_avg": 0.2941882610321045, "step": 890, "valid_targets_mean": 2617.6, "valid_targets_min": 904 }, { "epoch": 0.8748778103616813, "grad_norm": 0.7402990200201592, "learning_rate": 3.992558410479015e-05, "loss": 0.2926, "loss_nan_ranks": 0, "loss_rank_avg": 0.2941339612007141, "step": 895, "valid_targets_mean": 2542.5, "valid_targets_min": 735 }, { "epoch": 0.8797653958944281, "grad_norm": 0.7737988843199513, "learning_rate": 3.992132323190214e-05, "loss": 0.2966, "loss_nan_ranks": 0, "loss_rank_avg": 0.2719045579433441, "step": 900, "valid_targets_mean": 1987.3, "valid_targets_min": 878 }, { "epoch": 0.884652981427175, "grad_norm": 0.7582651606562361, "learning_rate": 3.99169439876486e-05, "loss": 0.3268, "loss_nan_ranks": 0, "loss_rank_avg": 0.3535369634628296, "step": 905, "valid_targets_mean": 2560.1, "valid_targets_min": 870 }, { "epoch": 0.8895405669599218, "grad_norm": 0.7699462585158438, "learning_rate": 3.991244639805074e-05, "loss": 0.3065, "loss_nan_ranks": 0, "loss_rank_avg": 0.3052283823490143, "step": 910, "valid_targets_mean": 2282.6, "valid_targets_min": 900 }, { "epoch": 0.8944281524926686, "grad_norm": 0.7785182577824628, "learning_rate": 3.9907830489832993e-05, "loss": 0.3019, "loss_nan_ranks": 0, "loss_rank_avg": 0.26899123191833496, "step": 915, "valid_targets_mean": 2104.2, "valid_targets_min": 676 }, { "epoch": 0.8993157380254154, "grad_norm": 0.8574210895658473, "learning_rate": 3.990309629042281e-05, "loss": 0.3052, "loss_nan_ranks": 0, "loss_rank_avg": 0.2943177819252014, "step": 920, "valid_targets_mean": 2444.8, "valid_targets_min": 1100 }, { "epoch": 0.9042033235581622, "grad_norm": 0.7284561255560225, "learning_rate": 3.989824382795055e-05, "loss": 0.3046, "loss_nan_ranks": 0, "loss_rank_avg": 0.29493361711502075, "step": 925, "valid_targets_mean": 2599.8, "valid_targets_min": 801 }, { "epoch": 0.9090909090909091, "grad_norm": 0.6857751641162575, "learning_rate": 3.989327313124926e-05, "loss": 0.3186, "loss_nan_ranks": 0, "loss_rank_avg": 0.3466421961784363, "step": 930, "valid_targets_mean": 2798.0, "valid_targets_min": 911 }, { "epoch": 0.9139784946236559, "grad_norm": 0.7493847771371742, "learning_rate": 3.9888184229854525e-05, "loss": 0.3163, "loss_nan_ranks": 0, "loss_rank_avg": 0.32370316982269287, "step": 935, "valid_targets_mean": 2422.5, "valid_targets_min": 703 }, { "epoch": 0.9188660801564027, "grad_norm": 0.6989351581606708, "learning_rate": 3.988297715400432e-05, "loss": 0.2974, "loss_nan_ranks": 0, "loss_rank_avg": 0.2930717468261719, "step": 940, "valid_targets_mean": 2921.4, "valid_targets_min": 1264 }, { "epoch": 0.9237536656891495, "grad_norm": 0.7430743004739445, "learning_rate": 3.987765193463879e-05, "loss": 0.2861, "loss_nan_ranks": 0, "loss_rank_avg": 0.25492438673973083, "step": 945, "valid_targets_mean": 2135.5, "valid_targets_min": 800 }, { "epoch": 0.9286412512218963, "grad_norm": 0.6670033217086339, "learning_rate": 3.987220860340009e-05, "loss": 0.3058, "loss_nan_ranks": 0, "loss_rank_avg": 0.3239936828613281, "step": 950, "valid_targets_mean": 3289.5, "valid_targets_min": 715 }, { "epoch": 0.9335288367546432, "grad_norm": 0.6702989912107715, "learning_rate": 3.9866647192632176e-05, "loss": 0.2958, "loss_nan_ranks": 0, "loss_rank_avg": 0.33095431327819824, "step": 955, "valid_targets_mean": 2921.6, "valid_targets_min": 1062 }, { "epoch": 0.9384164222873901, "grad_norm": 0.6929820388448079, "learning_rate": 3.986096773538063e-05, "loss": 0.3096, "loss_nan_ranks": 0, "loss_rank_avg": 0.3430343270301819, "step": 960, "valid_targets_mean": 2701.9, "valid_targets_min": 1179 }, { "epoch": 0.9433040078201369, "grad_norm": 0.7185025063166174, "learning_rate": 3.985517026539247e-05, "loss": 0.3038, "loss_nan_ranks": 0, "loss_rank_avg": 0.29739582538604736, "step": 965, "valid_targets_mean": 2256.4, "valid_targets_min": 980 }, { "epoch": 0.9481915933528837, "grad_norm": 0.7330014703291616, "learning_rate": 3.9849254817115925e-05, "loss": 0.3009, "loss_nan_ranks": 0, "loss_rank_avg": 0.30947941541671753, "step": 970, "valid_targets_mean": 2393.1, "valid_targets_min": 814 }, { "epoch": 0.9530791788856305, "grad_norm": 0.692392838579322, "learning_rate": 3.984322142570026e-05, "loss": 0.2948, "loss_nan_ranks": 0, "loss_rank_avg": 0.2626379728317261, "step": 975, "valid_targets_mean": 2232.8, "valid_targets_min": 854 }, { "epoch": 0.9579667644183774, "grad_norm": 0.7858755039683706, "learning_rate": 3.983707012699554e-05, "loss": 0.292, "loss_nan_ranks": 0, "loss_rank_avg": 0.31549689173698425, "step": 980, "valid_targets_mean": 2162.8, "valid_targets_min": 967 }, { "epoch": 0.9628543499511242, "grad_norm": 1.1798359180734284, "learning_rate": 3.983080095755242e-05, "loss": 0.2951, "loss_nan_ranks": 0, "loss_rank_avg": 0.30286744236946106, "step": 985, "valid_targets_mean": 2232.1, "valid_targets_min": 612 }, { "epoch": 0.967741935483871, "grad_norm": 0.6652279763756077, "learning_rate": 3.982441395462196e-05, "loss": 0.3031, "loss_nan_ranks": 0, "loss_rank_avg": 0.2915736436843872, "step": 990, "valid_targets_mean": 2793.2, "valid_targets_min": 903 }, { "epoch": 0.9726295210166178, "grad_norm": 0.7934359151694675, "learning_rate": 3.9817909156155364e-05, "loss": 0.2959, "loss_nan_ranks": 0, "loss_rank_avg": 0.3128136396408081, "step": 995, "valid_targets_mean": 2334.7, "valid_targets_min": 642 }, { "epoch": 0.9775171065493646, "grad_norm": 0.6891936895341518, "learning_rate": 3.981128660080377e-05, "loss": 0.2905, "loss_nan_ranks": 0, "loss_rank_avg": 0.2969144880771637, "step": 1000, "valid_targets_mean": 2541.0, "valid_targets_min": 634 }, { "epoch": 0.9824046920821115, "grad_norm": 0.6463480054438933, "learning_rate": 3.9804546327918025e-05, "loss": 0.3045, "loss_nan_ranks": 0, "loss_rank_avg": 0.29501742124557495, "step": 1005, "valid_targets_mean": 2564.6, "valid_targets_min": 714 }, { "epoch": 0.9872922776148583, "grad_norm": 0.6654896254454947, "learning_rate": 3.9797688377548443e-05, "loss": 0.2974, "loss_nan_ranks": 0, "loss_rank_avg": 0.30969366431236267, "step": 1010, "valid_targets_mean": 3066.6, "valid_targets_min": 682 }, { "epoch": 0.9921798631476051, "grad_norm": 0.6711120956545672, "learning_rate": 3.979071279044458e-05, "loss": 0.3167, "loss_nan_ranks": 0, "loss_rank_avg": 0.3256608247756958, "step": 1015, "valid_targets_mean": 2601.2, "valid_targets_min": 1157 }, { "epoch": 0.9970674486803519, "grad_norm": 0.7414237101887737, "learning_rate": 3.9783619608054976e-05, "loss": 0.3275, "loss_nan_ranks": 0, "loss_rank_avg": 0.34451091289520264, "step": 1020, "valid_targets_mean": 2595.6, "valid_targets_min": 1188 }, { "epoch": 1.0019550342130987, "grad_norm": 0.6693075231319553, "learning_rate": 3.977640887252691e-05, "loss": 0.3112, "loss_nan_ranks": 0, "loss_rank_avg": 0.29463478922843933, "step": 1025, "valid_targets_mean": 2843.2, "valid_targets_min": 985 }, { "epoch": 1.0068426197458455, "grad_norm": 0.7374854812974025, "learning_rate": 3.976908062670616e-05, "loss": 0.2789, "loss_nan_ranks": 0, "loss_rank_avg": 0.2664167284965515, "step": 1030, "valid_targets_mean": 2574.8, "valid_targets_min": 1291 }, { "epoch": 1.0117302052785924, "grad_norm": 0.7176161611789769, "learning_rate": 3.976163491413675e-05, "loss": 0.2899, "loss_nan_ranks": 0, "loss_rank_avg": 0.3102620840072632, "step": 1035, "valid_targets_mean": 2583.6, "valid_targets_min": 964 }, { "epoch": 1.0166177908113392, "grad_norm": 0.6120097146085149, "learning_rate": 3.9754071779060674e-05, "loss": 0.2955, "loss_nan_ranks": 0, "loss_rank_avg": 0.29326507449150085, "step": 1040, "valid_targets_mean": 3918.3, "valid_targets_min": 812 }, { "epoch": 1.021505376344086, "grad_norm": 0.6381885490796083, "learning_rate": 3.9746391266417664e-05, "loss": 0.2767, "loss_nan_ranks": 0, "loss_rank_avg": 0.2916497588157654, "step": 1045, "valid_targets_mean": 3250.8, "valid_targets_min": 672 }, { "epoch": 1.0263929618768328, "grad_norm": 0.6912845827934561, "learning_rate": 3.973859342184487e-05, "loss": 0.3046, "loss_nan_ranks": 0, "loss_rank_avg": 0.3102365732192993, "step": 1050, "valid_targets_mean": 3456.9, "valid_targets_min": 1028 }, { "epoch": 1.0312805474095796, "grad_norm": 0.6994698165553925, "learning_rate": 3.973067829167664e-05, "loss": 0.2847, "loss_nan_ranks": 0, "loss_rank_avg": 0.2805289030075073, "step": 1055, "valid_targets_mean": 2511.4, "valid_targets_min": 1131 }, { "epoch": 1.0361681329423265, "grad_norm": 0.7049190368603762, "learning_rate": 3.972264592294424e-05, "loss": 0.285, "loss_nan_ranks": 0, "loss_rank_avg": 0.27423086762428284, "step": 1060, "valid_targets_mean": 2325.2, "valid_targets_min": 617 }, { "epoch": 1.0410557184750733, "grad_norm": 0.803585152797481, "learning_rate": 3.971449636337553e-05, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.3054800033569336, "step": 1065, "valid_targets_mean": 2130.8, "valid_targets_min": 633 }, { "epoch": 1.04594330400782, "grad_norm": 0.8125386640556346, "learning_rate": 3.970622966139474e-05, "loss": 0.2796, "loss_nan_ranks": 0, "loss_rank_avg": 0.3040192723274231, "step": 1070, "valid_targets_mean": 2165.8, "valid_targets_min": 726 }, { "epoch": 1.050830889540567, "grad_norm": 0.6875765301460454, "learning_rate": 3.969784586612213e-05, "loss": 0.2682, "loss_nan_ranks": 0, "loss_rank_avg": 0.2739431858062744, "step": 1075, "valid_targets_mean": 2306.1, "valid_targets_min": 750 }, { "epoch": 1.0557184750733137, "grad_norm": 0.7590315528229628, "learning_rate": 3.968934502737375e-05, "loss": 0.2849, "loss_nan_ranks": 0, "loss_rank_avg": 0.28198593854904175, "step": 1080, "valid_targets_mean": 2487.6, "valid_targets_min": 703 }, { "epoch": 1.0606060606060606, "grad_norm": 0.767363949833768, "learning_rate": 3.968072719566108e-05, "loss": 0.2657, "loss_nan_ranks": 0, "loss_rank_avg": 0.2522793114185333, "step": 1085, "valid_targets_mean": 1953.9, "valid_targets_min": 746 }, { "epoch": 1.0654936461388074, "grad_norm": 0.763111692809638, "learning_rate": 3.96719924221908e-05, "loss": 0.2741, "loss_nan_ranks": 0, "loss_rank_avg": 0.31584176421165466, "step": 1090, "valid_targets_mean": 2352.2, "valid_targets_min": 788 }, { "epoch": 1.0703812316715542, "grad_norm": 0.7106137161882315, "learning_rate": 3.966314075886442e-05, "loss": 0.2855, "loss_nan_ranks": 0, "loss_rank_avg": 0.2609940767288208, "step": 1095, "valid_targets_mean": 2245.1, "valid_targets_min": 867 }, { "epoch": 1.075268817204301, "grad_norm": 0.8801431366949057, "learning_rate": 3.9654172258278026e-05, "loss": 0.2708, "loss_nan_ranks": 0, "loss_rank_avg": 0.26888507604599, "step": 1100, "valid_targets_mean": 2219.1, "valid_targets_min": 737 }, { "epoch": 1.0801564027370478, "grad_norm": 0.9630113421733234, "learning_rate": 3.964508697372194e-05, "loss": 0.2862, "loss_nan_ranks": 0, "loss_rank_avg": 0.2783164083957672, "step": 1105, "valid_targets_mean": 2106.6, "valid_targets_min": 670 }, { "epoch": 1.0850439882697946, "grad_norm": 0.7056624571864765, "learning_rate": 3.96358849591804e-05, "loss": 0.2787, "loss_nan_ranks": 0, "loss_rank_avg": 0.2580503821372986, "step": 1110, "valid_targets_mean": 2245.5, "valid_targets_min": 830 }, { "epoch": 1.0899315738025415, "grad_norm": 0.7476404563873276, "learning_rate": 3.9626566269331254e-05, "loss": 0.2637, "loss_nan_ranks": 0, "loss_rank_avg": 0.25160929560661316, "step": 1115, "valid_targets_mean": 2236.5, "valid_targets_min": 824 }, { "epoch": 1.0948191593352883, "grad_norm": 0.7462231828953746, "learning_rate": 3.9617130959545614e-05, "loss": 0.287, "loss_nan_ranks": 0, "loss_rank_avg": 0.28869083523750305, "step": 1120, "valid_targets_mean": 2205.5, "valid_targets_min": 548 }, { "epoch": 1.099706744868035, "grad_norm": 0.6350210512856392, "learning_rate": 3.960757908588757e-05, "loss": 0.2792, "loss_nan_ranks": 0, "loss_rank_avg": 0.29355528950691223, "step": 1125, "valid_targets_mean": 2905.8, "valid_targets_min": 990 }, { "epoch": 1.104594330400782, "grad_norm": 0.7768451815168522, "learning_rate": 3.95979107051138e-05, "loss": 0.298, "loss_nan_ranks": 0, "loss_rank_avg": 0.29628539085388184, "step": 1130, "valid_targets_mean": 1995.6, "valid_targets_min": 796 }, { "epoch": 1.1094819159335287, "grad_norm": 0.715701114754943, "learning_rate": 3.958812587467327e-05, "loss": 0.2946, "loss_nan_ranks": 0, "loss_rank_avg": 0.2757974863052368, "step": 1135, "valid_targets_mean": 2513.9, "valid_targets_min": 795 }, { "epoch": 1.1143695014662756, "grad_norm": 0.657177833956688, "learning_rate": 3.957822465270689e-05, "loss": 0.2853, "loss_nan_ranks": 0, "loss_rank_avg": 0.28396639227867126, "step": 1140, "valid_targets_mean": 2740.9, "valid_targets_min": 1028 }, { "epoch": 1.1192570869990224, "grad_norm": 0.7265698253166278, "learning_rate": 3.9568207098047144e-05, "loss": 0.2835, "loss_nan_ranks": 0, "loss_rank_avg": 0.3029360771179199, "step": 1145, "valid_targets_mean": 2664.1, "valid_targets_min": 1073 }, { "epoch": 1.1241446725317692, "grad_norm": 0.6515253109002876, "learning_rate": 3.9558073270217784e-05, "loss": 0.2764, "loss_nan_ranks": 0, "loss_rank_avg": 0.2731107771396637, "step": 1150, "valid_targets_mean": 2830.1, "valid_targets_min": 815 }, { "epoch": 1.129032258064516, "grad_norm": 0.7342300835153387, "learning_rate": 3.954782322943343e-05, "loss": 0.2647, "loss_nan_ranks": 0, "loss_rank_avg": 0.26124700903892517, "step": 1155, "valid_targets_mean": 2346.8, "valid_targets_min": 728 }, { "epoch": 1.1339198435972628, "grad_norm": 0.7264943185964359, "learning_rate": 3.953745703659924e-05, "loss": 0.2822, "loss_nan_ranks": 0, "loss_rank_avg": 0.29263490438461304, "step": 1160, "valid_targets_mean": 2200.6, "valid_targets_min": 912 }, { "epoch": 1.1388074291300097, "grad_norm": 0.7531165993253246, "learning_rate": 3.952697475331054e-05, "loss": 0.2727, "loss_nan_ranks": 0, "loss_rank_avg": 0.2604370415210724, "step": 1165, "valid_targets_mean": 1966.1, "valid_targets_min": 810 }, { "epoch": 1.1436950146627567, "grad_norm": 0.5807064795538424, "learning_rate": 3.951637644185245e-05, "loss": 0.2779, "loss_nan_ranks": 0, "loss_rank_avg": 0.2689421474933624, "step": 1170, "valid_targets_mean": 3077.1, "valid_targets_min": 663 }, { "epoch": 1.1485826001955035, "grad_norm": 0.7320623987196705, "learning_rate": 3.9505662165199546e-05, "loss": 0.2666, "loss_nan_ranks": 0, "loss_rank_avg": 0.2726061940193176, "step": 1175, "valid_targets_mean": 2399.1, "valid_targets_min": 953 }, { "epoch": 1.1534701857282503, "grad_norm": 0.718063434455999, "learning_rate": 3.949483198701544e-05, "loss": 0.2817, "loss_nan_ranks": 0, "loss_rank_avg": 0.2901926040649414, "step": 1180, "valid_targets_mean": 1989.6, "valid_targets_min": 467 }, { "epoch": 1.1583577712609971, "grad_norm": 0.7091718018989998, "learning_rate": 3.948388597165244e-05, "loss": 0.2802, "loss_nan_ranks": 0, "loss_rank_avg": 0.2814217805862427, "step": 1185, "valid_targets_mean": 2682.6, "valid_targets_min": 977 }, { "epoch": 1.163245356793744, "grad_norm": 0.7198188497547705, "learning_rate": 3.947282418415114e-05, "loss": 0.2678, "loss_nan_ranks": 0, "loss_rank_avg": 0.26243048906326294, "step": 1190, "valid_targets_mean": 2464.7, "valid_targets_min": 1207 }, { "epoch": 1.1681329423264908, "grad_norm": 0.8032209187501614, "learning_rate": 3.946164669024005e-05, "loss": 0.2762, "loss_nan_ranks": 0, "loss_rank_avg": 0.2906745374202728, "step": 1195, "valid_targets_mean": 2152.6, "valid_targets_min": 1274 }, { "epoch": 1.1730205278592376, "grad_norm": 0.69719975762219, "learning_rate": 3.945035355633519e-05, "loss": 0.2792, "loss_nan_ranks": 0, "loss_rank_avg": 0.29841500520706177, "step": 1200, "valid_targets_mean": 2345.9, "valid_targets_min": 886 }, { "epoch": 1.1779081133919844, "grad_norm": 0.6974558842300727, "learning_rate": 3.943894484953974e-05, "loss": 0.2781, "loss_nan_ranks": 0, "loss_rank_avg": 0.29451218247413635, "step": 1205, "valid_targets_mean": 2422.9, "valid_targets_min": 512 }, { "epoch": 1.1827956989247312, "grad_norm": 0.7729057032255819, "learning_rate": 3.9427420637643566e-05, "loss": 0.292, "loss_nan_ranks": 0, "loss_rank_avg": 0.30238640308380127, "step": 1210, "valid_targets_mean": 2235.3, "valid_targets_min": 1257 }, { "epoch": 1.187683284457478, "grad_norm": 0.7935199270678439, "learning_rate": 3.941578098912288e-05, "loss": 0.2917, "loss_nan_ranks": 0, "loss_rank_avg": 0.25925132632255554, "step": 1215, "valid_targets_mean": 1819.3, "valid_targets_min": 868 }, { "epoch": 1.1925708699902249, "grad_norm": 0.7190594576509517, "learning_rate": 3.940402597313982e-05, "loss": 0.2801, "loss_nan_ranks": 0, "loss_rank_avg": 0.30240678787231445, "step": 1220, "valid_targets_mean": 2756.8, "valid_targets_min": 513 }, { "epoch": 1.1974584555229717, "grad_norm": 0.6468704089059654, "learning_rate": 3.939215565954201e-05, "loss": 0.28, "loss_nan_ranks": 0, "loss_rank_avg": 0.27174267172813416, "step": 1225, "valid_targets_mean": 2537.5, "valid_targets_min": 842 }, { "epoch": 1.2023460410557185, "grad_norm": 0.6638979450727887, "learning_rate": 3.938017011886217e-05, "loss": 0.2752, "loss_nan_ranks": 0, "loss_rank_avg": 0.25439706444740295, "step": 1230, "valid_targets_mean": 2504.9, "valid_targets_min": 857 }, { "epoch": 1.2072336265884653, "grad_norm": 0.7494764475924144, "learning_rate": 3.936806942231772e-05, "loss": 0.283, "loss_nan_ranks": 0, "loss_rank_avg": 0.2995947003364563, "step": 1235, "valid_targets_mean": 2547.0, "valid_targets_min": 667 }, { "epoch": 1.2121212121212122, "grad_norm": 0.7304687661971925, "learning_rate": 3.9355853641810286e-05, "loss": 0.2838, "loss_nan_ranks": 0, "loss_rank_avg": 0.266486793756485, "step": 1240, "valid_targets_mean": 2214.6, "valid_targets_min": 309 }, { "epoch": 1.217008797653959, "grad_norm": 0.7022740270462892, "learning_rate": 3.9343522849925355e-05, "loss": 0.2734, "loss_nan_ranks": 0, "loss_rank_avg": 0.25830769538879395, "step": 1245, "valid_targets_mean": 2205.6, "valid_targets_min": 728 }, { "epoch": 1.2218963831867058, "grad_norm": 0.6749560565367534, "learning_rate": 3.933107711993177e-05, "loss": 0.2915, "loss_nan_ranks": 0, "loss_rank_avg": 0.3063586354255676, "step": 1250, "valid_targets_mean": 2899.1, "valid_targets_min": 1467 }, { "epoch": 1.2267839687194526, "grad_norm": 0.640174555103181, "learning_rate": 3.931851652578137e-05, "loss": 0.2974, "loss_nan_ranks": 0, "loss_rank_avg": 0.26264217495918274, "step": 1255, "valid_targets_mean": 2715.5, "valid_targets_min": 765 }, { "epoch": 1.2316715542521994, "grad_norm": 0.7175756349653029, "learning_rate": 3.930584114210847e-05, "loss": 0.2743, "loss_nan_ranks": 0, "loss_rank_avg": 0.2843489348888397, "step": 1260, "valid_targets_mean": 2394.0, "valid_targets_min": 1130 }, { "epoch": 1.2365591397849462, "grad_norm": 0.6471066400554928, "learning_rate": 3.929305104422949e-05, "loss": 0.2619, "loss_nan_ranks": 0, "loss_rank_avg": 0.25573495030403137, "step": 1265, "valid_targets_mean": 2673.3, "valid_targets_min": 859 }, { "epoch": 1.241446725317693, "grad_norm": 0.7057472774221171, "learning_rate": 3.928014630814245e-05, "loss": 0.2963, "loss_nan_ranks": 0, "loss_rank_avg": 0.29683718085289, "step": 1270, "valid_targets_mean": 2584.6, "valid_targets_min": 704 }, { "epoch": 1.2463343108504399, "grad_norm": 0.7027021456995992, "learning_rate": 3.926712701052656e-05, "loss": 0.2778, "loss_nan_ranks": 0, "loss_rank_avg": 0.23105719685554504, "step": 1275, "valid_targets_mean": 2057.8, "valid_targets_min": 548 }, { "epoch": 1.2512218963831867, "grad_norm": 0.8306679586454391, "learning_rate": 3.925399322874175e-05, "loss": 0.2842, "loss_nan_ranks": 0, "loss_rank_avg": 0.2782430350780487, "step": 1280, "valid_targets_mean": 1920.4, "valid_targets_min": 782 }, { "epoch": 1.2561094819159335, "grad_norm": 0.6271862299342814, "learning_rate": 3.9240745040828196e-05, "loss": 0.265, "loss_nan_ranks": 0, "loss_rank_avg": 0.2829798460006714, "step": 1285, "valid_targets_mean": 3158.1, "valid_targets_min": 807 }, { "epoch": 1.2609970674486803, "grad_norm": 0.7221564579455654, "learning_rate": 3.922738252550587e-05, "loss": 0.2973, "loss_nan_ranks": 0, "loss_rank_avg": 0.2566811740398407, "step": 1290, "valid_targets_mean": 2186.9, "valid_targets_min": 659 }, { "epoch": 1.2658846529814272, "grad_norm": 0.7065825530165445, "learning_rate": 3.921390576217408e-05, "loss": 0.2722, "loss_nan_ranks": 0, "loss_rank_avg": 0.27165934443473816, "step": 1295, "valid_targets_mean": 2100.2, "valid_targets_min": 698 }, { "epoch": 1.270772238514174, "grad_norm": 0.9761318767014419, "learning_rate": 3.9200314830910986e-05, "loss": 0.2806, "loss_nan_ranks": 0, "loss_rank_avg": 0.2744409441947937, "step": 1300, "valid_targets_mean": 1900.2, "valid_targets_min": 668 }, { "epoch": 1.2756598240469208, "grad_norm": 0.8388053078423351, "learning_rate": 3.918660981247312e-05, "loss": 0.2735, "loss_nan_ranks": 0, "loss_rank_avg": 0.2818601727485657, "step": 1305, "valid_targets_mean": 1785.4, "valid_targets_min": 769 }, { "epoch": 1.2805474095796676, "grad_norm": 0.613252199578922, "learning_rate": 3.9172790788294924e-05, "loss": 0.2964, "loss_nan_ranks": 0, "loss_rank_avg": 0.25405043363571167, "step": 1310, "valid_targets_mean": 2779.4, "valid_targets_min": 875 }, { "epoch": 1.2854349951124144, "grad_norm": 0.702566015145273, "learning_rate": 3.9158857840488253e-05, "loss": 0.2858, "loss_nan_ranks": 0, "loss_rank_avg": 0.2808951437473297, "step": 1315, "valid_targets_mean": 2675.1, "valid_targets_min": 770 }, { "epoch": 1.2903225806451613, "grad_norm": 0.7219389062248595, "learning_rate": 3.914481105184188e-05, "loss": 0.2969, "loss_nan_ranks": 0, "loss_rank_avg": 0.27677303552627563, "step": 1320, "valid_targets_mean": 2169.5, "valid_targets_min": 789 }, { "epoch": 1.295210166177908, "grad_norm": 0.6230877367684657, "learning_rate": 3.913065050582103e-05, "loss": 0.2952, "loss_nan_ranks": 0, "loss_rank_avg": 0.2999587059020996, "step": 1325, "valid_targets_mean": 3419.2, "valid_targets_min": 722 }, { "epoch": 1.300097751710655, "grad_norm": 0.6833998876959554, "learning_rate": 3.911637628656685e-05, "loss": 0.2757, "loss_nan_ranks": 0, "loss_rank_avg": 0.252625048160553, "step": 1330, "valid_targets_mean": 2527.4, "valid_targets_min": 849 }, { "epoch": 1.3049853372434017, "grad_norm": 0.7469165884381328, "learning_rate": 3.910198847889595e-05, "loss": 0.2834, "loss_nan_ranks": 0, "loss_rank_avg": 0.2838708162307739, "step": 1335, "valid_targets_mean": 2485.5, "valid_targets_min": 622 }, { "epoch": 1.3098729227761485, "grad_norm": 0.6617163563012934, "learning_rate": 3.908748716829984e-05, "loss": 0.277, "loss_nan_ranks": 0, "loss_rank_avg": 0.29781484603881836, "step": 1340, "valid_targets_mean": 3058.6, "valid_targets_min": 961 }, { "epoch": 1.3147605083088953, "grad_norm": 0.6917934222962383, "learning_rate": 3.90728724409445e-05, "loss": 0.2703, "loss_nan_ranks": 0, "loss_rank_avg": 0.23285894095897675, "step": 1345, "valid_targets_mean": 2165.1, "valid_targets_min": 689 }, { "epoch": 1.3196480938416422, "grad_norm": 0.8112229286729639, "learning_rate": 3.90581443836698e-05, "loss": 0.285, "loss_nan_ranks": 0, "loss_rank_avg": 0.2841215133666992, "step": 1350, "valid_targets_mean": 2388.8, "valid_targets_min": 972 }, { "epoch": 1.324535679374389, "grad_norm": 0.7050055286781818, "learning_rate": 3.9043303083989e-05, "loss": 0.2708, "loss_nan_ranks": 0, "loss_rank_avg": 0.2793377935886383, "step": 1355, "valid_targets_mean": 2531.8, "valid_targets_min": 839 }, { "epoch": 1.3294232649071358, "grad_norm": 0.7692436746915501, "learning_rate": 3.9028348630088285e-05, "loss": 0.2801, "loss_nan_ranks": 0, "loss_rank_avg": 0.29042643308639526, "step": 1360, "valid_targets_mean": 2408.2, "valid_targets_min": 972 }, { "epoch": 1.3343108504398826, "grad_norm": 0.7453876083199784, "learning_rate": 3.9013281110826146e-05, "loss": 0.2899, "loss_nan_ranks": 0, "loss_rank_avg": 0.25248265266418457, "step": 1365, "valid_targets_mean": 2040.0, "valid_targets_min": 996 }, { "epoch": 1.3391984359726294, "grad_norm": 0.6300162995824621, "learning_rate": 3.899810061573293e-05, "loss": 0.2904, "loss_nan_ranks": 0, "loss_rank_avg": 0.27708175778388977, "step": 1370, "valid_targets_mean": 2868.4, "valid_targets_min": 1109 }, { "epoch": 1.3440860215053765, "grad_norm": 0.6688370034426764, "learning_rate": 3.898280723501027e-05, "loss": 0.2776, "loss_nan_ranks": 0, "loss_rank_avg": 0.2765743136405945, "step": 1375, "valid_targets_mean": 2953.6, "valid_targets_min": 960 }, { "epoch": 1.3489736070381233, "grad_norm": 0.6214024065518173, "learning_rate": 3.896740105953056e-05, "loss": 0.2946, "loss_nan_ranks": 0, "loss_rank_avg": 0.2931886911392212, "step": 1380, "valid_targets_mean": 3082.7, "valid_targets_min": 1298 }, { "epoch": 1.3538611925708701, "grad_norm": 0.6750814309638632, "learning_rate": 3.895188218083641e-05, "loss": 0.2783, "loss_nan_ranks": 0, "loss_rank_avg": 0.23927871882915497, "step": 1385, "valid_targets_mean": 2085.7, "valid_targets_min": 605 }, { "epoch": 1.358748778103617, "grad_norm": 1.0887637501386116, "learning_rate": 3.893625069114013e-05, "loss": 0.2768, "loss_nan_ranks": 0, "loss_rank_avg": 0.28028884530067444, "step": 1390, "valid_targets_mean": 2176.3, "valid_targets_min": 999 }, { "epoch": 1.3636363636363638, "grad_norm": 0.773730842008043, "learning_rate": 3.892050668332312e-05, "loss": 0.2833, "loss_nan_ranks": 0, "loss_rank_avg": 0.27753153443336487, "step": 1395, "valid_targets_mean": 2301.8, "valid_targets_min": 816 }, { "epoch": 1.3685239491691106, "grad_norm": 0.7189179648090815, "learning_rate": 3.890465025093538e-05, "loss": 0.2808, "loss_nan_ranks": 0, "loss_rank_avg": 0.30436086654663086, "step": 1400, "valid_targets_mean": 2609.4, "valid_targets_min": 869 }, { "epoch": 1.3734115347018574, "grad_norm": 0.6426850788526689, "learning_rate": 3.8888681488194934e-05, "loss": 0.2796, "loss_nan_ranks": 0, "loss_rank_avg": 0.3102635145187378, "step": 1405, "valid_targets_mean": 3093.6, "valid_targets_min": 1107 }, { "epoch": 1.3782991202346042, "grad_norm": 0.734389179384258, "learning_rate": 3.887260048998726e-05, "loss": 0.28, "loss_nan_ranks": 0, "loss_rank_avg": 0.2662855386734009, "step": 1410, "valid_targets_mean": 2011.6, "valid_targets_min": 684 }, { "epoch": 1.383186705767351, "grad_norm": 0.6225396878904635, "learning_rate": 3.885640735186472e-05, "loss": 0.2618, "loss_nan_ranks": 0, "loss_rank_avg": 0.2845187783241272, "step": 1415, "valid_targets_mean": 3417.9, "valid_targets_min": 1093 }, { "epoch": 1.3880742913000979, "grad_norm": 0.789834712593994, "learning_rate": 3.884010217004601e-05, "loss": 0.2823, "loss_nan_ranks": 0, "loss_rank_avg": 0.29228654503822327, "step": 1420, "valid_targets_mean": 2669.8, "valid_targets_min": 1027 }, { "epoch": 1.3929618768328447, "grad_norm": 0.7464915480075731, "learning_rate": 3.882368504141562e-05, "loss": 0.2937, "loss_nan_ranks": 0, "loss_rank_avg": 0.28257280588150024, "step": 1425, "valid_targets_mean": 2574.6, "valid_targets_min": 1474 }, { "epoch": 1.3978494623655915, "grad_norm": 0.7059861573051313, "learning_rate": 3.8807156063523164e-05, "loss": 0.2657, "loss_nan_ranks": 0, "loss_rank_avg": 0.2998770475387573, "step": 1430, "valid_targets_mean": 2475.3, "valid_targets_min": 570 }, { "epoch": 1.4027370478983383, "grad_norm": 0.6645964659054957, "learning_rate": 3.879051533458289e-05, "loss": 0.2653, "loss_nan_ranks": 0, "loss_rank_avg": 0.2769964933395386, "step": 1435, "valid_targets_mean": 2476.9, "valid_targets_min": 657 }, { "epoch": 1.4076246334310851, "grad_norm": 0.7558136295073548, "learning_rate": 3.8773762953473066e-05, "loss": 0.2831, "loss_nan_ranks": 0, "loss_rank_avg": 0.2779275178909302, "step": 1440, "valid_targets_mean": 1848.9, "valid_targets_min": 762 }, { "epoch": 1.412512218963832, "grad_norm": 0.6943029966676353, "learning_rate": 3.8756899019735385e-05, "loss": 0.2853, "loss_nan_ranks": 0, "loss_rank_avg": 0.2840909957885742, "step": 1445, "valid_targets_mean": 2471.9, "valid_targets_min": 772 }, { "epoch": 1.4173998044965788, "grad_norm": 0.6342596835576019, "learning_rate": 3.873992363357437e-05, "loss": 0.2618, "loss_nan_ranks": 0, "loss_rank_avg": 0.2653612196445465, "step": 1450, "valid_targets_mean": 2900.2, "valid_targets_min": 1140 }, { "epoch": 1.4222873900293256, "grad_norm": 0.579209777162739, "learning_rate": 3.8722836895856814e-05, "loss": 0.2614, "loss_nan_ranks": 0, "loss_rank_avg": 0.24776488542556763, "step": 1455, "valid_targets_mean": 2874.0, "valid_targets_min": 632 }, { "epoch": 1.4271749755620724, "grad_norm": 0.6564233693786774, "learning_rate": 3.870563890811111e-05, "loss": 0.2847, "loss_nan_ranks": 0, "loss_rank_avg": 0.3028268814086914, "step": 1460, "valid_targets_mean": 3045.8, "valid_targets_min": 891 }, { "epoch": 1.4320625610948192, "grad_norm": 0.6629636773046359, "learning_rate": 3.868832977252675e-05, "loss": 0.2769, "loss_nan_ranks": 0, "loss_rank_avg": 0.27365946769714355, "step": 1465, "valid_targets_mean": 2735.8, "valid_targets_min": 799 }, { "epoch": 1.436950146627566, "grad_norm": 0.6785573010408985, "learning_rate": 3.86709095919536e-05, "loss": 0.275, "loss_nan_ranks": 0, "loss_rank_avg": 0.2917429804801941, "step": 1470, "valid_targets_mean": 2449.4, "valid_targets_min": 756 }, { "epoch": 1.4418377321603129, "grad_norm": 0.6465288698245589, "learning_rate": 3.86533784699014e-05, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.25123557448387146, "step": 1475, "valid_targets_mean": 2389.1, "valid_targets_min": 696 }, { "epoch": 1.4467253176930597, "grad_norm": 0.7015331893695984, "learning_rate": 3.8635736510539065e-05, "loss": 0.2744, "loss_nan_ranks": 0, "loss_rank_avg": 0.2667387127876282, "step": 1480, "valid_targets_mean": 2461.5, "valid_targets_min": 717 }, { "epoch": 1.4516129032258065, "grad_norm": 0.7629144665484076, "learning_rate": 3.861798381869412e-05, "loss": 0.2821, "loss_nan_ranks": 0, "loss_rank_avg": 0.29424476623535156, "step": 1485, "valid_targets_mean": 2159.1, "valid_targets_min": 763 }, { "epoch": 1.4565004887585533, "grad_norm": 0.752596217358227, "learning_rate": 3.860012049985204e-05, "loss": 0.2733, "loss_nan_ranks": 0, "loss_rank_avg": 0.25024765729904175, "step": 1490, "valid_targets_mean": 1827.2, "valid_targets_min": 888 }, { "epoch": 1.4613880742913001, "grad_norm": 0.700994546408206, "learning_rate": 3.858214666015565e-05, "loss": 0.2822, "loss_nan_ranks": 0, "loss_rank_avg": 0.29054421186447144, "step": 1495, "valid_targets_mean": 2365.5, "valid_targets_min": 695 }, { "epoch": 1.466275659824047, "grad_norm": 0.7116021660360209, "learning_rate": 3.856406240640448e-05, "loss": 0.2755, "loss_nan_ranks": 0, "loss_rank_avg": 0.2625944912433624, "step": 1500, "valid_targets_mean": 2130.0, "valid_targets_min": 684 }, { "epoch": 1.4711632453567938, "grad_norm": 0.7684258462239429, "learning_rate": 3.8545867846054126e-05, "loss": 0.2626, "loss_nan_ranks": 0, "loss_rank_avg": 0.2951001524925232, "step": 1505, "valid_targets_mean": 2052.4, "valid_targets_min": 1064 }, { "epoch": 1.4760508308895406, "grad_norm": 0.6507083544953332, "learning_rate": 3.8527563087215634e-05, "loss": 0.2742, "loss_nan_ranks": 0, "loss_rank_avg": 0.2922488749027252, "step": 1510, "valid_targets_mean": 2769.5, "valid_targets_min": 843 }, { "epoch": 1.4809384164222874, "grad_norm": 0.7751727870506968, "learning_rate": 3.8509148238654824e-05, "loss": 0.2716, "loss_nan_ranks": 0, "loss_rank_avg": 0.24178072810173035, "step": 1515, "valid_targets_mean": 1849.9, "valid_targets_min": 780 }, { "epoch": 1.4858260019550342, "grad_norm": 0.5854852127584044, "learning_rate": 3.84906234097917e-05, "loss": 0.2619, "loss_nan_ranks": 0, "loss_rank_avg": 0.27021411061286926, "step": 1520, "valid_targets_mean": 3099.3, "valid_targets_min": 1029 }, { "epoch": 1.490713587487781, "grad_norm": 0.6358169347672091, "learning_rate": 3.8471988710699715e-05, "loss": 0.2513, "loss_nan_ranks": 0, "loss_rank_avg": 0.26537126302719116, "step": 1525, "valid_targets_mean": 2957.4, "valid_targets_min": 802 }, { "epoch": 1.4956011730205279, "grad_norm": 0.6204632468552115, "learning_rate": 3.8453244252105194e-05, "loss": 0.2797, "loss_nan_ranks": 0, "loss_rank_avg": 0.2769279181957245, "step": 1530, "valid_targets_mean": 3130.9, "valid_targets_min": 737 }, { "epoch": 1.5004887585532747, "grad_norm": 0.6411624274507086, "learning_rate": 3.843439014538664e-05, "loss": 0.2647, "loss_nan_ranks": 0, "loss_rank_avg": 0.26065292954444885, "step": 1535, "valid_targets_mean": 2861.7, "valid_targets_min": 1023 }, { "epoch": 1.5053763440860215, "grad_norm": 0.7050285259422795, "learning_rate": 3.841542650257408e-05, "loss": 0.2647, "loss_nan_ranks": 0, "loss_rank_avg": 0.24625875055789948, "step": 1540, "valid_targets_mean": 2171.6, "valid_targets_min": 1054 }, { "epoch": 1.5102639296187683, "grad_norm": 0.7521045411153422, "learning_rate": 3.83963534363484e-05, "loss": 0.2824, "loss_nan_ranks": 0, "loss_rank_avg": 0.3168919086456299, "step": 1545, "valid_targets_mean": 2370.8, "valid_targets_min": 842 }, { "epoch": 1.5151515151515151, "grad_norm": 0.7217702499392185, "learning_rate": 3.8377171060040666e-05, "loss": 0.2673, "loss_nan_ranks": 0, "loss_rank_avg": 0.27114635705947876, "step": 1550, "valid_targets_mean": 2131.9, "valid_targets_min": 783 }, { "epoch": 1.520039100684262, "grad_norm": 0.7137936454079413, "learning_rate": 3.835787948763147e-05, "loss": 0.2767, "loss_nan_ranks": 0, "loss_rank_avg": 0.25275540351867676, "step": 1555, "valid_targets_mean": 2113.8, "valid_targets_min": 748 }, { "epoch": 1.5249266862170088, "grad_norm": 0.9545717948909013, "learning_rate": 3.833847883375022e-05, "loss": 0.2934, "loss_nan_ranks": 0, "loss_rank_avg": 0.2564704716205597, "step": 1560, "valid_targets_mean": 2187.5, "valid_targets_min": 739 }, { "epoch": 1.5298142717497556, "grad_norm": 0.7470839745811981, "learning_rate": 3.831896921367451e-05, "loss": 0.2821, "loss_nan_ranks": 0, "loss_rank_avg": 0.2791537940502167, "step": 1565, "valid_targets_mean": 1975.1, "valid_targets_min": 686 }, { "epoch": 1.5347018572825024, "grad_norm": 0.7647266073732814, "learning_rate": 3.829935074332938e-05, "loss": 0.2718, "loss_nan_ranks": 0, "loss_rank_avg": 0.24994492530822754, "step": 1570, "valid_targets_mean": 2233.8, "valid_targets_min": 837 }, { "epoch": 1.5395894428152492, "grad_norm": 0.7045036581823351, "learning_rate": 3.827962353928667e-05, "loss": 0.2649, "loss_nan_ranks": 0, "loss_rank_avg": 0.26855552196502686, "step": 1575, "valid_targets_mean": 2261.9, "valid_targets_min": 763 }, { "epoch": 1.544477028347996, "grad_norm": 0.7143743531724757, "learning_rate": 3.825978771876428e-05, "loss": 0.2873, "loss_nan_ranks": 0, "loss_rank_avg": 0.3018741011619568, "step": 1580, "valid_targets_mean": 2336.8, "valid_targets_min": 663 }, { "epoch": 1.5493646138807429, "grad_norm": 0.6475010659041159, "learning_rate": 3.823984339962554e-05, "loss": 0.276, "loss_nan_ranks": 0, "loss_rank_avg": 0.29907166957855225, "step": 1585, "valid_targets_mean": 2830.2, "valid_targets_min": 732 }, { "epoch": 1.5542521994134897, "grad_norm": 0.6898759516125273, "learning_rate": 3.821979070037846e-05, "loss": 0.2791, "loss_nan_ranks": 0, "loss_rank_avg": 0.2999107241630554, "step": 1590, "valid_targets_mean": 2604.1, "valid_targets_min": 631 }, { "epoch": 1.5591397849462365, "grad_norm": 0.6572278395987295, "learning_rate": 3.8199629740175017e-05, "loss": 0.2681, "loss_nan_ranks": 0, "loss_rank_avg": 0.2730094790458679, "step": 1595, "valid_targets_mean": 2485.9, "valid_targets_min": 804 }, { "epoch": 1.5640273704789833, "grad_norm": 0.7008441805523876, "learning_rate": 3.8179360638810503e-05, "loss": 0.2747, "loss_nan_ranks": 0, "loss_rank_avg": 0.2944326102733612, "step": 1600, "valid_targets_mean": 2188.3, "valid_targets_min": 669 }, { "epoch": 1.5689149560117301, "grad_norm": 0.5571584829883734, "learning_rate": 3.815898351672275e-05, "loss": 0.2667, "loss_nan_ranks": 0, "loss_rank_avg": 0.22917650640010834, "step": 1605, "valid_targets_mean": 3037.3, "valid_targets_min": 765 }, { "epoch": 1.573802541544477, "grad_norm": 0.7410724781542547, "learning_rate": 3.813849849499146e-05, "loss": 0.2616, "loss_nan_ranks": 0, "loss_rank_avg": 0.24475133419036865, "step": 1610, "valid_targets_mean": 1836.8, "valid_targets_min": 741 }, { "epoch": 1.5786901270772238, "grad_norm": 0.7170995982719762, "learning_rate": 3.811790569533746e-05, "loss": 0.2656, "loss_nan_ranks": 0, "loss_rank_avg": 0.2909032106399536, "step": 1615, "valid_targets_mean": 2271.4, "valid_targets_min": 689 }, { "epoch": 1.5835777126099706, "grad_norm": 0.7023440780016095, "learning_rate": 3.8097205240121994e-05, "loss": 0.2932, "loss_nan_ranks": 0, "loss_rank_avg": 0.3244866132736206, "step": 1620, "valid_targets_mean": 2630.7, "valid_targets_min": 752 }, { "epoch": 1.5884652981427174, "grad_norm": 0.7145272097523425, "learning_rate": 3.807639725234598e-05, "loss": 0.2802, "loss_nan_ranks": 0, "loss_rank_avg": 0.28274455666542053, "step": 1625, "valid_targets_mean": 2337.7, "valid_targets_min": 1045 }, { "epoch": 1.5933528836754642, "grad_norm": 0.6483060882499405, "learning_rate": 3.8055481855649295e-05, "loss": 0.2719, "loss_nan_ranks": 0, "loss_rank_avg": 0.2898852825164795, "step": 1630, "valid_targets_mean": 2868.5, "valid_targets_min": 1718 }, { "epoch": 1.598240469208211, "grad_norm": 0.6154123007304795, "learning_rate": 3.8034459174310034e-05, "loss": 0.2698, "loss_nan_ranks": 0, "loss_rank_avg": 0.24204128980636597, "step": 1635, "valid_targets_mean": 2880.8, "valid_targets_min": 791 }, { "epoch": 1.6031280547409579, "grad_norm": 0.7242965707991273, "learning_rate": 3.8013329333243765e-05, "loss": 0.2746, "loss_nan_ranks": 0, "loss_rank_avg": 0.3221800923347473, "step": 1640, "valid_targets_mean": 2574.4, "valid_targets_min": 836 }, { "epoch": 1.6080156402737047, "grad_norm": 0.8256849875812563, "learning_rate": 3.7992092458002813e-05, "loss": 0.2669, "loss_nan_ranks": 0, "loss_rank_avg": 0.2468244880437851, "step": 1645, "valid_targets_mean": 2232.7, "valid_targets_min": 659 }, { "epoch": 1.6129032258064515, "grad_norm": 0.8957983328042407, "learning_rate": 3.797074867477545e-05, "loss": 0.2941, "loss_nan_ranks": 0, "loss_rank_avg": 0.2847079038619995, "step": 1650, "valid_targets_mean": 1988.9, "valid_targets_min": 1107 }, { "epoch": 1.6177908113391983, "grad_norm": 0.7320454198900345, "learning_rate": 3.794929811038525e-05, "loss": 0.2759, "loss_nan_ranks": 0, "loss_rank_avg": 0.25967937707901, "step": 1655, "valid_targets_mean": 2044.0, "valid_targets_min": 732 }, { "epoch": 1.6226783968719452, "grad_norm": 0.7944386390316857, "learning_rate": 3.7927740892290225e-05, "loss": 0.3063, "loss_nan_ranks": 0, "loss_rank_avg": 0.29300451278686523, "step": 1660, "valid_targets_mean": 1941.6, "valid_targets_min": 584 }, { "epoch": 1.627565982404692, "grad_norm": 0.7033843489197059, "learning_rate": 3.790607714858213e-05, "loss": 0.2718, "loss_nan_ranks": 0, "loss_rank_avg": 0.27778416872024536, "step": 1665, "valid_targets_mean": 2372.6, "valid_targets_min": 625 }, { "epoch": 1.6324535679374388, "grad_norm": 0.713583282306689, "learning_rate": 3.78843070079857e-05, "loss": 0.2706, "loss_nan_ranks": 0, "loss_rank_avg": 0.2961004972457886, "step": 1670, "valid_targets_mean": 2199.5, "valid_targets_min": 867 }, { "epoch": 1.6373411534701856, "grad_norm": 0.6811625348127058, "learning_rate": 3.786243059985787e-05, "loss": 0.2844, "loss_nan_ranks": 0, "loss_rank_avg": 0.24486398696899414, "step": 1675, "valid_targets_mean": 2072.9, "valid_targets_min": 739 }, { "epoch": 1.6422287390029324, "grad_norm": 0.6214013174128027, "learning_rate": 3.7840448054187004e-05, "loss": 0.2698, "loss_nan_ranks": 0, "loss_rank_avg": 0.2856760323047638, "step": 1680, "valid_targets_mean": 2886.9, "valid_targets_min": 868 }, { "epoch": 1.6471163245356792, "grad_norm": 0.6763894621818294, "learning_rate": 3.781835950159214e-05, "loss": 0.2845, "loss_nan_ranks": 0, "loss_rank_avg": 0.2664475739002228, "step": 1685, "valid_targets_mean": 2352.6, "valid_targets_min": 647 }, { "epoch": 1.652003910068426, "grad_norm": 0.7476808183243178, "learning_rate": 3.7796165073322194e-05, "loss": 0.275, "loss_nan_ranks": 0, "loss_rank_avg": 0.24394232034683228, "step": 1690, "valid_targets_mean": 1998.0, "valid_targets_min": 857 }, { "epoch": 1.6568914956011729, "grad_norm": 0.6654065406280266, "learning_rate": 3.777386490125518e-05, "loss": 0.2763, "loss_nan_ranks": 0, "loss_rank_avg": 0.2673056721687317, "step": 1695, "valid_targets_mean": 2774.7, "valid_targets_min": 941 }, { "epoch": 1.6617790811339197, "grad_norm": 1.0447139479563154, "learning_rate": 3.7751459117897466e-05, "loss": 0.2648, "loss_nan_ranks": 0, "loss_rank_avg": 0.29265016317367554, "step": 1700, "valid_targets_mean": 2134.6, "valid_targets_min": 856 }, { "epoch": 1.6666666666666665, "grad_norm": 0.6756696155203493, "learning_rate": 3.772894785638292e-05, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.29080730676651, "step": 1705, "valid_targets_mean": 2770.5, "valid_targets_min": 1168 }, { "epoch": 1.6715542521994133, "grad_norm": 0.6063804591260533, "learning_rate": 3.770633125047219e-05, "loss": 0.2756, "loss_nan_ranks": 0, "loss_rank_avg": 0.29159295558929443, "step": 1710, "valid_targets_mean": 3060.3, "valid_targets_min": 1237 }, { "epoch": 1.6764418377321602, "grad_norm": 0.7088620832664758, "learning_rate": 3.768360943455185e-05, "loss": 0.2524, "loss_nan_ranks": 0, "loss_rank_avg": 0.26422443985939026, "step": 1715, "valid_targets_mean": 2225.6, "valid_targets_min": 727 }, { "epoch": 1.681329423264907, "grad_norm": 0.8121289862781522, "learning_rate": 3.7660782543633634e-05, "loss": 0.2691, "loss_nan_ranks": 0, "loss_rank_avg": 0.271615207195282, "step": 1720, "valid_targets_mean": 2280.4, "valid_targets_min": 639 }, { "epoch": 1.6862170087976538, "grad_norm": 0.6721466708752135, "learning_rate": 3.763785071335362e-05, "loss": 0.2759, "loss_nan_ranks": 0, "loss_rank_avg": 0.2757419943809509, "step": 1725, "valid_targets_mean": 2551.2, "valid_targets_min": 1072 }, { "epoch": 1.6911045943304008, "grad_norm": 0.7511340865178172, "learning_rate": 3.761481407997144e-05, "loss": 0.2787, "loss_nan_ranks": 0, "loss_rank_avg": 0.3051798939704895, "step": 1730, "valid_targets_mean": 2232.9, "valid_targets_min": 884 }, { "epoch": 1.6959921798631477, "grad_norm": 0.7709735641548016, "learning_rate": 3.759167278036945e-05, "loss": 0.2687, "loss_nan_ranks": 0, "loss_rank_avg": 0.28466472029685974, "step": 1735, "valid_targets_mean": 2116.8, "valid_targets_min": 746 }, { "epoch": 1.7008797653958945, "grad_norm": 0.6541200445160277, "learning_rate": 3.7568426952051936e-05, "loss": 0.2688, "loss_nan_ranks": 0, "loss_rank_avg": 0.24498885869979858, "step": 1740, "valid_targets_mean": 2278.2, "valid_targets_min": 615 }, { "epoch": 1.7057673509286413, "grad_norm": 0.8540951314910903, "learning_rate": 3.754507673314429e-05, "loss": 0.2738, "loss_nan_ranks": 0, "loss_rank_avg": 0.2802680730819702, "step": 1745, "valid_targets_mean": 2895.8, "valid_targets_min": 834 }, { "epoch": 1.710654936461388, "grad_norm": 0.6993627250812203, "learning_rate": 3.752162226239216e-05, "loss": 0.2835, "loss_nan_ranks": 0, "loss_rank_avg": 0.2634274363517761, "step": 1750, "valid_targets_mean": 2296.5, "valid_targets_min": 641 }, { "epoch": 1.715542521994135, "grad_norm": 0.7122786881252015, "learning_rate": 3.749806367916069e-05, "loss": 0.2908, "loss_nan_ranks": 0, "loss_rank_avg": 0.29387813806533813, "step": 1755, "valid_targets_mean": 2420.0, "valid_targets_min": 719 }, { "epoch": 1.7204301075268817, "grad_norm": 0.6950186797619158, "learning_rate": 3.747440112343363e-05, "loss": 0.272, "loss_nan_ranks": 0, "loss_rank_avg": 0.284950315952301, "step": 1760, "valid_targets_mean": 2666.9, "valid_targets_min": 694 }, { "epoch": 1.7253176930596286, "grad_norm": 0.6540823928470759, "learning_rate": 3.745063473581254e-05, "loss": 0.2801, "loss_nan_ranks": 0, "loss_rank_avg": 0.26305273175239563, "step": 1765, "valid_targets_mean": 2482.1, "valid_targets_min": 522 }, { "epoch": 1.7302052785923754, "grad_norm": 0.6533343607539351, "learning_rate": 3.7426764657515926e-05, "loss": 0.288, "loss_nan_ranks": 0, "loss_rank_avg": 0.32014939188957214, "step": 1770, "valid_targets_mean": 2911.1, "valid_targets_min": 1390 }, { "epoch": 1.7350928641251222, "grad_norm": 0.681180973864994, "learning_rate": 3.7402791030378446e-05, "loss": 0.2609, "loss_nan_ranks": 0, "loss_rank_avg": 0.26099470257759094, "step": 1775, "valid_targets_mean": 2321.4, "valid_targets_min": 514 }, { "epoch": 1.739980449657869, "grad_norm": 0.8019831916932382, "learning_rate": 3.737871399685001e-05, "loss": 0.2651, "loss_nan_ranks": 0, "loss_rank_avg": 0.27410048246383667, "step": 1780, "valid_targets_mean": 1795.9, "valid_targets_min": 760 }, { "epoch": 1.7448680351906158, "grad_norm": 0.6599982007782187, "learning_rate": 3.735453369999499e-05, "loss": 0.2677, "loss_nan_ranks": 0, "loss_rank_avg": 0.2654041647911072, "step": 1785, "valid_targets_mean": 2488.9, "valid_targets_min": 780 }, { "epoch": 1.7497556207233627, "grad_norm": 0.6985853935310431, "learning_rate": 3.7330250283491316e-05, "loss": 0.2678, "loss_nan_ranks": 0, "loss_rank_avg": 0.2721864581108093, "step": 1790, "valid_targets_mean": 2234.3, "valid_targets_min": 892 }, { "epoch": 1.7546432062561095, "grad_norm": 0.7815807491097794, "learning_rate": 3.730586389162968e-05, "loss": 0.2723, "loss_nan_ranks": 0, "loss_rank_avg": 0.2551916241645813, "step": 1795, "valid_targets_mean": 2119.4, "valid_targets_min": 741 }, { "epoch": 1.7595307917888563, "grad_norm": 0.6983319157355613, "learning_rate": 3.728137466931262e-05, "loss": 0.2646, "loss_nan_ranks": 0, "loss_rank_avg": 0.26075512170791626, "step": 1800, "valid_targets_mean": 1934.5, "valid_targets_min": 790 }, { "epoch": 1.7644183773216031, "grad_norm": 0.6167013764000374, "learning_rate": 3.72567827620537e-05, "loss": 0.2814, "loss_nan_ranks": 0, "loss_rank_avg": 0.2760656476020813, "step": 1805, "valid_targets_mean": 3027.8, "valid_targets_min": 1151 }, { "epoch": 1.76930596285435, "grad_norm": 0.6509730292742568, "learning_rate": 3.723208831597663e-05, "loss": 0.2662, "loss_nan_ranks": 0, "loss_rank_avg": 0.275715172290802, "step": 1810, "valid_targets_mean": 2570.6, "valid_targets_min": 881 }, { "epoch": 1.7741935483870968, "grad_norm": 0.6845280114796127, "learning_rate": 3.720729147781438e-05, "loss": 0.2678, "loss_nan_ranks": 0, "loss_rank_avg": 0.28714922070503235, "step": 1815, "valid_targets_mean": 2509.2, "valid_targets_min": 842 }, { "epoch": 1.7790811339198436, "grad_norm": 0.692569209787489, "learning_rate": 3.718239239490838e-05, "loss": 0.2746, "loss_nan_ranks": 0, "loss_rank_avg": 0.29387450218200684, "step": 1820, "valid_targets_mean": 2449.2, "valid_targets_min": 648 }, { "epoch": 1.7839687194525904, "grad_norm": 0.6702820731559377, "learning_rate": 3.715739121520754e-05, "loss": 0.2842, "loss_nan_ranks": 0, "loss_rank_avg": 0.28223657608032227, "step": 1825, "valid_targets_mean": 2757.1, "valid_targets_min": 758 }, { "epoch": 1.7888563049853372, "grad_norm": 0.7241156064899832, "learning_rate": 3.7132288087267444e-05, "loss": 0.2754, "loss_nan_ranks": 0, "loss_rank_avg": 0.2525007128715515, "step": 1830, "valid_targets_mean": 1929.8, "valid_targets_min": 824 }, { "epoch": 1.793743890518084, "grad_norm": 0.6959493990441359, "learning_rate": 3.710708316024945e-05, "loss": 0.2691, "loss_nan_ranks": 0, "loss_rank_avg": 0.29006555676460266, "step": 1835, "valid_targets_mean": 2522.8, "valid_targets_min": 887 }, { "epoch": 1.7986314760508308, "grad_norm": 1.0690505659751939, "learning_rate": 3.708177658391979e-05, "loss": 0.283, "loss_nan_ranks": 0, "loss_rank_avg": 0.26409053802490234, "step": 1840, "valid_targets_mean": 2085.5, "valid_targets_min": 898 }, { "epoch": 1.8035190615835777, "grad_norm": 0.6416781900383685, "learning_rate": 3.70563685086487e-05, "loss": 0.2782, "loss_nan_ranks": 0, "loss_rank_avg": 0.2942282557487488, "step": 1845, "valid_targets_mean": 2790.2, "valid_targets_min": 518 }, { "epoch": 1.8084066471163245, "grad_norm": 0.6292212211636715, "learning_rate": 3.70308590854095e-05, "loss": 0.2636, "loss_nan_ranks": 0, "loss_rank_avg": 0.2690730392932892, "step": 1850, "valid_targets_mean": 2605.3, "valid_targets_min": 627 }, { "epoch": 1.8132942326490715, "grad_norm": 0.7563881415657474, "learning_rate": 3.7005248465777753e-05, "loss": 0.2757, "loss_nan_ranks": 0, "loss_rank_avg": 0.26602309942245483, "step": 1855, "valid_targets_mean": 1989.0, "valid_targets_min": 880 }, { "epoch": 1.8181818181818183, "grad_norm": 0.6636462614146774, "learning_rate": 3.697953680193028e-05, "loss": 0.2535, "loss_nan_ranks": 0, "loss_rank_avg": 0.2749035358428955, "step": 1860, "valid_targets_mean": 2244.6, "valid_targets_min": 1017 }, { "epoch": 1.8230694037145652, "grad_norm": 1.7607977847503449, "learning_rate": 3.695372424664433e-05, "loss": 0.2829, "loss_nan_ranks": 0, "loss_rank_avg": 0.29794639348983765, "step": 1865, "valid_targets_mean": 2888.2, "valid_targets_min": 843 }, { "epoch": 1.827956989247312, "grad_norm": 0.6664158354412304, "learning_rate": 3.692781095329662e-05, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.31028884649276733, "step": 1870, "valid_targets_mean": 2667.8, "valid_targets_min": 774 }, { "epoch": 1.8328445747800588, "grad_norm": 0.6484592517147627, "learning_rate": 3.690179707586247e-05, "loss": 0.2571, "loss_nan_ranks": 0, "loss_rank_avg": 0.2612004578113556, "step": 1875, "valid_targets_mean": 2415.0, "valid_targets_min": 817 }, { "epoch": 1.8377321603128056, "grad_norm": 0.6881093759344453, "learning_rate": 3.6875682768914847e-05, "loss": 0.2744, "loss_nan_ranks": 0, "loss_rank_avg": 0.2743026912212372, "step": 1880, "valid_targets_mean": 3187.6, "valid_targets_min": 1503 }, { "epoch": 1.8426197458455524, "grad_norm": 0.7092531777121036, "learning_rate": 3.684946818762349e-05, "loss": 0.2766, "loss_nan_ranks": 0, "loss_rank_avg": 0.24219094216823578, "step": 1885, "valid_targets_mean": 1849.3, "valid_targets_min": 538 }, { "epoch": 1.8475073313782993, "grad_norm": 0.7102034739129834, "learning_rate": 3.682315348775392e-05, "loss": 0.2668, "loss_nan_ranks": 0, "loss_rank_avg": 0.2451900839805603, "step": 1890, "valid_targets_mean": 2226.6, "valid_targets_min": 742 }, { "epoch": 1.852394916911046, "grad_norm": 0.6976435032370457, "learning_rate": 3.6796738825666606e-05, "loss": 0.2853, "loss_nan_ranks": 0, "loss_rank_avg": 0.34835338592529297, "step": 1895, "valid_targets_mean": 2488.8, "valid_targets_min": 821 }, { "epoch": 1.857282502443793, "grad_norm": 0.8345683696586109, "learning_rate": 3.6770224358315945e-05, "loss": 0.2892, "loss_nan_ranks": 0, "loss_rank_avg": 0.3025885820388794, "step": 1900, "valid_targets_mean": 2416.9, "valid_targets_min": 544 }, { "epoch": 1.8621700879765397, "grad_norm": 0.6734416069076511, "learning_rate": 3.674361024324939e-05, "loss": 0.2677, "loss_nan_ranks": 0, "loss_rank_avg": 0.2562083601951599, "step": 1905, "valid_targets_mean": 2252.0, "valid_targets_min": 1040 }, { "epoch": 1.8670576735092865, "grad_norm": 0.7258976397773823, "learning_rate": 3.67168966386065e-05, "loss": 0.2825, "loss_nan_ranks": 0, "loss_rank_avg": 0.29352593421936035, "step": 1910, "valid_targets_mean": 2220.9, "valid_targets_min": 770 }, { "epoch": 1.8719452590420333, "grad_norm": 0.8267516235866793, "learning_rate": 3.669008370311798e-05, "loss": 0.2589, "loss_nan_ranks": 0, "loss_rank_avg": 0.26839086413383484, "step": 1915, "valid_targets_mean": 2146.9, "valid_targets_min": 906 }, { "epoch": 1.8768328445747802, "grad_norm": 0.9090846152816757, "learning_rate": 3.666317159610478e-05, "loss": 0.2632, "loss_nan_ranks": 0, "loss_rank_avg": 0.2196088433265686, "step": 1920, "valid_targets_mean": 1943.8, "valid_targets_min": 627 }, { "epoch": 1.881720430107527, "grad_norm": 0.6328104571501864, "learning_rate": 3.6636160477477084e-05, "loss": 0.2789, "loss_nan_ranks": 0, "loss_rank_avg": 0.26850637793540955, "step": 1925, "valid_targets_mean": 2655.1, "valid_targets_min": 1260 }, { "epoch": 1.8866080156402738, "grad_norm": 0.734256137030361, "learning_rate": 3.6609050507733434e-05, "loss": 0.2497, "loss_nan_ranks": 0, "loss_rank_avg": 0.2635309100151062, "step": 1930, "valid_targets_mean": 2196.3, "valid_targets_min": 865 }, { "epoch": 1.8914956011730206, "grad_norm": 0.6466263966198653, "learning_rate": 3.6581841847959704e-05, "loss": 0.2661, "loss_nan_ranks": 0, "loss_rank_avg": 0.23648956418037415, "step": 1935, "valid_targets_mean": 2312.8, "valid_targets_min": 571 }, { "epoch": 1.8963831867057674, "grad_norm": 0.6012794126830221, "learning_rate": 3.6554534659828214e-05, "loss": 0.2612, "loss_nan_ranks": 0, "loss_rank_avg": 0.2779013514518738, "step": 1940, "valid_targets_mean": 2929.6, "valid_targets_min": 682 }, { "epoch": 1.9012707722385143, "grad_norm": 0.7694228039973774, "learning_rate": 3.652712910559671e-05, "loss": 0.2566, "loss_nan_ranks": 0, "loss_rank_avg": 0.2838958203792572, "step": 1945, "valid_targets_mean": 2658.0, "valid_targets_min": 1149 }, { "epoch": 1.906158357771261, "grad_norm": 0.6786164917053215, "learning_rate": 3.649962534810743e-05, "loss": 0.2663, "loss_nan_ranks": 0, "loss_rank_avg": 0.2658728361129761, "step": 1950, "valid_targets_mean": 2249.3, "valid_targets_min": 714 }, { "epoch": 1.911045943304008, "grad_norm": 0.6234672172314177, "learning_rate": 3.647202355078614e-05, "loss": 0.2912, "loss_nan_ranks": 0, "loss_rank_avg": 0.2740452289581299, "step": 1955, "valid_targets_mean": 2578.2, "valid_targets_min": 720 }, { "epoch": 1.9159335288367547, "grad_norm": 0.6515984804744183, "learning_rate": 3.644432387764113e-05, "loss": 0.2743, "loss_nan_ranks": 0, "loss_rank_avg": 0.28338634967803955, "step": 1960, "valid_targets_mean": 2537.2, "valid_targets_min": 781 }, { "epoch": 1.9208211143695015, "grad_norm": 0.6925882408989057, "learning_rate": 3.641652649326228e-05, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.28017061948776245, "step": 1965, "valid_targets_mean": 2322.9, "valid_targets_min": 790 }, { "epoch": 1.9257086999022484, "grad_norm": 0.721478062577497, "learning_rate": 3.638863156282007e-05, "loss": 0.2554, "loss_nan_ranks": 0, "loss_rank_avg": 0.2587317228317261, "step": 1970, "valid_targets_mean": 1998.3, "valid_targets_min": 818 }, { "epoch": 1.9305962854349952, "grad_norm": 0.670482355423357, "learning_rate": 3.6360639252064576e-05, "loss": 0.2743, "loss_nan_ranks": 0, "loss_rank_avg": 0.28506842255592346, "step": 1975, "valid_targets_mean": 2706.6, "valid_targets_min": 804 }, { "epoch": 1.935483870967742, "grad_norm": 0.7503529232237587, "learning_rate": 3.633254972732452e-05, "loss": 0.2646, "loss_nan_ranks": 0, "loss_rank_avg": 0.2652524411678314, "step": 1980, "valid_targets_mean": 2164.6, "valid_targets_min": 1087 }, { "epoch": 1.9403714565004888, "grad_norm": 0.6787558928888673, "learning_rate": 3.630436315550624e-05, "loss": 0.2794, "loss_nan_ranks": 0, "loss_rank_avg": 0.24034081399440765, "step": 1985, "valid_targets_mean": 2107.4, "valid_targets_min": 771 }, { "epoch": 1.9452590420332356, "grad_norm": 0.7914047009085244, "learning_rate": 3.6276079704092755e-05, "loss": 0.2695, "loss_nan_ranks": 0, "loss_rank_avg": 0.2761124074459076, "step": 1990, "valid_targets_mean": 2557.2, "valid_targets_min": 836 }, { "epoch": 1.9501466275659824, "grad_norm": 0.6934610377236305, "learning_rate": 3.6247699541142705e-05, "loss": 0.2829, "loss_nan_ranks": 0, "loss_rank_avg": 0.2904479503631592, "step": 1995, "valid_targets_mean": 2472.5, "valid_targets_min": 620 }, { "epoch": 1.9550342130987293, "grad_norm": 0.7028198944986546, "learning_rate": 3.62192228352894e-05, "loss": 0.2753, "loss_nan_ranks": 0, "loss_rank_avg": 0.30306535959243774, "step": 2000, "valid_targets_mean": 2393.2, "valid_targets_min": 820 }, { "epoch": 1.959921798631476, "grad_norm": 0.6656505685896379, "learning_rate": 3.6190649755739803e-05, "loss": 0.2696, "loss_nan_ranks": 0, "loss_rank_avg": 0.27111366391181946, "step": 2005, "valid_targets_mean": 2641.5, "valid_targets_min": 655 }, { "epoch": 1.964809384164223, "grad_norm": 0.6548401411079302, "learning_rate": 3.616198047227353e-05, "loss": 0.267, "loss_nan_ranks": 0, "loss_rank_avg": 0.26000118255615234, "step": 2010, "valid_targets_mean": 2489.2, "valid_targets_min": 1225 }, { "epoch": 1.9696969696969697, "grad_norm": 0.7088864087296969, "learning_rate": 3.613321515524181e-05, "loss": 0.2591, "loss_nan_ranks": 0, "loss_rank_avg": 0.2879897654056549, "step": 2015, "valid_targets_mean": 2197.8, "valid_targets_min": 916 }, { "epoch": 1.9745845552297165, "grad_norm": 0.7810945047814258, "learning_rate": 3.610435397556653e-05, "loss": 0.2669, "loss_nan_ranks": 0, "loss_rank_avg": 0.25487759709358215, "step": 2020, "valid_targets_mean": 1809.1, "valid_targets_min": 1181 }, { "epoch": 1.9794721407624634, "grad_norm": 0.6618807198434398, "learning_rate": 3.607539710473916e-05, "loss": 0.28, "loss_nan_ranks": 0, "loss_rank_avg": 0.2809375524520874, "step": 2025, "valid_targets_mean": 2645.9, "valid_targets_min": 714 }, { "epoch": 1.9843597262952102, "grad_norm": 0.6889464103259075, "learning_rate": 3.6046344714819786e-05, "loss": 0.2818, "loss_nan_ranks": 0, "loss_rank_avg": 0.27869024872779846, "step": 2030, "valid_targets_mean": 2894.4, "valid_targets_min": 612 }, { "epoch": 1.989247311827957, "grad_norm": 0.7597436857623857, "learning_rate": 3.601719697843604e-05, "loss": 0.2596, "loss_nan_ranks": 0, "loss_rank_avg": 0.24141916632652283, "step": 2035, "valid_targets_mean": 1800.8, "valid_targets_min": 648 }, { "epoch": 1.9941348973607038, "grad_norm": 0.6357417452126822, "learning_rate": 3.5987954068782114e-05, "loss": 0.2673, "loss_nan_ranks": 0, "loss_rank_avg": 0.28626328706741333, "step": 2040, "valid_targets_mean": 3067.6, "valid_targets_min": 824 }, { "epoch": 1.9990224828934506, "grad_norm": 0.6268686861206388, "learning_rate": 3.595861615961771e-05, "loss": 0.2615, "loss_nan_ranks": 0, "loss_rank_avg": 0.25856465101242065, "step": 2045, "valid_targets_mean": 2928.6, "valid_targets_min": 1156 }, { "epoch": 2.0039100684261975, "grad_norm": 0.5633104622128313, "learning_rate": 3.5929183425267e-05, "loss": 0.2354, "loss_nan_ranks": 0, "loss_rank_avg": 0.2239726036787033, "step": 2050, "valid_targets_mean": 2999.4, "valid_targets_min": 631 }, { "epoch": 2.0087976539589443, "grad_norm": 0.7030082756993576, "learning_rate": 3.589965604061762e-05, "loss": 0.241, "loss_nan_ranks": 0, "loss_rank_avg": 0.26195091009140015, "step": 2055, "valid_targets_mean": 2908.1, "valid_targets_min": 793 }, { "epoch": 2.013685239491691, "grad_norm": 0.7032018693280796, "learning_rate": 3.5870034181119605e-05, "loss": 0.2413, "loss_nan_ranks": 0, "loss_rank_avg": 0.23086042702198029, "step": 2060, "valid_targets_mean": 2292.1, "valid_targets_min": 748 }, { "epoch": 2.018572825024438, "grad_norm": 0.8062986669540131, "learning_rate": 3.5840318022784345e-05, "loss": 0.2279, "loss_nan_ranks": 0, "loss_rank_avg": 0.24330705404281616, "step": 2065, "valid_targets_mean": 2035.7, "valid_targets_min": 804 }, { "epoch": 2.0234604105571847, "grad_norm": 0.7456760467454644, "learning_rate": 3.5810507742183555e-05, "loss": 0.2319, "loss_nan_ranks": 0, "loss_rank_avg": 0.24097514152526855, "step": 2070, "valid_targets_mean": 2251.5, "valid_targets_min": 656 }, { "epoch": 2.0283479960899315, "grad_norm": 0.7974068850160627, "learning_rate": 3.5780603516448235e-05, "loss": 0.2364, "loss_nan_ranks": 0, "loss_rank_avg": 0.25509095191955566, "step": 2075, "valid_targets_mean": 2308.2, "valid_targets_min": 842 }, { "epoch": 2.0332355816226784, "grad_norm": 0.7027608391523197, "learning_rate": 3.575060552326758e-05, "loss": 0.2605, "loss_nan_ranks": 0, "loss_rank_avg": 0.26107388734817505, "step": 2080, "valid_targets_mean": 2641.1, "valid_targets_min": 702 }, { "epoch": 2.038123167155425, "grad_norm": 0.6771926382902913, "learning_rate": 3.572051394088795e-05, "loss": 0.2389, "loss_nan_ranks": 0, "loss_rank_avg": 0.254364550113678, "step": 2085, "valid_targets_mean": 3093.8, "valid_targets_min": 1095 }, { "epoch": 2.043010752688172, "grad_norm": 0.7920555868975577, "learning_rate": 3.569032894811182e-05, "loss": 0.2325, "loss_nan_ranks": 0, "loss_rank_avg": 0.25785136222839355, "step": 2090, "valid_targets_mean": 2053.3, "valid_targets_min": 803 }, { "epoch": 2.047898338220919, "grad_norm": 0.6836448197530809, "learning_rate": 3.566005072429668e-05, "loss": 0.2324, "loss_nan_ranks": 0, "loss_rank_avg": 0.21475102007389069, "step": 2095, "valid_targets_mean": 2353.8, "valid_targets_min": 976 }, { "epoch": 2.0527859237536656, "grad_norm": 0.712116095288442, "learning_rate": 3.562967944935402e-05, "loss": 0.2388, "loss_nan_ranks": 0, "loss_rank_avg": 0.23862826824188232, "step": 2100, "valid_targets_mean": 2316.5, "valid_targets_min": 768 }, { "epoch": 2.0576735092864125, "grad_norm": 0.7340036820210002, "learning_rate": 3.559921530374821e-05, "loss": 0.236, "loss_nan_ranks": 0, "loss_rank_avg": 0.2310110479593277, "step": 2105, "valid_targets_mean": 2313.2, "valid_targets_min": 763 }, { "epoch": 2.0625610948191593, "grad_norm": 0.7950851146965314, "learning_rate": 3.556865846849547e-05, "loss": 0.2363, "loss_nan_ranks": 0, "loss_rank_avg": 0.24690885841846466, "step": 2110, "valid_targets_mean": 1923.8, "valid_targets_min": 684 }, { "epoch": 2.067448680351906, "grad_norm": 0.9485462964048043, "learning_rate": 3.5538009125162774e-05, "loss": 0.2383, "loss_nan_ranks": 0, "loss_rank_avg": 0.2360670119524002, "step": 2115, "valid_targets_mean": 2597.2, "valid_targets_min": 1328 }, { "epoch": 2.072336265884653, "grad_norm": 0.6042905131795798, "learning_rate": 3.550726745586677e-05, "loss": 0.2464, "loss_nan_ranks": 0, "loss_rank_avg": 0.24113643169403076, "step": 2120, "valid_targets_mean": 3059.4, "valid_targets_min": 884 }, { "epoch": 2.0772238514173997, "grad_norm": 0.6939861915048151, "learning_rate": 3.5476433643272695e-05, "loss": 0.2375, "loss_nan_ranks": 0, "loss_rank_avg": 0.23294597864151, "step": 2125, "valid_targets_mean": 2400.4, "valid_targets_min": 863 }, { "epoch": 2.0821114369501466, "grad_norm": 0.7426227574519302, "learning_rate": 3.5445507870593315e-05, "loss": 0.2289, "loss_nan_ranks": 0, "loss_rank_avg": 0.2383473813533783, "step": 2130, "valid_targets_mean": 2200.8, "valid_targets_min": 670 }, { "epoch": 2.0869990224828934, "grad_norm": 0.6868218935296267, "learning_rate": 3.54144903215878e-05, "loss": 0.2284, "loss_nan_ranks": 0, "loss_rank_avg": 0.2236156016588211, "step": 2135, "valid_targets_mean": 2512.4, "valid_targets_min": 522 }, { "epoch": 2.09188660801564, "grad_norm": 0.734071113886848, "learning_rate": 3.538338118056065e-05, "loss": 0.2584, "loss_nan_ranks": 0, "loss_rank_avg": 0.26370787620544434, "step": 2140, "valid_targets_mean": 2402.6, "valid_targets_min": 731 }, { "epoch": 2.096774193548387, "grad_norm": 0.7089461463159339, "learning_rate": 3.5352180632360614e-05, "loss": 0.2381, "loss_nan_ranks": 0, "loss_rank_avg": 0.212519571185112, "step": 2145, "valid_targets_mean": 2266.1, "valid_targets_min": 504 }, { "epoch": 2.101661779081134, "grad_norm": 0.791032807011372, "learning_rate": 3.532088886237956e-05, "loss": 0.2364, "loss_nan_ranks": 0, "loss_rank_avg": 0.2348712533712387, "step": 2150, "valid_targets_mean": 2305.6, "valid_targets_min": 746 }, { "epoch": 2.1065493646138806, "grad_norm": 0.6579340652769179, "learning_rate": 3.5289506056551414e-05, "loss": 0.2562, "loss_nan_ranks": 0, "loss_rank_avg": 0.27510562539100647, "step": 2155, "valid_targets_mean": 2961.9, "valid_targets_min": 680 }, { "epoch": 2.1114369501466275, "grad_norm": 0.7467367590945104, "learning_rate": 3.5258032401351005e-05, "loss": 0.249, "loss_nan_ranks": 0, "loss_rank_avg": 0.22451433539390564, "step": 2160, "valid_targets_mean": 2105.4, "valid_targets_min": 765 }, { "epoch": 2.1163245356793743, "grad_norm": 0.9754841406665122, "learning_rate": 3.522646808379299e-05, "loss": 0.2308, "loss_nan_ranks": 0, "loss_rank_avg": 0.2368217408657074, "step": 2165, "valid_targets_mean": 2108.7, "valid_targets_min": 618 }, { "epoch": 2.121212121212121, "grad_norm": 0.679630597898811, "learning_rate": 3.519481329143076e-05, "loss": 0.2381, "loss_nan_ranks": 0, "loss_rank_avg": 0.23734697699546814, "step": 2170, "valid_targets_mean": 2571.5, "valid_targets_min": 1089 }, { "epoch": 2.126099706744868, "grad_norm": 0.658153760353656, "learning_rate": 3.5163068212355274e-05, "loss": 0.2397, "loss_nan_ranks": 0, "loss_rank_avg": 0.256761372089386, "step": 2175, "valid_targets_mean": 2925.9, "valid_targets_min": 803 }, { "epoch": 2.1309872922776147, "grad_norm": 0.7475086838003469, "learning_rate": 3.513123303519397e-05, "loss": 0.2297, "loss_nan_ranks": 0, "loss_rank_avg": 0.22203174233436584, "step": 2180, "valid_targets_mean": 1844.1, "valid_targets_min": 692 }, { "epoch": 2.1358748778103616, "grad_norm": 0.6041239999536051, "learning_rate": 3.509930794910967e-05, "loss": 0.2367, "loss_nan_ranks": 0, "loss_rank_avg": 0.22519180178642273, "step": 2185, "valid_targets_mean": 3204.3, "valid_targets_min": 946 }, { "epoch": 2.1407624633431084, "grad_norm": 0.7509582157797575, "learning_rate": 3.506729314379941e-05, "loss": 0.2274, "loss_nan_ranks": 0, "loss_rank_avg": 0.25604188442230225, "step": 2190, "valid_targets_mean": 2394.9, "valid_targets_min": 677 }, { "epoch": 2.145650048875855, "grad_norm": 0.6750872876590103, "learning_rate": 3.5035188809493335e-05, "loss": 0.2311, "loss_nan_ranks": 0, "loss_rank_avg": 0.22361913323402405, "step": 2195, "valid_targets_mean": 2691.1, "valid_targets_min": 791 }, { "epoch": 2.150537634408602, "grad_norm": 0.6447663759799113, "learning_rate": 3.500299513695356e-05, "loss": 0.2355, "loss_nan_ranks": 0, "loss_rank_avg": 0.22863362729549408, "step": 2200, "valid_targets_mean": 2783.2, "valid_targets_min": 853 }, { "epoch": 2.155425219941349, "grad_norm": 0.7166550535292393, "learning_rate": 3.497071231747306e-05, "loss": 0.2224, "loss_nan_ranks": 0, "loss_rank_avg": 0.25535690784454346, "step": 2205, "valid_targets_mean": 2722.8, "valid_targets_min": 989 }, { "epoch": 2.1603128054740957, "grad_norm": 0.8862852553501419, "learning_rate": 3.493834054287449e-05, "loss": 0.2387, "loss_nan_ranks": 0, "loss_rank_avg": 0.24125589430332184, "step": 2210, "valid_targets_mean": 2089.8, "valid_targets_min": 787 }, { "epoch": 2.1652003910068425, "grad_norm": 0.7210539973246137, "learning_rate": 3.490588000550911e-05, "loss": 0.2345, "loss_nan_ranks": 0, "loss_rank_avg": 0.26080626249313354, "step": 2215, "valid_targets_mean": 2307.4, "valid_targets_min": 995 }, { "epoch": 2.1700879765395893, "grad_norm": 0.6876101039598905, "learning_rate": 3.4873330898255556e-05, "loss": 0.2342, "loss_nan_ranks": 0, "loss_rank_avg": 0.22508588433265686, "step": 2220, "valid_targets_mean": 2578.5, "valid_targets_min": 551 }, { "epoch": 2.174975562072336, "grad_norm": 0.679616490089902, "learning_rate": 3.4840693414518776e-05, "loss": 0.2306, "loss_nan_ranks": 0, "loss_rank_avg": 0.22549769282341003, "step": 2225, "valid_targets_mean": 2478.4, "valid_targets_min": 1293 }, { "epoch": 2.179863147605083, "grad_norm": 0.6885669807827226, "learning_rate": 3.4807967748228844e-05, "loss": 0.2404, "loss_nan_ranks": 0, "loss_rank_avg": 0.21673941612243652, "step": 2230, "valid_targets_mean": 2484.1, "valid_targets_min": 1140 }, { "epoch": 2.1847507331378297, "grad_norm": 0.6971954496384682, "learning_rate": 3.477515409383979e-05, "loss": 0.2313, "loss_nan_ranks": 0, "loss_rank_avg": 0.22069767117500305, "step": 2235, "valid_targets_mean": 2294.4, "valid_targets_min": 914 }, { "epoch": 2.1896383186705766, "grad_norm": 0.7601614406567037, "learning_rate": 3.474225264632847e-05, "loss": 0.2424, "loss_nan_ranks": 0, "loss_rank_avg": 0.20157967507839203, "step": 2240, "valid_targets_mean": 1873.1, "valid_targets_min": 615 }, { "epoch": 2.1945259042033234, "grad_norm": 0.6527427792093988, "learning_rate": 3.470926360119343e-05, "loss": 0.2372, "loss_nan_ranks": 0, "loss_rank_avg": 0.22357343137264252, "step": 2245, "valid_targets_mean": 2597.2, "valid_targets_min": 720 }, { "epoch": 2.19941348973607, "grad_norm": 1.2913533556146168, "learning_rate": 3.467618715445367e-05, "loss": 0.2438, "loss_nan_ranks": 0, "loss_rank_avg": 0.2719864845275879, "step": 2250, "valid_targets_mean": 2356.8, "valid_targets_min": 1038 }, { "epoch": 2.204301075268817, "grad_norm": 0.6982533310800236, "learning_rate": 3.464302350264756e-05, "loss": 0.2392, "loss_nan_ranks": 0, "loss_rank_avg": 0.23422983288764954, "step": 2255, "valid_targets_mean": 2767.9, "valid_targets_min": 753 }, { "epoch": 2.209188660801564, "grad_norm": 0.7221984393019797, "learning_rate": 3.460977284283162e-05, "loss": 0.2455, "loss_nan_ranks": 0, "loss_rank_avg": 0.266290545463562, "step": 2260, "valid_targets_mean": 2269.7, "valid_targets_min": 822 }, { "epoch": 2.2140762463343107, "grad_norm": 0.7114567359248741, "learning_rate": 3.457643537257938e-05, "loss": 0.2313, "loss_nan_ranks": 0, "loss_rank_avg": 0.19123372435569763, "step": 2265, "valid_targets_mean": 1872.2, "valid_targets_min": 570 }, { "epoch": 2.2189638318670575, "grad_norm": 0.6540588887195975, "learning_rate": 3.454301128998018e-05, "loss": 0.2204, "loss_nan_ranks": 0, "loss_rank_avg": 0.2638104259967804, "step": 2270, "valid_targets_mean": 3022.8, "valid_targets_min": 987 }, { "epoch": 2.2238514173998043, "grad_norm": 0.6898490839976488, "learning_rate": 3.4509500793638015e-05, "loss": 0.239, "loss_nan_ranks": 0, "loss_rank_avg": 0.2437189519405365, "step": 2275, "valid_targets_mean": 2453.7, "valid_targets_min": 656 }, { "epoch": 2.228739002932551, "grad_norm": 0.7463219837340317, "learning_rate": 3.447590408267034e-05, "loss": 0.2394, "loss_nan_ranks": 0, "loss_rank_avg": 0.21820449829101562, "step": 2280, "valid_targets_mean": 2064.9, "valid_targets_min": 748 }, { "epoch": 2.233626588465298, "grad_norm": 0.7810585743007555, "learning_rate": 3.444222135670688e-05, "loss": 0.2394, "loss_nan_ranks": 0, "loss_rank_avg": 0.2506566643714905, "step": 2285, "valid_targets_mean": 2264.9, "valid_targets_min": 820 }, { "epoch": 2.2385141739980448, "grad_norm": 0.7468906966516604, "learning_rate": 3.44084528158885e-05, "loss": 0.2261, "loss_nan_ranks": 0, "loss_rank_avg": 0.22076962888240814, "step": 2290, "valid_targets_mean": 2084.4, "valid_targets_min": 721 }, { "epoch": 2.2434017595307916, "grad_norm": 0.7194591472281033, "learning_rate": 3.437459866086591e-05, "loss": 0.2509, "loss_nan_ranks": 0, "loss_rank_avg": 0.23915450274944305, "step": 2295, "valid_targets_mean": 2377.3, "valid_targets_min": 650 }, { "epoch": 2.2482893450635384, "grad_norm": 0.7180690575974027, "learning_rate": 3.4340659092798594e-05, "loss": 0.2362, "loss_nan_ranks": 0, "loss_rank_avg": 0.2506748139858246, "step": 2300, "valid_targets_mean": 2737.3, "valid_targets_min": 567 }, { "epoch": 2.253176930596285, "grad_norm": 0.6309852432550281, "learning_rate": 3.4306634313353504e-05, "loss": 0.2256, "loss_nan_ranks": 0, "loss_rank_avg": 0.2439078688621521, "step": 2305, "valid_targets_mean": 3100.8, "valid_targets_min": 914 }, { "epoch": 2.258064516129032, "grad_norm": 0.7572600999737557, "learning_rate": 3.427252452470395e-05, "loss": 0.2469, "loss_nan_ranks": 0, "loss_rank_avg": 0.2431081384420395, "step": 2310, "valid_targets_mean": 1790.9, "valid_targets_min": 640 }, { "epoch": 2.262952101661779, "grad_norm": 0.683772308399432, "learning_rate": 3.423832992952836e-05, "loss": 0.2364, "loss_nan_ranks": 0, "loss_rank_avg": 0.24556618928909302, "step": 2315, "valid_targets_mean": 2683.7, "valid_targets_min": 801 }, { "epoch": 2.2678396871945257, "grad_norm": 0.8397527577042548, "learning_rate": 3.420405073100905e-05, "loss": 0.2359, "loss_nan_ranks": 0, "loss_rank_avg": 0.254273384809494, "step": 2320, "valid_targets_mean": 2155.0, "valid_targets_min": 867 }, { "epoch": 2.2727272727272725, "grad_norm": 0.851065317435724, "learning_rate": 3.416968713283105e-05, "loss": 0.2542, "loss_nan_ranks": 0, "loss_rank_avg": 0.2502952814102173, "step": 2325, "valid_targets_mean": 2122.0, "valid_targets_min": 684 }, { "epoch": 2.2776148582600193, "grad_norm": 0.6985298739440852, "learning_rate": 3.413523933918093e-05, "loss": 0.2351, "loss_nan_ranks": 0, "loss_rank_avg": 0.22682811319828033, "step": 2330, "valid_targets_mean": 2159.1, "valid_targets_min": 795 }, { "epoch": 2.2825024437927666, "grad_norm": 0.8111962594657017, "learning_rate": 3.4100707554745495e-05, "loss": 0.2504, "loss_nan_ranks": 0, "loss_rank_avg": 0.24102097749710083, "step": 2335, "valid_targets_mean": 2234.1, "valid_targets_min": 705 }, { "epoch": 2.2873900293255134, "grad_norm": 0.5993930502127762, "learning_rate": 3.406609198471064e-05, "loss": 0.2297, "loss_nan_ranks": 0, "loss_rank_avg": 0.18438704311847687, "step": 2340, "valid_targets_mean": 2438.3, "valid_targets_min": 1216 }, { "epoch": 2.29227761485826, "grad_norm": 0.7265646225215977, "learning_rate": 3.403139283476011e-05, "loss": 0.2342, "loss_nan_ranks": 0, "loss_rank_avg": 0.2278384566307068, "step": 2345, "valid_targets_mean": 2198.9, "valid_targets_min": 1056 }, { "epoch": 2.297165200391007, "grad_norm": 0.6075073209468058, "learning_rate": 3.3996610311074266e-05, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.2122841477394104, "step": 2350, "valid_targets_mean": 2752.8, "valid_targets_min": 762 }, { "epoch": 2.302052785923754, "grad_norm": 0.6706963737298545, "learning_rate": 3.396174462032888e-05, "loss": 0.2452, "loss_nan_ranks": 0, "loss_rank_avg": 0.241616889834404, "step": 2355, "valid_targets_mean": 2314.3, "valid_targets_min": 637 }, { "epoch": 2.3069403714565007, "grad_norm": 1.1053006675938248, "learning_rate": 3.392679596969391e-05, "loss": 0.2285, "loss_nan_ranks": 0, "loss_rank_avg": 0.232365682721138, "step": 2360, "valid_targets_mean": 2931.2, "valid_targets_min": 1234 }, { "epoch": 2.3118279569892475, "grad_norm": 0.68661451987901, "learning_rate": 3.389176456683222e-05, "loss": 0.2406, "loss_nan_ranks": 0, "loss_rank_avg": 0.2415533810853958, "step": 2365, "valid_targets_mean": 2462.8, "valid_targets_min": 748 }, { "epoch": 2.3167155425219943, "grad_norm": 0.7999782604502889, "learning_rate": 3.385665061989842e-05, "loss": 0.2181, "loss_nan_ranks": 0, "loss_rank_avg": 0.21598216891288757, "step": 2370, "valid_targets_mean": 1724.7, "valid_targets_min": 662 }, { "epoch": 2.321603128054741, "grad_norm": 0.7182473780722957, "learning_rate": 3.382145433753758e-05, "loss": 0.2471, "loss_nan_ranks": 0, "loss_rank_avg": 0.27340924739837646, "step": 2375, "valid_targets_mean": 2582.8, "valid_targets_min": 774 }, { "epoch": 2.326490713587488, "grad_norm": 0.7676223492166587, "learning_rate": 3.3786175928883994e-05, "loss": 0.2299, "loss_nan_ranks": 0, "loss_rank_avg": 0.21359305083751678, "step": 2380, "valid_targets_mean": 1934.9, "valid_targets_min": 646 }, { "epoch": 2.3313782991202348, "grad_norm": 0.701569446945032, "learning_rate": 3.375081560355996e-05, "loss": 0.2327, "loss_nan_ranks": 0, "loss_rank_avg": 0.24448227882385254, "step": 2385, "valid_targets_mean": 2355.2, "valid_targets_min": 700 }, { "epoch": 2.3362658846529816, "grad_norm": 0.668238001789143, "learning_rate": 3.3715373571674495e-05, "loss": 0.2522, "loss_nan_ranks": 0, "loss_rank_avg": 0.24243560433387756, "step": 2390, "valid_targets_mean": 2480.6, "valid_targets_min": 1062 }, { "epoch": 2.3411534701857284, "grad_norm": 0.7311150815773109, "learning_rate": 3.367985004382216e-05, "loss": 0.2438, "loss_nan_ranks": 0, "loss_rank_avg": 0.22406163811683655, "step": 2395, "valid_targets_mean": 1759.3, "valid_targets_min": 1058 }, { "epoch": 2.346041055718475, "grad_norm": 0.6489801175202864, "learning_rate": 3.36442452310817e-05, "loss": 0.2393, "loss_nan_ranks": 0, "loss_rank_avg": 0.2665456533432007, "step": 2400, "valid_targets_mean": 2741.1, "valid_targets_min": 772 }, { "epoch": 2.350928641251222, "grad_norm": 0.6383014149144618, "learning_rate": 3.36085593450149e-05, "loss": 0.2314, "loss_nan_ranks": 0, "loss_rank_avg": 0.23392713069915771, "step": 2405, "valid_targets_mean": 2465.8, "valid_targets_min": 697 }, { "epoch": 2.355816226783969, "grad_norm": 0.6749587378319567, "learning_rate": 3.3572792597665244e-05, "loss": 0.2422, "loss_nan_ranks": 0, "loss_rank_avg": 0.2573961019515991, "step": 2410, "valid_targets_mean": 2782.9, "valid_targets_min": 888 }, { "epoch": 2.3607038123167157, "grad_norm": 0.9440638611034704, "learning_rate": 3.353694520155672e-05, "loss": 0.2449, "loss_nan_ranks": 0, "loss_rank_avg": 0.24345912039279938, "step": 2415, "valid_targets_mean": 2128.4, "valid_targets_min": 1012 }, { "epoch": 2.3655913978494625, "grad_norm": 0.7148978990158092, "learning_rate": 3.350101736969249e-05, "loss": 0.2563, "loss_nan_ranks": 0, "loss_rank_avg": 0.2735242247581482, "step": 2420, "valid_targets_mean": 2309.9, "valid_targets_min": 771 }, { "epoch": 2.3704789833822093, "grad_norm": 0.8017459949388398, "learning_rate": 3.346500931555369e-05, "loss": 0.23, "loss_nan_ranks": 0, "loss_rank_avg": 0.2165670096874237, "step": 2425, "valid_targets_mean": 2131.1, "valid_targets_min": 708 }, { "epoch": 2.375366568914956, "grad_norm": 0.6221765808255351, "learning_rate": 3.3428921253098126e-05, "loss": 0.2281, "loss_nan_ranks": 0, "loss_rank_avg": 0.26252031326293945, "step": 2430, "valid_targets_mean": 3323.1, "valid_targets_min": 1030 }, { "epoch": 2.380254154447703, "grad_norm": 0.6740618705615318, "learning_rate": 3.3392753396759e-05, "loss": 0.2462, "loss_nan_ranks": 0, "loss_rank_avg": 0.23797520995140076, "step": 2435, "valid_targets_mean": 2207.9, "valid_targets_min": 734 }, { "epoch": 2.3851417399804498, "grad_norm": 0.7273981487589926, "learning_rate": 3.3356505961443644e-05, "loss": 0.2382, "loss_nan_ranks": 0, "loss_rank_avg": 0.23226913809776306, "step": 2440, "valid_targets_mean": 2119.9, "valid_targets_min": 685 }, { "epoch": 2.3900293255131966, "grad_norm": 0.7495183220790104, "learning_rate": 3.332017916253227e-05, "loss": 0.2438, "loss_nan_ranks": 0, "loss_rank_avg": 0.2352924793958664, "step": 2445, "valid_targets_mean": 2707.6, "valid_targets_min": 714 }, { "epoch": 2.3949169110459434, "grad_norm": 0.7842291061024107, "learning_rate": 3.328377321587662e-05, "loss": 0.2427, "loss_nan_ranks": 0, "loss_rank_avg": 0.22039464116096497, "step": 2450, "valid_targets_mean": 1844.9, "valid_targets_min": 544 }, { "epoch": 2.39980449657869, "grad_norm": 0.6173507633048779, "learning_rate": 3.324728833779876e-05, "loss": 0.2391, "loss_nan_ranks": 0, "loss_rank_avg": 0.23128989338874817, "step": 2455, "valid_targets_mean": 2820.6, "valid_targets_min": 1219 }, { "epoch": 2.404692082111437, "grad_norm": 0.7009098945991525, "learning_rate": 3.3210724745089757e-05, "loss": 0.218, "loss_nan_ranks": 0, "loss_rank_avg": 0.20386609435081482, "step": 2460, "valid_targets_mean": 2477.1, "valid_targets_min": 622 }, { "epoch": 2.409579667644184, "grad_norm": 0.7651345366780957, "learning_rate": 3.31740826550084e-05, "loss": 0.2345, "loss_nan_ranks": 0, "loss_rank_avg": 0.2441290318965912, "step": 2465, "valid_targets_mean": 2235.6, "valid_targets_min": 783 }, { "epoch": 2.4144672531769307, "grad_norm": 0.7279723174495759, "learning_rate": 3.313736228527987e-05, "loss": 0.226, "loss_nan_ranks": 0, "loss_rank_avg": 0.2114153504371643, "step": 2470, "valid_targets_mean": 2223.0, "valid_targets_min": 761 }, { "epoch": 2.4193548387096775, "grad_norm": 0.7868641978840135, "learning_rate": 3.310056385409453e-05, "loss": 0.2494, "loss_nan_ranks": 0, "loss_rank_avg": 0.26033109426498413, "step": 2475, "valid_targets_mean": 2057.3, "valid_targets_min": 770 }, { "epoch": 2.4242424242424243, "grad_norm": 0.6636689132066698, "learning_rate": 3.3063687580106544e-05, "loss": 0.2226, "loss_nan_ranks": 0, "loss_rank_avg": 0.2515316903591156, "step": 2480, "valid_targets_mean": 2834.2, "valid_targets_min": 750 }, { "epoch": 2.429130009775171, "grad_norm": 0.7145023267491682, "learning_rate": 3.302673368243264e-05, "loss": 0.241, "loss_nan_ranks": 0, "loss_rank_avg": 0.2276870310306549, "step": 2485, "valid_targets_mean": 2252.9, "valid_targets_min": 668 }, { "epoch": 2.434017595307918, "grad_norm": 0.6488982935705684, "learning_rate": 3.298970238065077e-05, "loss": 0.243, "loss_nan_ranks": 0, "loss_rank_avg": 0.250893771648407, "step": 2490, "valid_targets_mean": 2848.4, "valid_targets_min": 1069 }, { "epoch": 2.4389051808406648, "grad_norm": 0.6730474280370319, "learning_rate": 3.2952593894798796e-05, "loss": 0.236, "loss_nan_ranks": 0, "loss_rank_avg": 0.22307783365249634, "step": 2495, "valid_targets_mean": 2428.5, "valid_targets_min": 934 }, { "epoch": 2.4437927663734116, "grad_norm": 0.7947851421243562, "learning_rate": 3.291540844537324e-05, "loss": 0.237, "loss_nan_ranks": 0, "loss_rank_avg": 0.2531839907169342, "step": 2500, "valid_targets_mean": 1988.7, "valid_targets_min": 690 }, { "epoch": 2.4486803519061584, "grad_norm": 0.6648566470243608, "learning_rate": 3.287814625332792e-05, "loss": 0.2428, "loss_nan_ranks": 0, "loss_rank_avg": 0.2527335286140442, "step": 2505, "valid_targets_mean": 2601.8, "valid_targets_min": 1007 }, { "epoch": 2.4535679374389052, "grad_norm": 0.7237098939276865, "learning_rate": 3.2840807540072644e-05, "loss": 0.2483, "loss_nan_ranks": 0, "loss_rank_avg": 0.24128659069538116, "step": 2510, "valid_targets_mean": 2112.2, "valid_targets_min": 1071 }, { "epoch": 2.458455522971652, "grad_norm": 0.671690132960215, "learning_rate": 3.280339252747192e-05, "loss": 0.2359, "loss_nan_ranks": 0, "loss_rank_avg": 0.24696272611618042, "step": 2515, "valid_targets_mean": 2795.6, "valid_targets_min": 610 }, { "epoch": 2.463343108504399, "grad_norm": 0.6700935950794794, "learning_rate": 3.276590143784362e-05, "loss": 0.2486, "loss_nan_ranks": 0, "loss_rank_avg": 0.21841683983802795, "step": 2520, "valid_targets_mean": 2417.8, "valid_targets_min": 676 }, { "epoch": 2.4682306940371457, "grad_norm": 0.6719669379309949, "learning_rate": 3.2728334493957654e-05, "loss": 0.2381, "loss_nan_ranks": 0, "loss_rank_avg": 0.22499142587184906, "step": 2525, "valid_targets_mean": 2297.1, "valid_targets_min": 699 }, { "epoch": 2.4731182795698925, "grad_norm": 0.6892705433904501, "learning_rate": 3.269069191903466e-05, "loss": 0.2297, "loss_nan_ranks": 0, "loss_rank_avg": 0.22186297178268433, "step": 2530, "valid_targets_mean": 2068.8, "valid_targets_min": 740 }, { "epoch": 2.4780058651026393, "grad_norm": 0.7393767252579292, "learning_rate": 3.2652973936744667e-05, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.2544059157371521, "step": 2535, "valid_targets_mean": 2338.4, "valid_targets_min": 722 }, { "epoch": 2.482893450635386, "grad_norm": 0.7561597467756237, "learning_rate": 3.261518077120578e-05, "loss": 0.2435, "loss_nan_ranks": 0, "loss_rank_avg": 0.21395118534564972, "step": 2540, "valid_targets_mean": 1770.1, "valid_targets_min": 589 }, { "epoch": 2.487781036168133, "grad_norm": 0.753579094986984, "learning_rate": 3.257731264698283e-05, "loss": 0.2228, "loss_nan_ranks": 0, "loss_rank_avg": 0.21489103138446808, "step": 2545, "valid_targets_mean": 1672.8, "valid_targets_min": 755 }, { "epoch": 2.4926686217008798, "grad_norm": 0.6589858003710982, "learning_rate": 3.253936978908604e-05, "loss": 0.2293, "loss_nan_ranks": 0, "loss_rank_avg": 0.24498148262500763, "step": 2550, "valid_targets_mean": 3218.2, "valid_targets_min": 1118 }, { "epoch": 2.4975562072336266, "grad_norm": 0.7002768152776646, "learning_rate": 3.250135242296971e-05, "loss": 0.2514, "loss_nan_ranks": 0, "loss_rank_avg": 0.2629767060279846, "step": 2555, "valid_targets_mean": 2427.2, "valid_targets_min": 796 }, { "epoch": 2.5024437927663734, "grad_norm": 0.786673139351379, "learning_rate": 3.246326077453087e-05, "loss": 0.2267, "loss_nan_ranks": 0, "loss_rank_avg": 0.22290992736816406, "step": 2560, "valid_targets_mean": 1889.1, "valid_targets_min": 717 }, { "epoch": 2.5073313782991202, "grad_norm": 0.6164870341662336, "learning_rate": 3.242509507010791e-05, "loss": 0.2447, "loss_nan_ranks": 0, "loss_rank_avg": 0.23814159631729126, "step": 2565, "valid_targets_mean": 3004.0, "valid_targets_min": 792 }, { "epoch": 2.512218963831867, "grad_norm": 0.7245474670367238, "learning_rate": 3.238685553647927e-05, "loss": 0.2446, "loss_nan_ranks": 0, "loss_rank_avg": 0.21552202105522156, "step": 2570, "valid_targets_mean": 1887.2, "valid_targets_min": 753 }, { "epoch": 2.517106549364614, "grad_norm": 0.7481756056168739, "learning_rate": 3.2348542400862075e-05, "loss": 0.2542, "loss_nan_ranks": 0, "loss_rank_avg": 0.2534748911857605, "step": 2575, "valid_targets_mean": 2268.9, "valid_targets_min": 632 }, { "epoch": 2.5219941348973607, "grad_norm": 0.7224008501321807, "learning_rate": 3.231015589091079e-05, "loss": 0.2384, "loss_nan_ranks": 0, "loss_rank_avg": 0.2531392574310303, "step": 2580, "valid_targets_mean": 2338.6, "valid_targets_min": 882 }, { "epoch": 2.5268817204301075, "grad_norm": 0.7291916308037362, "learning_rate": 3.2271696234715866e-05, "loss": 0.2515, "loss_nan_ranks": 0, "loss_rank_avg": 0.2746545374393463, "step": 2585, "valid_targets_mean": 2363.4, "valid_targets_min": 843 }, { "epoch": 2.5317693059628543, "grad_norm": 1.0380167495946064, "learning_rate": 3.2233163660802387e-05, "loss": 0.2162, "loss_nan_ranks": 0, "loss_rank_avg": 0.21444106101989746, "step": 2590, "valid_targets_mean": 1598.9, "valid_targets_min": 732 }, { "epoch": 2.536656891495601, "grad_norm": 0.6544024445784333, "learning_rate": 3.219455839812871e-05, "loss": 0.2382, "loss_nan_ranks": 0, "loss_rank_avg": 0.21233348548412323, "step": 2595, "valid_targets_mean": 2456.2, "valid_targets_min": 1190 }, { "epoch": 2.541544477028348, "grad_norm": 0.628273229393255, "learning_rate": 3.21558806760851e-05, "loss": 0.2384, "loss_nan_ranks": 0, "loss_rank_avg": 0.2087693214416504, "step": 2600, "valid_targets_mean": 2745.5, "valid_targets_min": 700 }, { "epoch": 2.5464320625610948, "grad_norm": 0.6030343066322286, "learning_rate": 3.211713072449236e-05, "loss": 0.2335, "loss_nan_ranks": 0, "loss_rank_avg": 0.22888022661209106, "step": 2605, "valid_targets_mean": 2916.0, "valid_targets_min": 884 }, { "epoch": 2.5513196480938416, "grad_norm": 0.7152526807779622, "learning_rate": 3.207830877360051e-05, "loss": 0.2289, "loss_nan_ranks": 0, "loss_rank_avg": 0.22312462329864502, "step": 2610, "valid_targets_mean": 2152.1, "valid_targets_min": 924 }, { "epoch": 2.5562072336265884, "grad_norm": 0.6731642169381366, "learning_rate": 3.203941505408736e-05, "loss": 0.2477, "loss_nan_ranks": 0, "loss_rank_avg": 0.21658943593502045, "step": 2615, "valid_targets_mean": 2331.7, "valid_targets_min": 911 }, { "epoch": 2.5610948191593352, "grad_norm": 0.6639073922224608, "learning_rate": 3.200044979705717e-05, "loss": 0.2278, "loss_nan_ranks": 0, "loss_rank_avg": 0.22162654995918274, "step": 2620, "valid_targets_mean": 2536.9, "valid_targets_min": 765 }, { "epoch": 2.565982404692082, "grad_norm": 0.7471285143763177, "learning_rate": 3.1961413234039267e-05, "loss": 0.2357, "loss_nan_ranks": 0, "loss_rank_avg": 0.24290457367897034, "step": 2625, "valid_targets_mean": 2320.9, "valid_targets_min": 970 }, { "epoch": 2.570869990224829, "grad_norm": 0.7014404171599978, "learning_rate": 3.192230559698669e-05, "loss": 0.2428, "loss_nan_ranks": 0, "loss_rank_avg": 0.2300807237625122, "step": 2630, "valid_targets_mean": 2163.2, "valid_targets_min": 1099 }, { "epoch": 2.5757575757575757, "grad_norm": 0.7689908471529473, "learning_rate": 3.1883127118274795e-05, "loss": 0.2158, "loss_nan_ranks": 0, "loss_rank_avg": 0.22766678035259247, "step": 2635, "valid_targets_mean": 2223.1, "valid_targets_min": 758 }, { "epoch": 2.5806451612903225, "grad_norm": 0.7524156572486015, "learning_rate": 3.1843878030699843e-05, "loss": 0.242, "loss_nan_ranks": 0, "loss_rank_avg": 0.22420425713062286, "step": 2640, "valid_targets_mean": 2231.3, "valid_targets_min": 900 }, { "epoch": 2.5855327468230693, "grad_norm": 0.6206868507870091, "learning_rate": 3.180455856747768e-05, "loss": 0.229, "loss_nan_ranks": 0, "loss_rank_avg": 0.23075121641159058, "step": 2645, "valid_targets_mean": 2600.9, "valid_targets_min": 1010 }, { "epoch": 2.590420332355816, "grad_norm": 0.90695340921089, "learning_rate": 3.1765168962242314e-05, "loss": 0.2427, "loss_nan_ranks": 0, "loss_rank_avg": 0.2378099113702774, "step": 2650, "valid_targets_mean": 3146.6, "valid_targets_min": 656 }, { "epoch": 2.595307917888563, "grad_norm": 0.7522437194650009, "learning_rate": 3.172570944904454e-05, "loss": 0.2519, "loss_nan_ranks": 0, "loss_rank_avg": 0.24361330270767212, "step": 2655, "valid_targets_mean": 1933.7, "valid_targets_min": 607 }, { "epoch": 2.60019550342131, "grad_norm": 0.7385794100286881, "learning_rate": 3.168618026235052e-05, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.2449553906917572, "step": 2660, "valid_targets_mean": 2196.0, "valid_targets_min": 734 }, { "epoch": 2.6050830889540566, "grad_norm": 0.6811321355025456, "learning_rate": 3.164658163704044e-05, "loss": 0.2357, "loss_nan_ranks": 0, "loss_rank_avg": 0.2384980171918869, "step": 2665, "valid_targets_mean": 2501.2, "valid_targets_min": 826 }, { "epoch": 2.6099706744868034, "grad_norm": 0.7081141329414362, "learning_rate": 3.160691380840705e-05, "loss": 0.2397, "loss_nan_ranks": 0, "loss_rank_avg": 0.22777023911476135, "step": 2670, "valid_targets_mean": 2467.4, "valid_targets_min": 747 }, { "epoch": 2.6148582600195502, "grad_norm": 0.6830393989705583, "learning_rate": 3.156717701215433e-05, "loss": 0.2262, "loss_nan_ranks": 0, "loss_rank_avg": 0.21992099285125732, "step": 2675, "valid_targets_mean": 2317.6, "valid_targets_min": 950 }, { "epoch": 2.619745845552297, "grad_norm": 0.8012433854096802, "learning_rate": 3.152737148439608e-05, "loss": 0.2469, "loss_nan_ranks": 0, "loss_rank_avg": 0.27927660942077637, "step": 2680, "valid_targets_mean": 2117.2, "valid_targets_min": 789 }, { "epoch": 2.624633431085044, "grad_norm": 0.6934903380108935, "learning_rate": 3.1487497461654435e-05, "loss": 0.2424, "loss_nan_ranks": 0, "loss_rank_avg": 0.25259506702423096, "step": 2685, "valid_targets_mean": 2417.8, "valid_targets_min": 791 }, { "epoch": 2.6295210166177907, "grad_norm": 0.7359216165404469, "learning_rate": 3.144755518085859e-05, "loss": 0.234, "loss_nan_ranks": 0, "loss_rank_avg": 0.24347510933876038, "step": 2690, "valid_targets_mean": 2227.3, "valid_targets_min": 1027 }, { "epoch": 2.6344086021505375, "grad_norm": 0.7767880726332548, "learning_rate": 3.1407544879343284e-05, "loss": 0.2373, "loss_nan_ranks": 0, "loss_rank_avg": 0.24625647068023682, "step": 2695, "valid_targets_mean": 1754.9, "valid_targets_min": 689 }, { "epoch": 2.6392961876832843, "grad_norm": 0.696674510993026, "learning_rate": 3.136746679484746e-05, "loss": 0.2366, "loss_nan_ranks": 0, "loss_rank_avg": 0.2380523532629013, "step": 2700, "valid_targets_mean": 2332.2, "valid_targets_min": 790 }, { "epoch": 2.644183773216031, "grad_norm": 0.6694545044109874, "learning_rate": 3.1327321165512784e-05, "loss": 0.2294, "loss_nan_ranks": 0, "loss_rank_avg": 0.2502917945384979, "step": 2705, "valid_targets_mean": 2535.8, "valid_targets_min": 1282 }, { "epoch": 2.649071358748778, "grad_norm": 0.6987439481563695, "learning_rate": 3.128710822988231e-05, "loss": 0.2343, "loss_nan_ranks": 0, "loss_rank_avg": 0.21862663328647614, "step": 2710, "valid_targets_mean": 1921.0, "valid_targets_min": 823 }, { "epoch": 2.653958944281525, "grad_norm": 0.6914300177187406, "learning_rate": 3.1246828226899e-05, "loss": 0.2345, "loss_nan_ranks": 0, "loss_rank_avg": 0.22969259321689606, "step": 2715, "valid_targets_mean": 2253.5, "valid_targets_min": 824 }, { "epoch": 2.6588465298142716, "grad_norm": 0.602200287873372, "learning_rate": 3.120648139590435e-05, "loss": 0.2455, "loss_nan_ranks": 0, "loss_rank_avg": 0.24584728479385376, "step": 2720, "valid_targets_mean": 3155.4, "valid_targets_min": 1278 }, { "epoch": 2.6637341153470184, "grad_norm": 0.7075447193702563, "learning_rate": 3.1166067976636906e-05, "loss": 0.2295, "loss_nan_ranks": 0, "loss_rank_avg": 0.2338378131389618, "step": 2725, "valid_targets_mean": 2341.6, "valid_targets_min": 533 }, { "epoch": 2.6686217008797652, "grad_norm": 0.6716820653818237, "learning_rate": 3.1125588209230914e-05, "loss": 0.2499, "loss_nan_ranks": 0, "loss_rank_avg": 0.234563410282135, "step": 2730, "valid_targets_mean": 2494.7, "valid_targets_min": 756 }, { "epoch": 2.673509286412512, "grad_norm": 0.6350189009309046, "learning_rate": 3.108504233421482e-05, "loss": 0.2304, "loss_nan_ranks": 0, "loss_rank_avg": 0.2456614375114441, "step": 2735, "valid_targets_mean": 2821.6, "valid_targets_min": 761 }, { "epoch": 2.678396871945259, "grad_norm": 0.6980749472004388, "learning_rate": 3.104443059250992e-05, "loss": 0.2231, "loss_nan_ranks": 0, "loss_rank_avg": 0.24124208092689514, "step": 2740, "valid_targets_mean": 2521.0, "valid_targets_min": 992 }, { "epoch": 2.6832844574780057, "grad_norm": 0.67259645483737, "learning_rate": 3.1003753225428855e-05, "loss": 0.2325, "loss_nan_ranks": 0, "loss_rank_avg": 0.22315667569637299, "step": 2745, "valid_targets_mean": 2475.1, "valid_targets_min": 859 }, { "epoch": 2.688172043010753, "grad_norm": 0.6681313606790765, "learning_rate": 3.0963010474674217e-05, "loss": 0.2389, "loss_nan_ranks": 0, "loss_rank_avg": 0.247651606798172, "step": 2750, "valid_targets_mean": 2558.2, "valid_targets_min": 634 }, { "epoch": 2.6930596285435, "grad_norm": 0.6859361683493692, "learning_rate": 3.0922202582337115e-05, "loss": 0.2164, "loss_nan_ranks": 0, "loss_rank_avg": 0.19534924626350403, "step": 2755, "valid_targets_mean": 2257.4, "valid_targets_min": 876 }, { "epoch": 2.6979472140762466, "grad_norm": 0.6985818000049671, "learning_rate": 3.08813297908957e-05, "loss": 0.2441, "loss_nan_ranks": 0, "loss_rank_avg": 0.25439029932022095, "step": 2760, "valid_targets_mean": 2687.1, "valid_targets_min": 958 }, { "epoch": 2.7028347996089934, "grad_norm": 0.6566705673923328, "learning_rate": 3.084039234321379e-05, "loss": 0.2464, "loss_nan_ranks": 0, "loss_rank_avg": 0.2557886242866516, "step": 2765, "valid_targets_mean": 2698.4, "valid_targets_min": 549 }, { "epoch": 2.7077223851417402, "grad_norm": 0.6165188909289334, "learning_rate": 3.079939048253934e-05, "loss": 0.2493, "loss_nan_ranks": 0, "loss_rank_avg": 0.24600160121917725, "step": 2770, "valid_targets_mean": 2858.0, "valid_targets_min": 978 }, { "epoch": 2.712609970674487, "grad_norm": 0.6790410549127608, "learning_rate": 3.0758324452503065e-05, "loss": 0.2311, "loss_nan_ranks": 0, "loss_rank_avg": 0.2445409744977951, "step": 2775, "valid_targets_mean": 2667.5, "valid_targets_min": 740 }, { "epoch": 2.717497556207234, "grad_norm": 0.6974981732520593, "learning_rate": 3.071719449711699e-05, "loss": 0.2309, "loss_nan_ranks": 0, "loss_rank_avg": 0.23706629872322083, "step": 2780, "valid_targets_mean": 2513.4, "valid_targets_min": 1093 }, { "epoch": 2.7223851417399807, "grad_norm": 0.6737555976917173, "learning_rate": 3.0676000860772956e-05, "loss": 0.2231, "loss_nan_ranks": 0, "loss_rank_avg": 0.2328021228313446, "step": 2785, "valid_targets_mean": 2313.6, "valid_targets_min": 684 }, { "epoch": 2.7272727272727275, "grad_norm": 1.2575294841809628, "learning_rate": 3.063474378824119e-05, "loss": 0.2296, "loss_nan_ranks": 0, "loss_rank_avg": 0.23096132278442383, "step": 2790, "valid_targets_mean": 1920.2, "valid_targets_min": 891 }, { "epoch": 2.7321603128054743, "grad_norm": 0.6273895966528873, "learning_rate": 3.0593423524668864e-05, "loss": 0.2443, "loss_nan_ranks": 0, "loss_rank_avg": 0.23225541412830353, "step": 2795, "valid_targets_mean": 2795.9, "valid_targets_min": 815 }, { "epoch": 2.737047898338221, "grad_norm": 0.750013291851974, "learning_rate": 3.055204031557863e-05, "loss": 0.2184, "loss_nan_ranks": 0, "loss_rank_avg": 0.19314704835414886, "step": 2800, "valid_targets_mean": 1944.0, "valid_targets_min": 839 }, { "epoch": 2.741935483870968, "grad_norm": 0.665083340706297, "learning_rate": 3.0510594406867153e-05, "loss": 0.2359, "loss_nan_ranks": 0, "loss_rank_avg": 0.23232056200504303, "step": 2805, "valid_targets_mean": 2747.2, "valid_targets_min": 893 }, { "epoch": 2.746823069403715, "grad_norm": 0.6430016293534321, "learning_rate": 3.0469086044803663e-05, "loss": 0.2392, "loss_nan_ranks": 0, "loss_rank_avg": 0.22754496335983276, "step": 2810, "valid_targets_mean": 2441.9, "valid_targets_min": 697 }, { "epoch": 2.7517106549364616, "grad_norm": 0.6672184525189786, "learning_rate": 3.0427515476028468e-05, "loss": 0.2329, "loss_nan_ranks": 0, "loss_rank_avg": 0.2377731204032898, "step": 2815, "valid_targets_mean": 2553.1, "valid_targets_min": 1144 }, { "epoch": 2.7565982404692084, "grad_norm": 0.6337998207855043, "learning_rate": 3.038588294755151e-05, "loss": 0.223, "loss_nan_ranks": 0, "loss_rank_avg": 0.2279859483242035, "step": 2820, "valid_targets_mean": 2683.7, "valid_targets_min": 597 }, { "epoch": 2.7614858260019552, "grad_norm": 0.6415879365422061, "learning_rate": 3.034418870675092e-05, "loss": 0.2518, "loss_nan_ranks": 0, "loss_rank_avg": 0.25901520252227783, "step": 2825, "valid_targets_mean": 3471.3, "valid_targets_min": 771 }, { "epoch": 2.766373411534702, "grad_norm": 0.6903646046533939, "learning_rate": 3.0302433001371475e-05, "loss": 0.2439, "loss_nan_ranks": 0, "loss_rank_avg": 0.2619539499282837, "step": 2830, "valid_targets_mean": 2333.2, "valid_targets_min": 890 }, { "epoch": 2.771260997067449, "grad_norm": 0.6243991438233805, "learning_rate": 3.02606160795232e-05, "loss": 0.2373, "loss_nan_ranks": 0, "loss_rank_avg": 0.2319139838218689, "step": 2835, "valid_targets_mean": 2468.5, "valid_targets_min": 646 }, { "epoch": 2.7761485826001957, "grad_norm": 0.640200588738358, "learning_rate": 3.021873818967986e-05, "loss": 0.2408, "loss_nan_ranks": 0, "loss_rank_avg": 0.20535393059253693, "step": 2840, "valid_targets_mean": 3473.6, "valid_targets_min": 978 }, { "epoch": 2.7810361681329425, "grad_norm": 0.6766646508609335, "learning_rate": 3.0176799580677477e-05, "loss": 0.2389, "loss_nan_ranks": 0, "loss_rank_avg": 0.23535458743572235, "step": 2845, "valid_targets_mean": 2393.3, "valid_targets_min": 861 }, { "epoch": 2.7859237536656893, "grad_norm": 0.6733786925421605, "learning_rate": 3.013480050171289e-05, "loss": 0.2263, "loss_nan_ranks": 0, "loss_rank_avg": 0.23346024751663208, "step": 2850, "valid_targets_mean": 2390.7, "valid_targets_min": 728 }, { "epoch": 2.790811339198436, "grad_norm": 0.724460745453377, "learning_rate": 3.009274120234221e-05, "loss": 0.2305, "loss_nan_ranks": 0, "loss_rank_avg": 0.2303357571363449, "step": 2855, "valid_targets_mean": 2362.2, "valid_targets_min": 786 }, { "epoch": 2.795698924731183, "grad_norm": 0.6645986334487373, "learning_rate": 3.0050621932479402e-05, "loss": 0.2294, "loss_nan_ranks": 0, "loss_rank_avg": 0.22619573771953583, "step": 2860, "valid_targets_mean": 2401.0, "valid_targets_min": 832 }, { "epoch": 2.80058651026393, "grad_norm": 0.6600838806245943, "learning_rate": 3.0008442942394763e-05, "loss": 0.2426, "loss_nan_ranks": 0, "loss_rank_avg": 0.26058539748191833, "step": 2865, "valid_targets_mean": 2661.4, "valid_targets_min": 1131 }, { "epoch": 2.8054740957966766, "grad_norm": 0.64943249977253, "learning_rate": 2.9966204482713447e-05, "loss": 0.2419, "loss_nan_ranks": 0, "loss_rank_avg": 0.22463732957839966, "step": 2870, "valid_targets_mean": 2495.8, "valid_targets_min": 680 }, { "epoch": 2.8103616813294234, "grad_norm": 0.6786818865745439, "learning_rate": 2.9923906804413966e-05, "loss": 0.2326, "loss_nan_ranks": 0, "loss_rank_avg": 0.2178959995508194, "step": 2875, "valid_targets_mean": 2419.3, "valid_targets_min": 826 }, { "epoch": 2.8152492668621703, "grad_norm": 0.5944406321947248, "learning_rate": 2.988155015882671e-05, "loss": 0.2359, "loss_nan_ranks": 0, "loss_rank_avg": 0.23274701833724976, "step": 2880, "valid_targets_mean": 3016.2, "valid_targets_min": 906 }, { "epoch": 2.820136852394917, "grad_norm": 0.7333620836779235, "learning_rate": 2.9839134797632448e-05, "loss": 0.2363, "loss_nan_ranks": 0, "loss_rank_avg": 0.2247675657272339, "step": 2885, "valid_targets_mean": 1883.5, "valid_targets_min": 635 }, { "epoch": 2.825024437927664, "grad_norm": 0.6805311682642338, "learning_rate": 2.9796660972860843e-05, "loss": 0.2284, "loss_nan_ranks": 0, "loss_rank_avg": 0.23136526346206665, "step": 2890, "valid_targets_mean": 2278.5, "valid_targets_min": 807 }, { "epoch": 2.8299120234604107, "grad_norm": 0.7830726431275282, "learning_rate": 2.975412893688893e-05, "loss": 0.2374, "loss_nan_ranks": 0, "loss_rank_avg": 0.24189212918281555, "step": 2895, "valid_targets_mean": 1769.8, "valid_targets_min": 663 }, { "epoch": 2.8347996089931575, "grad_norm": 0.6769811140537966, "learning_rate": 2.9711538942439637e-05, "loss": 0.2322, "loss_nan_ranks": 0, "loss_rank_avg": 0.22272557020187378, "step": 2900, "valid_targets_mean": 2156.8, "valid_targets_min": 876 }, { "epoch": 2.8396871945259043, "grad_norm": 0.7674529053801956, "learning_rate": 2.9668891242580287e-05, "loss": 0.2392, "loss_nan_ranks": 0, "loss_rank_avg": 0.2575834095478058, "step": 2905, "valid_targets_mean": 2216.5, "valid_targets_min": 744 }, { "epoch": 2.844574780058651, "grad_norm": 0.6658603801212766, "learning_rate": 2.962618609072108e-05, "loss": 0.2373, "loss_nan_ranks": 0, "loss_rank_avg": 0.25467610359191895, "step": 2910, "valid_targets_mean": 2915.1, "valid_targets_min": 694 }, { "epoch": 2.849462365591398, "grad_norm": 0.62994164165599, "learning_rate": 2.9583423740613583e-05, "loss": 0.2469, "loss_nan_ranks": 0, "loss_rank_avg": 0.25572115182876587, "step": 2915, "valid_targets_mean": 2733.2, "valid_targets_min": 1002 }, { "epoch": 2.854349951124145, "grad_norm": 0.7802082469784795, "learning_rate": 2.954060444634924e-05, "loss": 0.2347, "loss_nan_ranks": 0, "loss_rank_avg": 0.21022462844848633, "step": 2920, "valid_targets_mean": 1662.9, "valid_targets_min": 749 }, { "epoch": 2.8592375366568916, "grad_norm": 0.7025252669117502, "learning_rate": 2.9497728462357854e-05, "loss": 0.2285, "loss_nan_ranks": 0, "loss_rank_avg": 0.2211170792579651, "step": 2925, "valid_targets_mean": 1993.3, "valid_targets_min": 695 }, { "epoch": 2.8641251221896384, "grad_norm": 0.5702454921369775, "learning_rate": 2.9454796043406082e-05, "loss": 0.2325, "loss_nan_ranks": 0, "loss_rank_avg": 0.22452156245708466, "step": 2930, "valid_targets_mean": 3428.3, "valid_targets_min": 765 }, { "epoch": 2.8690127077223853, "grad_norm": 0.737348955153242, "learning_rate": 2.9411807444595903e-05, "loss": 0.2252, "loss_nan_ranks": 0, "loss_rank_avg": 0.21879072487354279, "step": 2935, "valid_targets_mean": 2037.2, "valid_targets_min": 636 }, { "epoch": 2.873900293255132, "grad_norm": 0.7194505785174569, "learning_rate": 2.936876292136311e-05, "loss": 0.238, "loss_nan_ranks": 0, "loss_rank_avg": 0.2638698220252991, "step": 2940, "valid_targets_mean": 2237.4, "valid_targets_min": 834 }, { "epoch": 2.878787878787879, "grad_norm": 0.7215626747806759, "learning_rate": 2.9325662729475808e-05, "loss": 0.2369, "loss_nan_ranks": 0, "loss_rank_avg": 0.24015557765960693, "step": 2945, "valid_targets_mean": 2293.9, "valid_targets_min": 752 }, { "epoch": 2.8836754643206257, "grad_norm": 0.6723838618072419, "learning_rate": 2.928250712503288e-05, "loss": 0.2231, "loss_nan_ranks": 0, "loss_rank_avg": 0.21491815149784088, "step": 2950, "valid_targets_mean": 2184.8, "valid_targets_min": 979 }, { "epoch": 2.8885630498533725, "grad_norm": 0.7739998699952924, "learning_rate": 2.9239296364462467e-05, "loss": 0.238, "loss_nan_ranks": 0, "loss_rank_avg": 0.25200653076171875, "step": 2955, "valid_targets_mean": 2104.8, "valid_targets_min": 815 }, { "epoch": 2.8934506353861194, "grad_norm": 0.6661883736388912, "learning_rate": 2.919603070452043e-05, "loss": 0.2376, "loss_nan_ranks": 0, "loss_rank_avg": 0.24104368686676025, "step": 2960, "valid_targets_mean": 2636.2, "valid_targets_min": 821 }, { "epoch": 2.898338220918866, "grad_norm": 0.777296307434507, "learning_rate": 2.915271040228886e-05, "loss": 0.227, "loss_nan_ranks": 0, "loss_rank_avg": 0.22833505272865295, "step": 2965, "valid_targets_mean": 1935.4, "valid_targets_min": 892 }, { "epoch": 2.903225806451613, "grad_norm": 0.6089518142750111, "learning_rate": 2.9109335715174517e-05, "loss": 0.233, "loss_nan_ranks": 0, "loss_rank_avg": 0.23753002285957336, "step": 2970, "valid_targets_mean": 3033.2, "valid_targets_min": 1109 }, { "epoch": 2.90811339198436, "grad_norm": 0.782726714582175, "learning_rate": 2.9065906900907318e-05, "loss": 0.2335, "loss_nan_ranks": 0, "loss_rank_avg": 0.23450714349746704, "step": 2975, "valid_targets_mean": 1985.1, "valid_targets_min": 770 }, { "epoch": 2.9130009775171066, "grad_norm": 0.6413112020747412, "learning_rate": 2.9022424217538797e-05, "loss": 0.2295, "loss_nan_ranks": 0, "loss_rank_avg": 0.2412833422422409, "step": 2980, "valid_targets_mean": 2716.9, "valid_targets_min": 985 }, { "epoch": 2.9178885630498534, "grad_norm": 0.6854532986235314, "learning_rate": 2.8978887923440573e-05, "loss": 0.2295, "loss_nan_ranks": 0, "loss_rank_avg": 0.23968929052352905, "step": 2985, "valid_targets_mean": 2625.2, "valid_targets_min": 940 }, { "epoch": 2.9227761485826003, "grad_norm": 0.6876034052530781, "learning_rate": 2.8935298277302827e-05, "loss": 0.2392, "loss_nan_ranks": 0, "loss_rank_avg": 0.24147212505340576, "step": 2990, "valid_targets_mean": 2415.8, "valid_targets_min": 727 }, { "epoch": 2.927663734115347, "grad_norm": 0.6592399161754122, "learning_rate": 2.8891655538132747e-05, "loss": 0.2374, "loss_nan_ranks": 0, "loss_rank_avg": 0.24528644979000092, "step": 2995, "valid_targets_mean": 2493.1, "valid_targets_min": 879 }, { "epoch": 2.932551319648094, "grad_norm": 0.7330835802360961, "learning_rate": 2.8847959965252997e-05, "loss": 0.2362, "loss_nan_ranks": 0, "loss_rank_avg": 0.24110592901706696, "step": 3000, "valid_targets_mean": 2464.8, "valid_targets_min": 714 }, { "epoch": 2.9374389051808407, "grad_norm": 0.9963806436549506, "learning_rate": 2.8804211818300175e-05, "loss": 0.2363, "loss_nan_ranks": 0, "loss_rank_avg": 0.24917423725128174, "step": 3005, "valid_targets_mean": 2112.3, "valid_targets_min": 635 }, { "epoch": 2.9423264907135875, "grad_norm": 0.7093645468792228, "learning_rate": 2.8760411357223274e-05, "loss": 0.2496, "loss_nan_ranks": 0, "loss_rank_avg": 0.256412148475647, "step": 3010, "valid_targets_mean": 2230.4, "valid_targets_min": 514 }, { "epoch": 2.9472140762463344, "grad_norm": 0.6313278112245672, "learning_rate": 2.8716558842282133e-05, "loss": 0.2278, "loss_nan_ranks": 0, "loss_rank_avg": 0.21212854981422424, "step": 3015, "valid_targets_mean": 2637.0, "valid_targets_min": 916 }, { "epoch": 2.952101661779081, "grad_norm": 0.5943727879588198, "learning_rate": 2.8672654534045893e-05, "loss": 0.2323, "loss_nan_ranks": 0, "loss_rank_avg": 0.22816044092178345, "step": 3020, "valid_targets_mean": 3090.9, "valid_targets_min": 819 }, { "epoch": 2.956989247311828, "grad_norm": 0.6972022185831341, "learning_rate": 2.8628698693391454e-05, "loss": 0.2297, "loss_nan_ranks": 0, "loss_rank_avg": 0.24018850922584534, "step": 3025, "valid_targets_mean": 2340.3, "valid_targets_min": 807 }, { "epoch": 2.961876832844575, "grad_norm": 0.6777221287793921, "learning_rate": 2.8584691581501904e-05, "loss": 0.2387, "loss_nan_ranks": 0, "loss_rank_avg": 0.22792454063892365, "step": 3030, "valid_targets_mean": 2147.8, "valid_targets_min": 929 }, { "epoch": 2.9667644183773216, "grad_norm": 0.608921349958511, "learning_rate": 2.8540633459864984e-05, "loss": 0.2218, "loss_nan_ranks": 0, "loss_rank_avg": 0.22310322523117065, "step": 3035, "valid_targets_mean": 2694.1, "valid_targets_min": 714 }, { "epoch": 2.9716520039100685, "grad_norm": 0.6960978391554294, "learning_rate": 2.8496524590271558e-05, "loss": 0.2428, "loss_nan_ranks": 0, "loss_rank_avg": 0.25981682538986206, "step": 3040, "valid_targets_mean": 2517.1, "valid_targets_min": 940 }, { "epoch": 2.9765395894428153, "grad_norm": 0.7378583701878564, "learning_rate": 2.8452365234813992e-05, "loss": 0.2267, "loss_nan_ranks": 0, "loss_rank_avg": 0.1961268186569214, "step": 3045, "valid_targets_mean": 2311.8, "valid_targets_min": 740 }, { "epoch": 2.981427174975562, "grad_norm": 0.6720248721061973, "learning_rate": 2.8408155655884666e-05, "loss": 0.2336, "loss_nan_ranks": 0, "loss_rank_avg": 0.2390064001083374, "step": 3050, "valid_targets_mean": 2484.6, "valid_targets_min": 1076 }, { "epoch": 2.986314760508309, "grad_norm": 0.6878264817723515, "learning_rate": 2.836389611617437e-05, "loss": 0.241, "loss_nan_ranks": 0, "loss_rank_avg": 0.2337898164987564, "step": 3055, "valid_targets_mean": 2284.5, "valid_targets_min": 1266 }, { "epoch": 2.9912023460410557, "grad_norm": 0.6966111553176655, "learning_rate": 2.8319586878670767e-05, "loss": 0.246, "loss_nan_ranks": 0, "loss_rank_avg": 0.22837823629379272, "step": 3060, "valid_targets_mean": 2068.6, "valid_targets_min": 772 }, { "epoch": 2.9960899315738025, "grad_norm": 0.6945196129457747, "learning_rate": 2.827522820665681e-05, "loss": 0.2375, "loss_nan_ranks": 0, "loss_rank_avg": 0.2056921422481537, "step": 3065, "valid_targets_mean": 2009.1, "valid_targets_min": 612 }, { "epoch": 3.0009775171065494, "grad_norm": 0.6719993247544616, "learning_rate": 2.82308203637092e-05, "loss": 0.2409, "loss_nan_ranks": 0, "loss_rank_avg": 0.2267838567495346, "step": 3070, "valid_targets_mean": 2419.8, "valid_targets_min": 732 }, { "epoch": 3.005865102639296, "grad_norm": 0.6667645399427046, "learning_rate": 2.8186363613696807e-05, "loss": 0.2132, "loss_nan_ranks": 0, "loss_rank_avg": 0.22658130526542664, "step": 3075, "valid_targets_mean": 2837.1, "valid_targets_min": 648 }, { "epoch": 3.010752688172043, "grad_norm": 0.6995064995237391, "learning_rate": 2.81418582207791e-05, "loss": 0.1986, "loss_nan_ranks": 0, "loss_rank_avg": 0.21117915213108063, "step": 3080, "valid_targets_mean": 2488.8, "valid_targets_min": 746 }, { "epoch": 3.01564027370479, "grad_norm": 0.7816935143677926, "learning_rate": 2.809730444940459e-05, "loss": 0.2033, "loss_nan_ranks": 0, "loss_rank_avg": 0.19485579431056976, "step": 3085, "valid_targets_mean": 1877.2, "valid_targets_min": 585 }, { "epoch": 3.0205278592375366, "grad_norm": 0.6280789848534472, "learning_rate": 2.8052702564309232e-05, "loss": 0.1944, "loss_nan_ranks": 0, "loss_rank_avg": 0.18880394101142883, "step": 3090, "valid_targets_mean": 2680.8, "valid_targets_min": 754 }, { "epoch": 3.0254154447702835, "grad_norm": 0.7246655595987659, "learning_rate": 2.8008052830514882e-05, "loss": 0.2121, "loss_nan_ranks": 0, "loss_rank_avg": 0.21295440196990967, "step": 3095, "valid_targets_mean": 2274.8, "valid_targets_min": 788 }, { "epoch": 3.0303030303030303, "grad_norm": 0.7042756737696498, "learning_rate": 2.7963355513327717e-05, "loss": 0.2091, "loss_nan_ranks": 0, "loss_rank_avg": 0.23234760761260986, "step": 3100, "valid_targets_mean": 2904.4, "valid_targets_min": 708 }, { "epoch": 3.035190615835777, "grad_norm": 0.7467994069578198, "learning_rate": 2.7918610878336644e-05, "loss": 0.2076, "loss_nan_ranks": 0, "loss_rank_avg": 0.22012445330619812, "step": 3105, "valid_targets_mean": 2543.5, "valid_targets_min": 893 }, { "epoch": 3.040078201368524, "grad_norm": 0.6581294580719984, "learning_rate": 2.7873819191411732e-05, "loss": 0.202, "loss_nan_ranks": 0, "loss_rank_avg": 0.1838349997997284, "step": 3110, "valid_targets_mean": 2560.5, "valid_targets_min": 1434 }, { "epoch": 3.0449657869012707, "grad_norm": 0.6275202980378985, "learning_rate": 2.782898071870261e-05, "loss": 0.2027, "loss_nan_ranks": 0, "loss_rank_avg": 0.1899479627609253, "step": 3115, "valid_targets_mean": 2978.4, "valid_targets_min": 723 }, { "epoch": 3.0498533724340176, "grad_norm": 0.708666227527697, "learning_rate": 2.7784095726636945e-05, "loss": 0.1977, "loss_nan_ranks": 0, "loss_rank_avg": 0.2058933973312378, "step": 3120, "valid_targets_mean": 2619.5, "valid_targets_min": 1038 }, { "epoch": 3.0547409579667644, "grad_norm": 0.7252823344406546, "learning_rate": 2.773916448191879e-05, "loss": 0.2079, "loss_nan_ranks": 0, "loss_rank_avg": 0.2228691130876541, "step": 3125, "valid_targets_mean": 2502.4, "valid_targets_min": 855 }, { "epoch": 3.059628543499511, "grad_norm": 0.6775893290948455, "learning_rate": 2.7694187251527034e-05, "loss": 0.1979, "loss_nan_ranks": 0, "loss_rank_avg": 0.20811831951141357, "step": 3130, "valid_targets_mean": 2852.7, "valid_targets_min": 834 }, { "epoch": 3.064516129032258, "grad_norm": 0.6750667682794524, "learning_rate": 2.7649164302713818e-05, "loss": 0.1971, "loss_nan_ranks": 0, "loss_rank_avg": 0.2103792279958725, "step": 3135, "valid_targets_mean": 2695.4, "valid_targets_min": 1083 }, { "epoch": 3.069403714565005, "grad_norm": 0.6452750671952329, "learning_rate": 2.7604095903002925e-05, "loss": 0.2068, "loss_nan_ranks": 0, "loss_rank_avg": 0.19791629910469055, "step": 3140, "valid_targets_mean": 2622.8, "valid_targets_min": 851 }, { "epoch": 3.0742913000977516, "grad_norm": 0.6855575675327805, "learning_rate": 2.7558982320188228e-05, "loss": 0.1984, "loss_nan_ranks": 0, "loss_rank_avg": 0.20340736210346222, "step": 3145, "valid_targets_mean": 2924.1, "valid_targets_min": 858 }, { "epoch": 3.0791788856304985, "grad_norm": 0.7823747155692843, "learning_rate": 2.7513823822332044e-05, "loss": 0.2005, "loss_nan_ranks": 0, "loss_rank_avg": 0.19628237187862396, "step": 3150, "valid_targets_mean": 1840.7, "valid_targets_min": 759 }, { "epoch": 3.0840664711632453, "grad_norm": 0.8146578281379756, "learning_rate": 2.74686206777636e-05, "loss": 0.1991, "loss_nan_ranks": 0, "loss_rank_avg": 0.20766061544418335, "step": 3155, "valid_targets_mean": 1969.3, "valid_targets_min": 918 }, { "epoch": 3.088954056695992, "grad_norm": 0.6883738938370201, "learning_rate": 2.7423373155077403e-05, "loss": 0.1978, "loss_nan_ranks": 0, "loss_rank_avg": 0.18747478723526, "step": 3160, "valid_targets_mean": 2373.4, "valid_targets_min": 856 }, { "epoch": 3.093841642228739, "grad_norm": 0.7077726637761635, "learning_rate": 2.7378081523131644e-05, "loss": 0.1966, "loss_nan_ranks": 0, "loss_rank_avg": 0.20626375079154968, "step": 3165, "valid_targets_mean": 2385.8, "valid_targets_min": 683 }, { "epoch": 3.0987292277614857, "grad_norm": 0.8627305595439234, "learning_rate": 2.7332746051046616e-05, "loss": 0.2109, "loss_nan_ranks": 0, "loss_rank_avg": 0.21347269415855408, "step": 3170, "valid_targets_mean": 2014.2, "valid_targets_min": 734 }, { "epoch": 3.1036168132942326, "grad_norm": 0.7893777089075921, "learning_rate": 2.72873670082031e-05, "loss": 0.2108, "loss_nan_ranks": 0, "loss_rank_avg": 0.2146587371826172, "step": 3175, "valid_targets_mean": 2289.4, "valid_targets_min": 642 }, { "epoch": 3.1085043988269794, "grad_norm": 0.8273291714086848, "learning_rate": 2.7241944664240792e-05, "loss": 0.191, "loss_nan_ranks": 0, "loss_rank_avg": 0.16076461970806122, "step": 3180, "valid_targets_mean": 1337.8, "valid_targets_min": 514 }, { "epoch": 3.113391984359726, "grad_norm": 0.729684484993837, "learning_rate": 2.719647928905666e-05, "loss": 0.1985, "loss_nan_ranks": 0, "loss_rank_avg": 0.20329692959785461, "step": 3185, "valid_targets_mean": 2202.4, "valid_targets_min": 1251 }, { "epoch": 3.118279569892473, "grad_norm": 0.6526019445711841, "learning_rate": 2.715097115280337e-05, "loss": 0.2076, "loss_nan_ranks": 0, "loss_rank_avg": 0.19159898161888123, "step": 3190, "valid_targets_mean": 2702.8, "valid_targets_min": 793 }, { "epoch": 3.12316715542522, "grad_norm": 0.7498464955317224, "learning_rate": 2.7105420525887667e-05, "loss": 0.1991, "loss_nan_ranks": 0, "loss_rank_avg": 0.2095525860786438, "step": 3195, "valid_targets_mean": 2154.8, "valid_targets_min": 916 }, { "epoch": 3.1280547409579667, "grad_norm": 0.7063138314214019, "learning_rate": 2.7059827678968775e-05, "loss": 0.2052, "loss_nan_ranks": 0, "loss_rank_avg": 0.19605648517608643, "step": 3200, "valid_targets_mean": 2327.6, "valid_targets_min": 916 }, { "epoch": 3.1329423264907135, "grad_norm": 0.759819492933154, "learning_rate": 2.7014192882956795e-05, "loss": 0.204, "loss_nan_ranks": 0, "loss_rank_avg": 0.2000146508216858, "step": 3205, "valid_targets_mean": 2217.5, "valid_targets_min": 682 }, { "epoch": 3.1378299120234603, "grad_norm": 0.7249197896837959, "learning_rate": 2.6968516409011073e-05, "loss": 0.2096, "loss_nan_ranks": 0, "loss_rank_avg": 0.2277396023273468, "step": 3210, "valid_targets_mean": 2899.7, "valid_targets_min": 905 }, { "epoch": 3.142717497556207, "grad_norm": 0.6645341527478739, "learning_rate": 2.6922798528538615e-05, "loss": 0.1893, "loss_nan_ranks": 0, "loss_rank_avg": 0.1898479163646698, "step": 3215, "valid_targets_mean": 2493.7, "valid_targets_min": 697 }, { "epoch": 3.147605083088954, "grad_norm": 0.7890579447239405, "learning_rate": 2.6877039513192452e-05, "loss": 0.1952, "loss_nan_ranks": 0, "loss_rank_avg": 0.1876201033592224, "step": 3220, "valid_targets_mean": 2037.3, "valid_targets_min": 916 }, { "epoch": 3.1524926686217007, "grad_norm": 0.7907814247477751, "learning_rate": 2.6831239634870044e-05, "loss": 0.2053, "loss_nan_ranks": 0, "loss_rank_avg": 0.19796785712242126, "step": 3225, "valid_targets_mean": 1733.1, "valid_targets_min": 742 }, { "epoch": 3.1573802541544476, "grad_norm": 0.7070573564286917, "learning_rate": 2.6785399165711662e-05, "loss": 0.2101, "loss_nan_ranks": 0, "loss_rank_avg": 0.19448038935661316, "step": 3230, "valid_targets_mean": 2516.5, "valid_targets_min": 1012 }, { "epoch": 3.1622678396871944, "grad_norm": 0.7496403178879768, "learning_rate": 2.673951837809874e-05, "loss": 0.1979, "loss_nan_ranks": 0, "loss_rank_avg": 0.20808371901512146, "step": 3235, "valid_targets_mean": 2226.3, "valid_targets_min": 702 }, { "epoch": 3.167155425219941, "grad_norm": 0.7481396583011426, "learning_rate": 2.669359754465231e-05, "loss": 0.1939, "loss_nan_ranks": 0, "loss_rank_avg": 0.20283767580986023, "step": 3240, "valid_targets_mean": 2323.2, "valid_targets_min": 618 }, { "epoch": 3.172043010752688, "grad_norm": 0.7195578782630686, "learning_rate": 2.6647636938231342e-05, "loss": 0.205, "loss_nan_ranks": 0, "loss_rank_avg": 0.21234679222106934, "step": 3245, "valid_targets_mean": 2472.0, "valid_targets_min": 642 }, { "epoch": 3.176930596285435, "grad_norm": 0.7513145461378141, "learning_rate": 2.6601636831931134e-05, "loss": 0.1937, "loss_nan_ranks": 0, "loss_rank_avg": 0.21580851078033447, "step": 3250, "valid_targets_mean": 2293.7, "valid_targets_min": 521 }, { "epoch": 3.1818181818181817, "grad_norm": 0.7021834829360021, "learning_rate": 2.6555597499081694e-05, "loss": 0.202, "loss_nan_ranks": 0, "loss_rank_avg": 0.2086678445339203, "step": 3255, "valid_targets_mean": 2655.6, "valid_targets_min": 921 }, { "epoch": 3.1867057673509285, "grad_norm": 0.7337259433387169, "learning_rate": 2.6509519213246107e-05, "loss": 0.2059, "loss_nan_ranks": 0, "loss_rank_avg": 0.19709116220474243, "step": 3260, "valid_targets_mean": 2152.6, "valid_targets_min": 661 }, { "epoch": 3.1915933528836753, "grad_norm": 0.7732965615576772, "learning_rate": 2.646340224821892e-05, "loss": 0.1973, "loss_nan_ranks": 0, "loss_rank_avg": 0.17325511574745178, "step": 3265, "valid_targets_mean": 1718.6, "valid_targets_min": 757 }, { "epoch": 3.196480938416422, "grad_norm": 0.7642020533927616, "learning_rate": 2.64172468780245e-05, "loss": 0.2098, "loss_nan_ranks": 0, "loss_rank_avg": 0.21912142634391785, "step": 3270, "valid_targets_mean": 1914.9, "valid_targets_min": 762 }, { "epoch": 3.201368523949169, "grad_norm": 0.7137081449723205, "learning_rate": 2.6371053376915442e-05, "loss": 0.205, "loss_nan_ranks": 0, "loss_rank_avg": 0.1930808126926422, "step": 3275, "valid_targets_mean": 2530.1, "valid_targets_min": 1259 }, { "epoch": 3.2062561094819158, "grad_norm": 0.7965252099837399, "learning_rate": 2.6324822019370874e-05, "loss": 0.1956, "loss_nan_ranks": 0, "loss_rank_avg": 0.20748776197433472, "step": 3280, "valid_targets_mean": 2264.4, "valid_targets_min": 801 }, { "epoch": 3.2111436950146626, "grad_norm": 0.7194214666441809, "learning_rate": 2.6278553080094887e-05, "loss": 0.2069, "loss_nan_ranks": 0, "loss_rank_avg": 0.22017285227775574, "step": 3285, "valid_targets_mean": 2692.5, "valid_targets_min": 794 }, { "epoch": 3.2160312805474094, "grad_norm": 0.7245863184684226, "learning_rate": 2.6232246834014876e-05, "loss": 0.2015, "loss_nan_ranks": 0, "loss_rank_avg": 0.1813446581363678, "step": 3290, "valid_targets_mean": 2046.6, "valid_targets_min": 659 }, { "epoch": 3.220918866080156, "grad_norm": 0.7908976384173254, "learning_rate": 2.618590355627992e-05, "loss": 0.2037, "loss_nan_ranks": 0, "loss_rank_avg": 0.2101239562034607, "step": 3295, "valid_targets_mean": 2258.9, "valid_targets_min": 1006 }, { "epoch": 3.225806451612903, "grad_norm": 0.7977860033215038, "learning_rate": 2.613952352225912e-05, "loss": 0.1876, "loss_nan_ranks": 0, "loss_rank_avg": 0.18104560673236847, "step": 3300, "valid_targets_mean": 1767.8, "valid_targets_min": 484 }, { "epoch": 3.23069403714565, "grad_norm": 0.6115674983154584, "learning_rate": 2.6093107007539998e-05, "loss": 0.1965, "loss_nan_ranks": 0, "loss_rank_avg": 0.17804718017578125, "step": 3305, "valid_targets_mean": 3087.1, "valid_targets_min": 818 }, { "epoch": 3.2355816226783967, "grad_norm": 0.6099669179614807, "learning_rate": 2.604665428792683e-05, "loss": 0.199, "loss_nan_ranks": 0, "loss_rank_avg": 0.20128144323825836, "step": 3310, "valid_targets_mean": 3071.8, "valid_targets_min": 1057 }, { "epoch": 3.2404692082111435, "grad_norm": 0.7754454106550883, "learning_rate": 2.600016563943904e-05, "loss": 0.2188, "loss_nan_ranks": 0, "loss_rank_avg": 0.216938778758049, "step": 3315, "valid_targets_mean": 2073.1, "valid_targets_min": 740 }, { "epoch": 3.2453567937438903, "grad_norm": 0.7143546354659018, "learning_rate": 2.5953641338309496e-05, "loss": 0.1982, "loss_nan_ranks": 0, "loss_rank_avg": 0.19034463167190552, "step": 3320, "valid_targets_mean": 2202.1, "valid_targets_min": 737 }, { "epoch": 3.250244379276637, "grad_norm": 0.8320544699825392, "learning_rate": 2.590708166098296e-05, "loss": 0.21, "loss_nan_ranks": 0, "loss_rank_avg": 0.20066097378730774, "step": 3325, "valid_targets_mean": 2138.4, "valid_targets_min": 985 }, { "epoch": 3.255131964809384, "grad_norm": 0.7253333750300228, "learning_rate": 2.586048688411437e-05, "loss": 0.2129, "loss_nan_ranks": 0, "loss_rank_avg": 0.23125603795051575, "step": 3330, "valid_targets_mean": 2893.1, "valid_targets_min": 1018 }, { "epoch": 3.2600195503421308, "grad_norm": 0.730875427222105, "learning_rate": 2.5813857284567237e-05, "loss": 0.1978, "loss_nan_ranks": 0, "loss_rank_avg": 0.19738978147506714, "step": 3335, "valid_targets_mean": 2522.3, "valid_targets_min": 859 }, { "epoch": 3.2649071358748776, "grad_norm": 0.7298430353490984, "learning_rate": 2.5767193139411964e-05, "loss": 0.1981, "loss_nan_ranks": 0, "loss_rank_avg": 0.20270711183547974, "step": 3340, "valid_targets_mean": 2434.2, "valid_targets_min": 467 }, { "epoch": 3.2697947214076244, "grad_norm": 1.083616521939471, "learning_rate": 2.5720494725924257e-05, "loss": 0.2122, "loss_nan_ranks": 0, "loss_rank_avg": 0.21499906480312347, "step": 3345, "valid_targets_mean": 1869.0, "valid_targets_min": 724 }, { "epoch": 3.274682306940371, "grad_norm": 0.6154395147501789, "learning_rate": 2.5673762321583415e-05, "loss": 0.2117, "loss_nan_ranks": 0, "loss_rank_avg": 0.21717801690101624, "step": 3350, "valid_targets_mean": 3228.8, "valid_targets_min": 974 }, { "epoch": 3.279569892473118, "grad_norm": 0.7777446446492675, "learning_rate": 2.5626996204070714e-05, "loss": 0.2065, "loss_nan_ranks": 0, "loss_rank_avg": 0.207222580909729, "step": 3355, "valid_targets_mean": 2294.8, "valid_targets_min": 705 }, { "epoch": 3.2844574780058653, "grad_norm": 0.626315557736335, "learning_rate": 2.558019665126777e-05, "loss": 0.2059, "loss_nan_ranks": 0, "loss_rank_avg": 0.18110740184783936, "step": 3360, "valid_targets_mean": 2922.9, "valid_targets_min": 607 }, { "epoch": 3.289345063538612, "grad_norm": 0.6898177043479149, "learning_rate": 2.5533363941254826e-05, "loss": 0.191, "loss_nan_ranks": 0, "loss_rank_avg": 0.18781378865242004, "step": 3365, "valid_targets_mean": 2249.1, "valid_targets_min": 740 }, { "epoch": 3.294232649071359, "grad_norm": 0.7219158135860761, "learning_rate": 2.5486498352309194e-05, "loss": 0.1993, "loss_nan_ranks": 0, "loss_rank_avg": 0.19829457998275757, "step": 3370, "valid_targets_mean": 2316.6, "valid_targets_min": 896 }, { "epoch": 3.2991202346041058, "grad_norm": 0.7339876884452256, "learning_rate": 2.5439600162903527e-05, "loss": 0.2071, "loss_nan_ranks": 0, "loss_rank_avg": 0.2177194505929947, "step": 3375, "valid_targets_mean": 2257.8, "valid_targets_min": 726 }, { "epoch": 3.3040078201368526, "grad_norm": 0.6776390716226277, "learning_rate": 2.5392669651704185e-05, "loss": 0.1997, "loss_nan_ranks": 0, "loss_rank_avg": 0.19257496297359467, "step": 3380, "valid_targets_mean": 2925.8, "valid_targets_min": 1060 }, { "epoch": 3.3088954056695994, "grad_norm": 0.759226279377635, "learning_rate": 2.5345707097569586e-05, "loss": 0.2066, "loss_nan_ranks": 0, "loss_rank_avg": 0.1948852837085724, "step": 3385, "valid_targets_mean": 2035.1, "valid_targets_min": 679 }, { "epoch": 3.313782991202346, "grad_norm": 0.7681252041823609, "learning_rate": 2.529871277954854e-05, "loss": 0.1939, "loss_nan_ranks": 0, "loss_rank_avg": 0.219600647687912, "step": 3390, "valid_targets_mean": 2099.7, "valid_targets_min": 798 }, { "epoch": 3.318670576735093, "grad_norm": 0.7587652122936347, "learning_rate": 2.5251686976878618e-05, "loss": 0.2064, "loss_nan_ranks": 0, "loss_rank_avg": 0.18549835681915283, "step": 3395, "valid_targets_mean": 2503.0, "valid_targets_min": 847 }, { "epoch": 3.32355816226784, "grad_norm": 0.6848113837428216, "learning_rate": 2.5204629968984443e-05, "loss": 0.1995, "loss_nan_ranks": 0, "loss_rank_avg": 0.21900366246700287, "step": 3400, "valid_targets_mean": 2764.0, "valid_targets_min": 651 }, { "epoch": 3.3284457478005867, "grad_norm": 0.6897084263388162, "learning_rate": 2.5157542035476077e-05, "loss": 0.1946, "loss_nan_ranks": 0, "loss_rank_avg": 0.19517606496810913, "step": 3405, "valid_targets_mean": 2661.6, "valid_targets_min": 960 }, { "epoch": 3.3333333333333335, "grad_norm": 0.7517965693921952, "learning_rate": 2.5110423456147322e-05, "loss": 0.2087, "loss_nan_ranks": 0, "loss_rank_avg": 0.21612215042114258, "step": 3410, "valid_targets_mean": 2433.1, "valid_targets_min": 975 }, { "epoch": 3.3382209188660803, "grad_norm": 0.7318661225517749, "learning_rate": 2.50632745109741e-05, "loss": 0.2108, "loss_nan_ranks": 0, "loss_rank_avg": 0.1917639672756195, "step": 3415, "valid_targets_mean": 1934.4, "valid_targets_min": 771 }, { "epoch": 3.343108504398827, "grad_norm": 0.7445802916995302, "learning_rate": 2.501609548011275e-05, "loss": 0.2026, "loss_nan_ranks": 0, "loss_rank_avg": 0.1921059787273407, "step": 3420, "valid_targets_mean": 2087.8, "valid_targets_min": 692 }, { "epoch": 3.347996089931574, "grad_norm": 0.6673062277647884, "learning_rate": 2.4968886643898366e-05, "loss": 0.1905, "loss_nan_ranks": 0, "loss_rank_avg": 0.18176676332950592, "step": 3425, "valid_targets_mean": 2963.6, "valid_targets_min": 1007 }, { "epoch": 3.3528836754643208, "grad_norm": 0.9097050470991745, "learning_rate": 2.4921648282843176e-05, "loss": 0.2005, "loss_nan_ranks": 0, "loss_rank_avg": 0.18103784322738647, "step": 3430, "valid_targets_mean": 2004.6, "valid_targets_min": 628 }, { "epoch": 3.3577712609970676, "grad_norm": 0.7122931954083914, "learning_rate": 2.4874380677634817e-05, "loss": 0.2066, "loss_nan_ranks": 0, "loss_rank_avg": 0.19356971979141235, "step": 3435, "valid_targets_mean": 2382.2, "valid_targets_min": 914 }, { "epoch": 3.3626588465298144, "grad_norm": 0.7088171184773836, "learning_rate": 2.4827084109134697e-05, "loss": 0.2163, "loss_nan_ranks": 0, "loss_rank_avg": 0.20455177128314972, "step": 3440, "valid_targets_mean": 2174.6, "valid_targets_min": 657 }, { "epoch": 3.367546432062561, "grad_norm": 0.6612005144692485, "learning_rate": 2.477975885837634e-05, "loss": 0.2057, "loss_nan_ranks": 0, "loss_rank_avg": 0.21015259623527527, "step": 3445, "valid_targets_mean": 2880.4, "valid_targets_min": 648 }, { "epoch": 3.372434017595308, "grad_norm": 0.7655924949272598, "learning_rate": 2.473240520656367e-05, "loss": 0.2118, "loss_nan_ranks": 0, "loss_rank_avg": 0.2177879959344864, "step": 3450, "valid_targets_mean": 2229.4, "valid_targets_min": 836 }, { "epoch": 3.377321603128055, "grad_norm": 0.7618724000532252, "learning_rate": 2.4685023435069388e-05, "loss": 0.2165, "loss_nan_ranks": 0, "loss_rank_avg": 0.23734396696090698, "step": 3455, "valid_targets_mean": 2332.8, "valid_targets_min": 621 }, { "epoch": 3.3822091886608017, "grad_norm": 0.8143707345252376, "learning_rate": 2.4637613825433277e-05, "loss": 0.1896, "loss_nan_ranks": 0, "loss_rank_avg": 0.19915053248405457, "step": 3460, "valid_targets_mean": 1512.4, "valid_targets_min": 668 }, { "epoch": 3.3870967741935485, "grad_norm": 0.8158876268350879, "learning_rate": 2.4590176659360538e-05, "loss": 0.2088, "loss_nan_ranks": 0, "loss_rank_avg": 0.22826993465423584, "step": 3465, "valid_targets_mean": 2035.4, "valid_targets_min": 650 }, { "epoch": 3.3919843597262953, "grad_norm": 0.6759338161481376, "learning_rate": 2.4542712218720093e-05, "loss": 0.2043, "loss_nan_ranks": 0, "loss_rank_avg": 0.18781697750091553, "step": 3470, "valid_targets_mean": 2423.6, "valid_targets_min": 738 }, { "epoch": 3.396871945259042, "grad_norm": 0.6931462841032442, "learning_rate": 2.449522078554294e-05, "loss": 0.203, "loss_nan_ranks": 0, "loss_rank_avg": 0.20876827836036682, "step": 3475, "valid_targets_mean": 2486.4, "valid_targets_min": 610 }, { "epoch": 3.401759530791789, "grad_norm": 0.656880638760444, "learning_rate": 2.444770264202047e-05, "loss": 0.2045, "loss_nan_ranks": 0, "loss_rank_avg": 0.21965506672859192, "step": 3480, "valid_targets_mean": 2932.4, "valid_targets_min": 924 }, { "epoch": 3.4066471163245358, "grad_norm": 0.7793846246855756, "learning_rate": 2.4400158070502773e-05, "loss": 0.199, "loss_nan_ranks": 0, "loss_rank_avg": 0.2179027497768402, "step": 3485, "valid_targets_mean": 2128.7, "valid_targets_min": 807 }, { "epoch": 3.4115347018572826, "grad_norm": 0.6366727057551457, "learning_rate": 2.435258735349699e-05, "loss": 0.2043, "loss_nan_ranks": 0, "loss_rank_avg": 0.207027405500412, "step": 3490, "valid_targets_mean": 3005.8, "valid_targets_min": 901 }, { "epoch": 3.4164222873900294, "grad_norm": 0.8083254712829566, "learning_rate": 2.4304990773665587e-05, "loss": 0.2094, "loss_nan_ranks": 0, "loss_rank_avg": 0.22201141715049744, "step": 3495, "valid_targets_mean": 2266.4, "valid_targets_min": 790 }, { "epoch": 3.421309872922776, "grad_norm": 0.7883137521426757, "learning_rate": 2.4257368613824745e-05, "loss": 0.1927, "loss_nan_ranks": 0, "loss_rank_avg": 0.18446215987205505, "step": 3500, "valid_targets_mean": 1863.5, "valid_targets_min": 1075 }, { "epoch": 3.426197458455523, "grad_norm": 0.7729853988513622, "learning_rate": 2.4209721156942615e-05, "loss": 0.1929, "loss_nan_ranks": 0, "loss_rank_avg": 0.1607511341571808, "step": 3505, "valid_targets_mean": 1680.6, "valid_targets_min": 792 }, { "epoch": 3.43108504398827, "grad_norm": 0.7615871115872819, "learning_rate": 2.416204868613765e-05, "loss": 0.1997, "loss_nan_ranks": 0, "loss_rank_avg": 0.2097199559211731, "step": 3510, "valid_targets_mean": 2369.9, "valid_targets_min": 809 }, { "epoch": 3.4359726295210167, "grad_norm": 0.7886947243326079, "learning_rate": 2.4114351484676975e-05, "loss": 0.2135, "loss_nan_ranks": 0, "loss_rank_avg": 0.22828155755996704, "step": 3515, "valid_targets_mean": 2259.6, "valid_targets_min": 702 }, { "epoch": 3.4408602150537635, "grad_norm": 0.6428893882305308, "learning_rate": 2.4066629835974614e-05, "loss": 0.2127, "loss_nan_ranks": 0, "loss_rank_avg": 0.22016070783138275, "step": 3520, "valid_targets_mean": 3275.2, "valid_targets_min": 1265 }, { "epoch": 3.4457478005865103, "grad_norm": 0.822974697294548, "learning_rate": 2.40188840235899e-05, "loss": 0.2002, "loss_nan_ranks": 0, "loss_rank_avg": 0.20060139894485474, "step": 3525, "valid_targets_mean": 1830.9, "valid_targets_min": 692 }, { "epoch": 3.450635386119257, "grad_norm": 0.6770812059975508, "learning_rate": 2.3971114331225715e-05, "loss": 0.2026, "loss_nan_ranks": 0, "loss_rank_avg": 0.20556485652923584, "step": 3530, "valid_targets_mean": 2694.8, "valid_targets_min": 642 }, { "epoch": 3.455522971652004, "grad_norm": 0.7786397671656108, "learning_rate": 2.392332104272684e-05, "loss": 0.2004, "loss_nan_ranks": 0, "loss_rank_avg": 0.2165582925081253, "step": 3535, "valid_targets_mean": 2489.4, "valid_targets_min": 786 }, { "epoch": 3.4604105571847508, "grad_norm": 0.7323225666730152, "learning_rate": 2.3875504442078282e-05, "loss": 0.1964, "loss_nan_ranks": 0, "loss_rank_avg": 0.21573954820632935, "step": 3540, "valid_targets_mean": 2259.0, "valid_targets_min": 713 }, { "epoch": 3.4652981427174976, "grad_norm": 0.6799054356460841, "learning_rate": 2.3827664813403537e-05, "loss": 0.1859, "loss_nan_ranks": 0, "loss_rank_avg": 0.1902822107076645, "step": 3545, "valid_targets_mean": 2551.8, "valid_targets_min": 627 }, { "epoch": 3.4701857282502444, "grad_norm": 0.7472013601982304, "learning_rate": 2.3779802440962958e-05, "loss": 0.2059, "loss_nan_ranks": 0, "loss_rank_avg": 0.20308758318424225, "step": 3550, "valid_targets_mean": 2375.5, "valid_targets_min": 982 }, { "epoch": 3.4750733137829912, "grad_norm": 0.7391959529865234, "learning_rate": 2.3731917609152023e-05, "loss": 0.2097, "loss_nan_ranks": 0, "loss_rank_avg": 0.21505077183246613, "step": 3555, "valid_targets_mean": 2454.9, "valid_targets_min": 704 }, { "epoch": 3.479960899315738, "grad_norm": 0.6408227234028441, "learning_rate": 2.3684010602499675e-05, "loss": 0.204, "loss_nan_ranks": 0, "loss_rank_avg": 0.18841466307640076, "step": 3560, "valid_targets_mean": 2844.4, "valid_targets_min": 736 }, { "epoch": 3.484848484848485, "grad_norm": 0.6995274259824635, "learning_rate": 2.363608170566661e-05, "loss": 0.1934, "loss_nan_ranks": 0, "loss_rank_avg": 0.19288122653961182, "step": 3565, "valid_targets_mean": 2298.1, "valid_targets_min": 593 }, { "epoch": 3.4897360703812317, "grad_norm": 0.712559649636414, "learning_rate": 2.35881312034436e-05, "loss": 0.1902, "loss_nan_ranks": 0, "loss_rank_avg": 0.18562278151512146, "step": 3570, "valid_targets_mean": 2527.5, "valid_targets_min": 1190 }, { "epoch": 3.4946236559139785, "grad_norm": 0.7601682130608852, "learning_rate": 2.3540159380749794e-05, "loss": 0.1995, "loss_nan_ranks": 0, "loss_rank_avg": 0.18290041387081146, "step": 3575, "valid_targets_mean": 1959.9, "valid_targets_min": 244 }, { "epoch": 3.4995112414467253, "grad_norm": 0.6518733256350043, "learning_rate": 2.349216652263101e-05, "loss": 0.2052, "loss_nan_ranks": 0, "loss_rank_avg": 0.1879890263080597, "step": 3580, "valid_targets_mean": 2892.5, "valid_targets_min": 788 }, { "epoch": 3.504398826979472, "grad_norm": 0.6632097525792074, "learning_rate": 2.3444152914258087e-05, "loss": 0.2029, "loss_nan_ranks": 0, "loss_rank_avg": 0.19737496972084045, "step": 3585, "valid_targets_mean": 2592.2, "valid_targets_min": 694 }, { "epoch": 3.509286412512219, "grad_norm": 0.701914967587876, "learning_rate": 2.339611884092514e-05, "loss": 0.1971, "loss_nan_ranks": 0, "loss_rank_avg": 0.21197064220905304, "step": 3590, "valid_targets_mean": 2489.3, "valid_targets_min": 763 }, { "epoch": 3.5141739980449658, "grad_norm": 0.7664935207947431, "learning_rate": 2.3348064588047893e-05, "loss": 0.1987, "loss_nan_ranks": 0, "loss_rank_avg": 0.19324423372745514, "step": 3595, "valid_targets_mean": 1855.3, "valid_targets_min": 635 }, { "epoch": 3.5190615835777126, "grad_norm": 0.7141259014048177, "learning_rate": 2.329999044116197e-05, "loss": 0.2085, "loss_nan_ranks": 0, "loss_rank_avg": 0.21774733066558838, "step": 3600, "valid_targets_mean": 2392.5, "valid_targets_min": 682 }, { "epoch": 3.5239491691104594, "grad_norm": 0.6730829479768565, "learning_rate": 2.3251896685921205e-05, "loss": 0.2078, "loss_nan_ranks": 0, "loss_rank_avg": 0.19916030764579773, "step": 3605, "valid_targets_mean": 2920.2, "valid_targets_min": 821 }, { "epoch": 3.5288367546432062, "grad_norm": 0.7671142376386617, "learning_rate": 2.3203783608095954e-05, "loss": 0.2124, "loss_nan_ranks": 0, "loss_rank_avg": 0.23348473012447357, "step": 3610, "valid_targets_mean": 2295.7, "valid_targets_min": 959 }, { "epoch": 3.533724340175953, "grad_norm": 0.7689072632328403, "learning_rate": 2.3155651493571382e-05, "loss": 0.2053, "loss_nan_ranks": 0, "loss_rank_avg": 0.20937813818454742, "step": 3615, "valid_targets_mean": 2182.8, "valid_targets_min": 1082 }, { "epoch": 3.5386119257087, "grad_norm": 0.7292242265860919, "learning_rate": 2.3107500628345756e-05, "loss": 0.2075, "loss_nan_ranks": 0, "loss_rank_avg": 0.22746799886226654, "step": 3620, "valid_targets_mean": 2486.5, "valid_targets_min": 730 }, { "epoch": 3.5434995112414467, "grad_norm": 0.7976787109769994, "learning_rate": 2.3059331298528776e-05, "loss": 0.2103, "loss_nan_ranks": 0, "loss_rank_avg": 0.2245236039161682, "step": 3625, "valid_targets_mean": 1958.8, "valid_targets_min": 1215 }, { "epoch": 3.5483870967741935, "grad_norm": 0.7468841302577356, "learning_rate": 2.301114379033984e-05, "loss": 0.201, "loss_nan_ranks": 0, "loss_rank_avg": 0.18756568431854248, "step": 3630, "valid_targets_mean": 1843.2, "valid_targets_min": 900 }, { "epoch": 3.5532746823069403, "grad_norm": 0.7052365263985373, "learning_rate": 2.2962938390106388e-05, "loss": 0.2051, "loss_nan_ranks": 0, "loss_rank_avg": 0.190373957157135, "step": 3635, "valid_targets_mean": 2208.5, "valid_targets_min": 672 }, { "epoch": 3.558162267839687, "grad_norm": 0.7861655797997658, "learning_rate": 2.291471538426214e-05, "loss": 0.2009, "loss_nan_ranks": 0, "loss_rank_avg": 0.21023714542388916, "step": 3640, "valid_targets_mean": 2122.3, "valid_targets_min": 654 }, { "epoch": 3.563049853372434, "grad_norm": 0.7654010417442486, "learning_rate": 2.2866475059345453e-05, "loss": 0.2049, "loss_nan_ranks": 0, "loss_rank_avg": 0.21987277269363403, "step": 3645, "valid_targets_mean": 2314.6, "valid_targets_min": 872 }, { "epoch": 3.567937438905181, "grad_norm": 0.7329153965811843, "learning_rate": 2.2818217701997577e-05, "loss": 0.1947, "loss_nan_ranks": 0, "loss_rank_avg": 0.19848138093948364, "step": 3650, "valid_targets_mean": 2325.4, "valid_targets_min": 815 }, { "epoch": 3.5728250244379276, "grad_norm": 0.6582062601819844, "learning_rate": 2.276994359896099e-05, "loss": 0.2144, "loss_nan_ranks": 0, "loss_rank_avg": 0.20447036623954773, "step": 3655, "valid_targets_mean": 2623.2, "valid_targets_min": 985 }, { "epoch": 3.5777126099706744, "grad_norm": 0.6885840936099205, "learning_rate": 2.2721653037077645e-05, "loss": 0.1998, "loss_nan_ranks": 0, "loss_rank_avg": 0.2211674004793167, "step": 3660, "valid_targets_mean": 2750.7, "valid_targets_min": 701 }, { "epoch": 3.5826001955034212, "grad_norm": 0.7022727114163723, "learning_rate": 2.2673346303287297e-05, "loss": 0.2, "loss_nan_ranks": 0, "loss_rank_avg": 0.19418203830718994, "step": 3665, "valid_targets_mean": 2241.1, "valid_targets_min": 548 }, { "epoch": 3.587487781036168, "grad_norm": 0.6929148877932964, "learning_rate": 2.262502368462582e-05, "loss": 0.2081, "loss_nan_ranks": 0, "loss_rank_avg": 0.22029688954353333, "step": 3670, "valid_targets_mean": 2660.6, "valid_targets_min": 729 }, { "epoch": 3.592375366568915, "grad_norm": 0.6443170990968766, "learning_rate": 2.2576685468223444e-05, "loss": 0.2015, "loss_nan_ranks": 0, "loss_rank_avg": 0.18446439504623413, "step": 3675, "valid_targets_mean": 2688.0, "valid_targets_min": 692 }, { "epoch": 3.5972629521016617, "grad_norm": 0.600440286447225, "learning_rate": 2.2528331941303093e-05, "loss": 0.2057, "loss_nan_ranks": 0, "loss_rank_avg": 0.19318996369838715, "step": 3680, "valid_targets_mean": 3134.5, "valid_targets_min": 1041 }, { "epoch": 3.6021505376344085, "grad_norm": 0.7844338847583994, "learning_rate": 2.2479963391178657e-05, "loss": 0.2047, "loss_nan_ranks": 0, "loss_rank_avg": 0.21118606626987457, "step": 3685, "valid_targets_mean": 2066.8, "valid_targets_min": 814 }, { "epoch": 3.6070381231671553, "grad_norm": 0.7215085805201092, "learning_rate": 2.2431580105253313e-05, "loss": 0.2149, "loss_nan_ranks": 0, "loss_rank_avg": 0.20135241746902466, "step": 3690, "valid_targets_mean": 2184.1, "valid_targets_min": 722 }, { "epoch": 3.611925708699902, "grad_norm": 0.6656818554741202, "learning_rate": 2.238318237101778e-05, "loss": 0.1995, "loss_nan_ranks": 0, "loss_rank_avg": 0.20373103022575378, "step": 3695, "valid_targets_mean": 2753.5, "valid_targets_min": 975 }, { "epoch": 3.616813294232649, "grad_norm": 0.7180482881493666, "learning_rate": 2.233477047604863e-05, "loss": 0.2223, "loss_nan_ranks": 0, "loss_rank_avg": 0.1976693719625473, "step": 3700, "valid_targets_mean": 2586.9, "valid_targets_min": 692 }, { "epoch": 3.621700879765396, "grad_norm": 0.6461550790717755, "learning_rate": 2.2286344708006578e-05, "loss": 0.2125, "loss_nan_ranks": 0, "loss_rank_avg": 0.20432640612125397, "step": 3705, "valid_targets_mean": 3076.8, "valid_targets_min": 952 }, { "epoch": 3.6265884652981426, "grad_norm": 0.7135365897281873, "learning_rate": 2.2237905354634775e-05, "loss": 0.213, "loss_nan_ranks": 0, "loss_rank_avg": 0.21222619712352753, "step": 3710, "valid_targets_mean": 2544.2, "valid_targets_min": 1058 }, { "epoch": 3.6314760508308894, "grad_norm": 0.7106647598992838, "learning_rate": 2.2189452703757097e-05, "loss": 0.2045, "loss_nan_ranks": 0, "loss_rank_avg": 0.1919505000114441, "step": 3715, "valid_targets_mean": 2239.9, "valid_targets_min": 700 }, { "epoch": 3.6363636363636362, "grad_norm": 0.7370346403284481, "learning_rate": 2.214098704327643e-05, "loss": 0.2085, "loss_nan_ranks": 0, "loss_rank_avg": 0.2074413299560547, "step": 3720, "valid_targets_mean": 2248.9, "valid_targets_min": 504 }, { "epoch": 3.641251221896383, "grad_norm": 0.6946560980334792, "learning_rate": 2.2092508661172957e-05, "loss": 0.2158, "loss_nan_ranks": 0, "loss_rank_avg": 0.18183276057243347, "step": 3725, "valid_targets_mean": 2272.8, "valid_targets_min": 746 }, { "epoch": 3.64613880742913, "grad_norm": 0.6384613289501591, "learning_rate": 2.204401784550246e-05, "loss": 0.2039, "loss_nan_ranks": 0, "loss_rank_avg": 0.18616612255573273, "step": 3730, "valid_targets_mean": 2584.4, "valid_targets_min": 684 }, { "epoch": 3.6510263929618767, "grad_norm": 0.6909767548097899, "learning_rate": 2.1995514884394596e-05, "loss": 0.1977, "loss_nan_ranks": 0, "loss_rank_avg": 0.1910645067691803, "step": 3735, "valid_targets_mean": 2587.4, "valid_targets_min": 771 }, { "epoch": 3.6559139784946235, "grad_norm": 0.8148464145542923, "learning_rate": 2.1947000066051204e-05, "loss": 0.1957, "loss_nan_ranks": 0, "loss_rank_avg": 0.20611697435379028, "step": 3740, "valid_targets_mean": 1887.4, "valid_targets_min": 730 }, { "epoch": 3.6608015640273703, "grad_norm": 0.7056151602431089, "learning_rate": 2.189847367874454e-05, "loss": 0.2049, "loss_nan_ranks": 0, "loss_rank_avg": 0.21500477194786072, "step": 3745, "valid_targets_mean": 2486.1, "valid_targets_min": 1001 }, { "epoch": 3.665689149560117, "grad_norm": 1.0531242937391503, "learning_rate": 2.1849936010815653e-05, "loss": 0.212, "loss_nan_ranks": 0, "loss_rank_avg": 0.21067142486572266, "step": 3750, "valid_targets_mean": 1737.8, "valid_targets_min": 714 }, { "epoch": 3.670576735092864, "grad_norm": 0.7901950772244742, "learning_rate": 2.1801387350672577e-05, "loss": 0.2038, "loss_nan_ranks": 0, "loss_rank_avg": 0.20664237439632416, "step": 3755, "valid_targets_mean": 2177.6, "valid_targets_min": 627 }, { "epoch": 3.675464320625611, "grad_norm": 0.7840380182400347, "learning_rate": 2.175282798678869e-05, "loss": 0.203, "loss_nan_ranks": 0, "loss_rank_avg": 0.21524584293365479, "step": 3760, "valid_targets_mean": 2213.3, "valid_targets_min": 722 }, { "epoch": 3.6803519061583576, "grad_norm": 0.7134090806306669, "learning_rate": 2.170425820770096e-05, "loss": 0.2022, "loss_nan_ranks": 0, "loss_rank_avg": 0.20987609028816223, "step": 3765, "valid_targets_mean": 2505.4, "valid_targets_min": 1124 }, { "epoch": 3.6852394916911044, "grad_norm": 0.7246436271430389, "learning_rate": 2.1655678302008232e-05, "loss": 0.2124, "loss_nan_ranks": 0, "loss_rank_avg": 0.20697399973869324, "step": 3770, "valid_targets_mean": 2323.0, "valid_targets_min": 753 }, { "epoch": 3.6901270772238517, "grad_norm": 0.6770013885437635, "learning_rate": 2.160708855836954e-05, "loss": 0.2032, "loss_nan_ranks": 0, "loss_rank_avg": 0.1982710063457489, "step": 3775, "valid_targets_mean": 2790.8, "valid_targets_min": 715 }, { "epoch": 3.6950146627565985, "grad_norm": 0.799738720478482, "learning_rate": 2.1558489265502373e-05, "loss": 0.1962, "loss_nan_ranks": 0, "loss_rank_avg": 0.220750093460083, "step": 3780, "valid_targets_mean": 2273.8, "valid_targets_min": 750 }, { "epoch": 3.6999022482893453, "grad_norm": 0.6508927329830108, "learning_rate": 2.1509880712180946e-05, "loss": 0.2022, "loss_nan_ranks": 0, "loss_rank_avg": 0.20443478226661682, "step": 3785, "valid_targets_mean": 2857.2, "valid_targets_min": 874 }, { "epoch": 3.704789833822092, "grad_norm": 0.6802733863979533, "learning_rate": 2.1461263187234515e-05, "loss": 0.213, "loss_nan_ranks": 0, "loss_rank_avg": 0.20990541577339172, "step": 3790, "valid_targets_mean": 2561.4, "valid_targets_min": 705 }, { "epoch": 3.709677419354839, "grad_norm": 0.7028949057842757, "learning_rate": 2.141263697954563e-05, "loss": 0.2011, "loss_nan_ranks": 0, "loss_rank_avg": 0.2133583277463913, "step": 3795, "valid_targets_mean": 2545.5, "valid_targets_min": 881 }, { "epoch": 3.714565004887586, "grad_norm": 0.6847821139141917, "learning_rate": 2.1364002378048446e-05, "loss": 0.2063, "loss_nan_ranks": 0, "loss_rank_avg": 0.20359432697296143, "step": 3800, "valid_targets_mean": 2529.1, "valid_targets_min": 914 }, { "epoch": 3.7194525904203326, "grad_norm": 0.7683431448503167, "learning_rate": 2.1315359671726994e-05, "loss": 0.1963, "loss_nan_ranks": 0, "loss_rank_avg": 0.20140613615512848, "step": 3805, "valid_targets_mean": 2015.9, "valid_targets_min": 740 }, { "epoch": 3.7243401759530794, "grad_norm": 0.6765983248131439, "learning_rate": 2.1266709149613448e-05, "loss": 0.2005, "loss_nan_ranks": 0, "loss_rank_avg": 0.19246436655521393, "step": 3810, "valid_targets_mean": 2428.9, "valid_targets_min": 870 }, { "epoch": 3.7292277614858262, "grad_norm": 0.9226737395699486, "learning_rate": 2.1218051100786443e-05, "loss": 0.1986, "loss_nan_ranks": 0, "loss_rank_avg": 0.1814860701560974, "step": 3815, "valid_targets_mean": 1909.5, "valid_targets_min": 779 }, { "epoch": 3.734115347018573, "grad_norm": 0.8000270533236249, "learning_rate": 2.1169385814369317e-05, "loss": 0.2032, "loss_nan_ranks": 0, "loss_rank_avg": 0.22426359355449677, "step": 3820, "valid_targets_mean": 1909.4, "valid_targets_min": 711 }, { "epoch": 3.73900293255132, "grad_norm": 0.6753953556756007, "learning_rate": 2.112071357952844e-05, "loss": 0.199, "loss_nan_ranks": 0, "loss_rank_avg": 0.1894885152578354, "step": 3825, "valid_targets_mean": 2391.7, "valid_targets_min": 696 }, { "epoch": 3.7438905180840667, "grad_norm": 0.7747404427802933, "learning_rate": 2.1072034685471442e-05, "loss": 0.2011, "loss_nan_ranks": 0, "loss_rank_avg": 0.2056509256362915, "step": 3830, "valid_targets_mean": 1816.9, "valid_targets_min": 548 }, { "epoch": 3.7487781036168135, "grad_norm": 0.7637718123929285, "learning_rate": 2.1023349421445532e-05, "loss": 0.2095, "loss_nan_ranks": 0, "loss_rank_avg": 0.20844748616218567, "step": 3835, "valid_targets_mean": 2643.7, "valid_targets_min": 793 }, { "epoch": 3.7536656891495603, "grad_norm": 0.6354837562399616, "learning_rate": 2.0974658076735767e-05, "loss": 0.2046, "loss_nan_ranks": 0, "loss_rank_avg": 0.1894562840461731, "step": 3840, "valid_targets_mean": 2781.6, "valid_targets_min": 1309 }, { "epoch": 3.758553274682307, "grad_norm": 0.6766758246484479, "learning_rate": 2.0925960940663356e-05, "loss": 0.2023, "loss_nan_ranks": 0, "loss_rank_avg": 0.19174224138259888, "step": 3845, "valid_targets_mean": 2529.0, "valid_targets_min": 987 }, { "epoch": 3.763440860215054, "grad_norm": 0.6892947666726518, "learning_rate": 2.087725830258389e-05, "loss": 0.2063, "loss_nan_ranks": 0, "loss_rank_avg": 0.2084968388080597, "step": 3850, "valid_targets_mean": 2646.6, "valid_targets_min": 655 }, { "epoch": 3.768328445747801, "grad_norm": 0.70291002815775, "learning_rate": 2.082855045188565e-05, "loss": 0.2095, "loss_nan_ranks": 0, "loss_rank_avg": 0.20856565237045288, "step": 3855, "valid_targets_mean": 2704.9, "valid_targets_min": 789 }, { "epoch": 3.7732160312805476, "grad_norm": 0.7692739550745331, "learning_rate": 2.0779837677987927e-05, "loss": 0.199, "loss_nan_ranks": 0, "loss_rank_avg": 0.19723054766654968, "step": 3860, "valid_targets_mean": 1855.1, "valid_targets_min": 1118 }, { "epoch": 3.7781036168132944, "grad_norm": 0.7101378522156258, "learning_rate": 2.073112027033923e-05, "loss": 0.2175, "loss_nan_ranks": 0, "loss_rank_avg": 0.21212387084960938, "step": 3865, "valid_targets_mean": 2229.6, "valid_targets_min": 1150 }, { "epoch": 3.7829912023460412, "grad_norm": 0.795515076642536, "learning_rate": 2.068239851841563e-05, "loss": 0.1954, "loss_nan_ranks": 0, "loss_rank_avg": 0.20189426839351654, "step": 3870, "valid_targets_mean": 2010.2, "valid_targets_min": 768 }, { "epoch": 3.787878787878788, "grad_norm": 0.8748951610329812, "learning_rate": 2.0633672711718975e-05, "loss": 0.2098, "loss_nan_ranks": 0, "loss_rank_avg": 0.20840033888816833, "step": 3875, "valid_targets_mean": 2443.8, "valid_targets_min": 1158 }, { "epoch": 3.792766373411535, "grad_norm": 0.6476901318697162, "learning_rate": 2.0584943139775237e-05, "loss": 0.203, "loss_nan_ranks": 0, "loss_rank_avg": 0.1948857605457306, "step": 3880, "valid_targets_mean": 2858.7, "valid_targets_min": 882 }, { "epoch": 3.7976539589442817, "grad_norm": 0.7397815710205294, "learning_rate": 2.053621009213276e-05, "loss": 0.2054, "loss_nan_ranks": 0, "loss_rank_avg": 0.21412993967533112, "step": 3885, "valid_targets_mean": 2184.9, "valid_targets_min": 997 }, { "epoch": 3.8025415444770285, "grad_norm": 0.7146555857159458, "learning_rate": 2.0487473858360515e-05, "loss": 0.1965, "loss_nan_ranks": 0, "loss_rank_avg": 0.18842893838882446, "step": 3890, "valid_targets_mean": 2270.2, "valid_targets_min": 713 }, { "epoch": 3.8074291300097753, "grad_norm": 0.65940562297892, "learning_rate": 2.0438734728046432e-05, "loss": 0.1959, "loss_nan_ranks": 0, "loss_rank_avg": 0.18981792032718658, "step": 3895, "valid_targets_mean": 2287.4, "valid_targets_min": 1016 }, { "epoch": 3.812316715542522, "grad_norm": 0.8426072348378402, "learning_rate": 2.0389992990795632e-05, "loss": 0.207, "loss_nan_ranks": 0, "loss_rank_avg": 0.22454825043678284, "step": 3900, "valid_targets_mean": 1866.6, "valid_targets_min": 537 }, { "epoch": 3.817204301075269, "grad_norm": 0.7342198247089646, "learning_rate": 2.0341248936228748e-05, "loss": 0.2015, "loss_nan_ranks": 0, "loss_rank_avg": 0.2228454351425171, "step": 3905, "valid_targets_mean": 2335.3, "valid_targets_min": 1021 }, { "epoch": 3.822091886608016, "grad_norm": 0.6636543015733303, "learning_rate": 2.0292502853980164e-05, "loss": 0.2027, "loss_nan_ranks": 0, "loss_rank_avg": 0.20288674533367157, "step": 3910, "valid_targets_mean": 2667.2, "valid_targets_min": 791 }, { "epoch": 3.8269794721407626, "grad_norm": 0.7610090323169763, "learning_rate": 2.0243755033696313e-05, "loss": 0.1981, "loss_nan_ranks": 0, "loss_rank_avg": 0.20183882117271423, "step": 3915, "valid_targets_mean": 2155.2, "valid_targets_min": 632 }, { "epoch": 3.8318670576735094, "grad_norm": 0.6831492165378048, "learning_rate": 2.019500576503397e-05, "loss": 0.2015, "loss_nan_ranks": 0, "loss_rank_avg": 0.1926528513431549, "step": 3920, "valid_targets_mean": 2656.8, "valid_targets_min": 1210 }, { "epoch": 3.8367546432062563, "grad_norm": 0.7402425571751615, "learning_rate": 2.0146255337658494e-05, "loss": 0.1996, "loss_nan_ranks": 0, "loss_rank_avg": 0.21684202551841736, "step": 3925, "valid_targets_mean": 2248.5, "valid_targets_min": 420 }, { "epoch": 3.841642228739003, "grad_norm": 0.6921612269978583, "learning_rate": 2.009750404124216e-05, "loss": 0.1975, "loss_nan_ranks": 0, "loss_rank_avg": 0.20540589094161987, "step": 3930, "valid_targets_mean": 2690.6, "valid_targets_min": 697 }, { "epoch": 3.84652981427175, "grad_norm": 0.7529950655294566, "learning_rate": 2.0048752165462373e-05, "loss": 0.2071, "loss_nan_ranks": 0, "loss_rank_avg": 0.21762652695178986, "step": 3935, "valid_targets_mean": 2733.9, "valid_targets_min": 844 }, { "epoch": 3.8514173998044967, "grad_norm": 0.6580479552711862, "learning_rate": 2e-05, "loss": 0.1892, "loss_nan_ranks": 0, "loss_rank_avg": 0.1937936544418335, "step": 3940, "valid_targets_mean": 2622.9, "valid_targets_min": 632 }, { "epoch": 3.8563049853372435, "grad_norm": 0.8321134334974649, "learning_rate": 1.9951247834537634e-05, "loss": 0.2118, "loss_nan_ranks": 0, "loss_rank_avg": 0.21654708683490753, "step": 3945, "valid_targets_mean": 2118.2, "valid_targets_min": 594 }, { "epoch": 3.8611925708699903, "grad_norm": 0.8110075847407984, "learning_rate": 1.9902495958757844e-05, "loss": 0.2032, "loss_nan_ranks": 0, "loss_rank_avg": 0.21147048473358154, "step": 3950, "valid_targets_mean": 2464.2, "valid_targets_min": 775 }, { "epoch": 3.866080156402737, "grad_norm": 0.8481527474330096, "learning_rate": 1.985374466234151e-05, "loss": 0.2005, "loss_nan_ranks": 0, "loss_rank_avg": 0.1752730906009674, "step": 3955, "valid_targets_mean": 1691.5, "valid_targets_min": 680 }, { "epoch": 3.870967741935484, "grad_norm": 0.7391679144111151, "learning_rate": 1.9804994234966036e-05, "loss": 0.2009, "loss_nan_ranks": 0, "loss_rank_avg": 0.2055065929889679, "step": 3960, "valid_targets_mean": 2255.8, "valid_targets_min": 1006 }, { "epoch": 3.875855327468231, "grad_norm": 0.6879643282262666, "learning_rate": 1.9756244966303693e-05, "loss": 0.2096, "loss_nan_ranks": 0, "loss_rank_avg": 0.21640875935554504, "step": 3965, "valid_targets_mean": 2545.9, "valid_targets_min": 750 }, { "epoch": 3.8807429130009776, "grad_norm": 0.682330103660924, "learning_rate": 1.9707497146019846e-05, "loss": 0.1957, "loss_nan_ranks": 0, "loss_rank_avg": 0.17964300513267517, "step": 3970, "valid_targets_mean": 2946.8, "valid_targets_min": 750 }, { "epoch": 3.8856304985337244, "grad_norm": 0.6624662717730248, "learning_rate": 1.9658751063771255e-05, "loss": 0.2079, "loss_nan_ranks": 0, "loss_rank_avg": 0.20151904225349426, "step": 3975, "valid_targets_mean": 3265.1, "valid_targets_min": 711 }, { "epoch": 3.8905180840664713, "grad_norm": 0.7423253354159347, "learning_rate": 1.961000700920437e-05, "loss": 0.2047, "loss_nan_ranks": 0, "loss_rank_avg": 0.19609767198562622, "step": 3980, "valid_targets_mean": 2088.9, "valid_targets_min": 780 }, { "epoch": 3.895405669599218, "grad_norm": 0.9813652565552392, "learning_rate": 1.956126527195358e-05, "loss": 0.2128, "loss_nan_ranks": 0, "loss_rank_avg": 0.2142195701599121, "step": 3985, "valid_targets_mean": 2652.4, "valid_targets_min": 759 }, { "epoch": 3.900293255131965, "grad_norm": 0.5712086066191886, "learning_rate": 1.9512526141639492e-05, "loss": 0.1891, "loss_nan_ranks": 0, "loss_rank_avg": 0.16019731760025024, "step": 3990, "valid_targets_mean": 3155.6, "valid_targets_min": 770 }, { "epoch": 3.9051808406647117, "grad_norm": 0.7587001616327813, "learning_rate": 1.9463789907867248e-05, "loss": 0.2138, "loss_nan_ranks": 0, "loss_rank_avg": 0.25113722681999207, "step": 3995, "valid_targets_mean": 2617.2, "valid_targets_min": 869 }, { "epoch": 3.9100684261974585, "grad_norm": 0.7046294004069471, "learning_rate": 1.941505686022476e-05, "loss": 0.2034, "loss_nan_ranks": 0, "loss_rank_avg": 0.18923306465148926, "step": 4000, "valid_targets_mean": 2173.3, "valid_targets_min": 929 }, { "epoch": 3.9149560117302054, "grad_norm": 0.6934724921753709, "learning_rate": 1.936632728828103e-05, "loss": 0.2098, "loss_nan_ranks": 0, "loss_rank_avg": 0.20533259212970734, "step": 4005, "valid_targets_mean": 2358.2, "valid_targets_min": 898 }, { "epoch": 3.919843597262952, "grad_norm": 0.8196595601053237, "learning_rate": 1.9317601481584383e-05, "loss": 0.208, "loss_nan_ranks": 0, "loss_rank_avg": 0.2104458212852478, "step": 4010, "valid_targets_mean": 1972.3, "valid_targets_min": 725 }, { "epoch": 3.924731182795699, "grad_norm": 0.7849322123412164, "learning_rate": 1.926887972966077e-05, "loss": 0.2128, "loss_nan_ranks": 0, "loss_rank_avg": 0.269350528717041, "step": 4015, "valid_targets_mean": 2177.9, "valid_targets_min": 819 }, { "epoch": 3.929618768328446, "grad_norm": 0.7525483327532918, "learning_rate": 1.922016232201208e-05, "loss": 0.2074, "loss_nan_ranks": 0, "loss_rank_avg": 0.21186742186546326, "step": 4020, "valid_targets_mean": 2130.6, "valid_targets_min": 548 }, { "epoch": 3.9345063538611926, "grad_norm": 0.6367950186766983, "learning_rate": 1.917144954811435e-05, "loss": 0.2004, "loss_nan_ranks": 0, "loss_rank_avg": 0.19727790355682373, "step": 4025, "valid_targets_mean": 2766.4, "valid_targets_min": 817 }, { "epoch": 3.9393939393939394, "grad_norm": 0.7362334474471227, "learning_rate": 1.9122741697416122e-05, "loss": 0.1986, "loss_nan_ranks": 0, "loss_rank_avg": 0.206711083650589, "step": 4030, "valid_targets_mean": 2190.1, "valid_targets_min": 771 }, { "epoch": 3.9442815249266863, "grad_norm": 0.6272342072403345, "learning_rate": 1.9074039059336654e-05, "loss": 0.2031, "loss_nan_ranks": 0, "loss_rank_avg": 0.19984391331672668, "step": 4035, "valid_targets_mean": 2838.1, "valid_targets_min": 614 }, { "epoch": 3.949169110459433, "grad_norm": 0.6758572832963811, "learning_rate": 1.902534192326423e-05, "loss": 0.2128, "loss_nan_ranks": 0, "loss_rank_avg": 0.21952173113822937, "step": 4040, "valid_targets_mean": 2742.6, "valid_targets_min": 1552 }, { "epoch": 3.95405669599218, "grad_norm": 0.6455921997950347, "learning_rate": 1.8976650578554475e-05, "loss": 0.1943, "loss_nan_ranks": 0, "loss_rank_avg": 0.17914989590644836, "step": 4045, "valid_targets_mean": 2462.2, "valid_targets_min": 1012 }, { "epoch": 3.9589442815249267, "grad_norm": 0.7064643550905159, "learning_rate": 1.892796531452857e-05, "loss": 0.2141, "loss_nan_ranks": 0, "loss_rank_avg": 0.22437229752540588, "step": 4050, "valid_targets_mean": 2798.8, "valid_targets_min": 572 }, { "epoch": 3.9638318670576735, "grad_norm": 0.7269435964183898, "learning_rate": 1.8879286420471562e-05, "loss": 0.2105, "loss_nan_ranks": 0, "loss_rank_avg": 0.22988593578338623, "step": 4055, "valid_targets_mean": 2328.2, "valid_targets_min": 584 }, { "epoch": 3.9687194525904204, "grad_norm": 0.6243634215768921, "learning_rate": 1.8830614185630686e-05, "loss": 0.2017, "loss_nan_ranks": 0, "loss_rank_avg": 0.19760319590568542, "step": 4060, "valid_targets_mean": 3104.0, "valid_targets_min": 665 }, { "epoch": 3.973607038123167, "grad_norm": 0.7229402835170321, "learning_rate": 1.8781948899213563e-05, "loss": 0.2103, "loss_nan_ranks": 0, "loss_rank_avg": 0.19763663411140442, "step": 4065, "valid_targets_mean": 2293.1, "valid_targets_min": 1080 }, { "epoch": 3.978494623655914, "grad_norm": 0.7692945667783568, "learning_rate": 1.8733290850386556e-05, "loss": 0.2011, "loss_nan_ranks": 0, "loss_rank_avg": 0.2350245714187622, "step": 4070, "valid_targets_mean": 2153.9, "valid_targets_min": 522 }, { "epoch": 3.983382209188661, "grad_norm": 0.7485634972600307, "learning_rate": 1.8684640328273013e-05, "loss": 0.1962, "loss_nan_ranks": 0, "loss_rank_avg": 0.2132551074028015, "step": 4075, "valid_targets_mean": 2146.8, "valid_targets_min": 533 }, { "epoch": 3.9882697947214076, "grad_norm": 0.7868285556946475, "learning_rate": 1.8635997621951554e-05, "loss": 0.2055, "loss_nan_ranks": 0, "loss_rank_avg": 0.21789923310279846, "step": 4080, "valid_targets_mean": 1982.0, "valid_targets_min": 1146 }, { "epoch": 3.9931573802541545, "grad_norm": 0.6520687750578001, "learning_rate": 1.858736302045438e-05, "loss": 0.2106, "loss_nan_ranks": 0, "loss_rank_avg": 0.2020658552646637, "step": 4085, "valid_targets_mean": 2626.5, "valid_targets_min": 1214 }, { "epoch": 3.9980449657869013, "grad_norm": 0.6705009639669899, "learning_rate": 1.8538736812765495e-05, "loss": 0.2127, "loss_nan_ranks": 0, "loss_rank_avg": 0.2510734796524048, "step": 4090, "valid_targets_mean": 2900.7, "valid_targets_min": 823 }, { "epoch": 4.002932551319648, "grad_norm": 0.6983984686970028, "learning_rate": 1.8490119287819058e-05, "loss": 0.1852, "loss_nan_ranks": 0, "loss_rank_avg": 0.1645195633172989, "step": 4095, "valid_targets_mean": 2202.6, "valid_targets_min": 706 }, { "epoch": 4.007820136852395, "grad_norm": 0.7590415869647605, "learning_rate": 1.844151073449763e-05, "loss": 0.1727, "loss_nan_ranks": 0, "loss_rank_avg": 0.1695270985364914, "step": 4100, "valid_targets_mean": 2045.4, "valid_targets_min": 484 }, { "epoch": 4.012707722385142, "grad_norm": 0.8500063167328339, "learning_rate": 1.8392911441630458e-05, "loss": 0.1865, "loss_nan_ranks": 0, "loss_rank_avg": 0.1960211545228958, "step": 4105, "valid_targets_mean": 1932.2, "valid_targets_min": 886 }, { "epoch": 4.0175953079178885, "grad_norm": 0.6876315958843118, "learning_rate": 1.8344321697991775e-05, "loss": 0.1755, "loss_nan_ranks": 0, "loss_rank_avg": 0.17042392492294312, "step": 4110, "valid_targets_mean": 2488.9, "valid_targets_min": 984 }, { "epoch": 4.022482893450635, "grad_norm": 0.6267560608434691, "learning_rate": 1.8295741792299054e-05, "loss": 0.1857, "loss_nan_ranks": 0, "loss_rank_avg": 0.1570637822151184, "step": 4115, "valid_targets_mean": 2911.5, "valid_targets_min": 998 }, { "epoch": 4.027370478983382, "grad_norm": 0.6860515522522642, "learning_rate": 1.8247172013211316e-05, "loss": 0.17, "loss_nan_ranks": 0, "loss_rank_avg": 0.17035432159900665, "step": 4120, "valid_targets_mean": 2804.3, "valid_targets_min": 1062 }, { "epoch": 4.032258064516129, "grad_norm": 0.658990742688263, "learning_rate": 1.819861264932743e-05, "loss": 0.1688, "loss_nan_ranks": 0, "loss_rank_avg": 0.1729648858308792, "step": 4125, "valid_targets_mean": 3242.4, "valid_targets_min": 952 }, { "epoch": 4.037145650048876, "grad_norm": 0.8278627891112406, "learning_rate": 1.815006398918435e-05, "loss": 0.1708, "loss_nan_ranks": 0, "loss_rank_avg": 0.17281252145767212, "step": 4130, "valid_targets_mean": 1954.6, "valid_targets_min": 746 }, { "epoch": 4.042033235581623, "grad_norm": 0.7070945916212567, "learning_rate": 1.8101526321255464e-05, "loss": 0.1886, "loss_nan_ranks": 0, "loss_rank_avg": 0.18609067797660828, "step": 4135, "valid_targets_mean": 2809.1, "valid_targets_min": 725 }, { "epoch": 4.0469208211143695, "grad_norm": 0.732269604211766, "learning_rate": 1.805299993394881e-05, "loss": 0.1709, "loss_nan_ranks": 0, "loss_rank_avg": 0.1601986289024353, "step": 4140, "valid_targets_mean": 2153.6, "valid_targets_min": 895 }, { "epoch": 4.051808406647116, "grad_norm": 0.7644694368274649, "learning_rate": 1.8004485115605407e-05, "loss": 0.1766, "loss_nan_ranks": 0, "loss_rank_avg": 0.17084315419197083, "step": 4145, "valid_targets_mean": 2271.1, "valid_targets_min": 900 }, { "epoch": 4.056695992179863, "grad_norm": 0.680277205771116, "learning_rate": 1.7955982154497545e-05, "loss": 0.1626, "loss_nan_ranks": 0, "loss_rank_avg": 0.18231913447380066, "step": 4150, "valid_targets_mean": 2801.8, "valid_targets_min": 1152 }, { "epoch": 4.06158357771261, "grad_norm": 0.7619020216747033, "learning_rate": 1.7907491338827053e-05, "loss": 0.1757, "loss_nan_ranks": 0, "loss_rank_avg": 0.17396214604377747, "step": 4155, "valid_targets_mean": 2283.8, "valid_targets_min": 649 }, { "epoch": 4.066471163245357, "grad_norm": 0.7954884604214785, "learning_rate": 1.7859012956723577e-05, "loss": 0.1683, "loss_nan_ranks": 0, "loss_rank_avg": 0.17803660035133362, "step": 4160, "valid_targets_mean": 2164.9, "valid_targets_min": 784 }, { "epoch": 4.0713587487781036, "grad_norm": 0.70348085226897, "learning_rate": 1.781054729624291e-05, "loss": 0.1718, "loss_nan_ranks": 0, "loss_rank_avg": 0.16010019183158875, "step": 4165, "valid_targets_mean": 2553.6, "valid_targets_min": 843 }, { "epoch": 4.07624633431085, "grad_norm": 1.026152425313603, "learning_rate": 1.7762094645365225e-05, "loss": 0.1763, "loss_nan_ranks": 0, "loss_rank_avg": 0.18153509497642517, "step": 4170, "valid_targets_mean": 2432.5, "valid_targets_min": 615 }, { "epoch": 4.081133919843597, "grad_norm": 0.7254831762036433, "learning_rate": 1.7713655291993426e-05, "loss": 0.1757, "loss_nan_ranks": 0, "loss_rank_avg": 0.20568543672561646, "step": 4175, "valid_targets_mean": 2840.9, "valid_targets_min": 881 }, { "epoch": 4.086021505376344, "grad_norm": 0.697671859067687, "learning_rate": 1.766522952395138e-05, "loss": 0.1728, "loss_nan_ranks": 0, "loss_rank_avg": 0.19269169867038727, "step": 4180, "valid_targets_mean": 3086.3, "valid_targets_min": 746 }, { "epoch": 4.090909090909091, "grad_norm": 0.7479636389963256, "learning_rate": 1.7616817628982225e-05, "loss": 0.1604, "loss_nan_ranks": 0, "loss_rank_avg": 0.16542398929595947, "step": 4185, "valid_targets_mean": 2449.9, "valid_targets_min": 1025 }, { "epoch": 4.095796676441838, "grad_norm": 0.8012001808352684, "learning_rate": 1.7568419894746694e-05, "loss": 0.1683, "loss_nan_ranks": 0, "loss_rank_avg": 0.15177610516548157, "step": 4190, "valid_targets_mean": 1801.7, "valid_targets_min": 567 }, { "epoch": 4.1006842619745845, "grad_norm": 0.6599199969261322, "learning_rate": 1.7520036608821343e-05, "loss": 0.1764, "loss_nan_ranks": 0, "loss_rank_avg": 0.16316524147987366, "step": 4195, "valid_targets_mean": 2802.2, "valid_targets_min": 607 }, { "epoch": 4.105571847507331, "grad_norm": 0.660475255360126, "learning_rate": 1.7471668058696917e-05, "loss": 0.1701, "loss_nan_ranks": 0, "loss_rank_avg": 0.16640618443489075, "step": 4200, "valid_targets_mean": 2976.4, "valid_targets_min": 821 }, { "epoch": 4.110459433040078, "grad_norm": 0.7767208027973069, "learning_rate": 1.7423314531776566e-05, "loss": 0.1769, "loss_nan_ranks": 0, "loss_rank_avg": 0.16882777214050293, "step": 4205, "valid_targets_mean": 2222.6, "valid_targets_min": 627 }, { "epoch": 4.115347018572825, "grad_norm": 0.6976329404563815, "learning_rate": 1.737497631537418e-05, "loss": 0.172, "loss_nan_ranks": 0, "loss_rank_avg": 0.17232577502727509, "step": 4210, "valid_targets_mean": 2611.0, "valid_targets_min": 869 }, { "epoch": 4.120234604105572, "grad_norm": 0.8087989717723046, "learning_rate": 1.7326653696712706e-05, "loss": 0.1716, "loss_nan_ranks": 0, "loss_rank_avg": 0.1771789789199829, "step": 4215, "valid_targets_mean": 2261.4, "valid_targets_min": 551 }, { "epoch": 4.125122189638319, "grad_norm": 0.7223726297736563, "learning_rate": 1.7278346962922365e-05, "loss": 0.1703, "loss_nan_ranks": 0, "loss_rank_avg": 0.17196297645568848, "step": 4220, "valid_targets_mean": 2553.8, "valid_targets_min": 791 }, { "epoch": 4.130009775171065, "grad_norm": 0.8038120785795847, "learning_rate": 1.7230056401039014e-05, "loss": 0.1663, "loss_nan_ranks": 0, "loss_rank_avg": 0.1827443540096283, "step": 4225, "valid_targets_mean": 1950.0, "valid_targets_min": 744 }, { "epoch": 4.134897360703812, "grad_norm": 0.8507666081146841, "learning_rate": 1.7181782298002426e-05, "loss": 0.1919, "loss_nan_ranks": 0, "loss_rank_avg": 0.1930236965417862, "step": 4230, "valid_targets_mean": 1955.8, "valid_targets_min": 837 }, { "epoch": 4.139784946236559, "grad_norm": 0.72829350980729, "learning_rate": 1.713352494065455e-05, "loss": 0.1802, "loss_nan_ranks": 0, "loss_rank_avg": 0.1770409643650055, "step": 4235, "valid_targets_mean": 2629.4, "valid_targets_min": 728 }, { "epoch": 4.144672531769306, "grad_norm": 0.8739112255295849, "learning_rate": 1.708528461573787e-05, "loss": 0.1755, "loss_nan_ranks": 0, "loss_rank_avg": 0.17912176251411438, "step": 4240, "valid_targets_mean": 1731.5, "valid_targets_min": 829 }, { "epoch": 4.149560117302053, "grad_norm": 0.6736533471138151, "learning_rate": 1.703706160989362e-05, "loss": 0.173, "loss_nan_ranks": 0, "loss_rank_avg": 0.17516711354255676, "step": 4245, "valid_targets_mean": 3023.8, "valid_targets_min": 726 }, { "epoch": 4.1544477028347995, "grad_norm": 0.7146049815510215, "learning_rate": 1.6988856209660162e-05, "loss": 0.1901, "loss_nan_ranks": 0, "loss_rank_avg": 0.18740811944007874, "step": 4250, "valid_targets_mean": 3117.8, "valid_targets_min": 895 }, { "epoch": 4.159335288367546, "grad_norm": 0.8287505524072367, "learning_rate": 1.694066870147123e-05, "loss": 0.165, "loss_nan_ranks": 0, "loss_rank_avg": 0.17309562861919403, "step": 4255, "valid_targets_mean": 2429.8, "valid_targets_min": 613 }, { "epoch": 4.164222873900293, "grad_norm": 0.8384682014231488, "learning_rate": 1.689249937165425e-05, "loss": 0.1742, "loss_nan_ranks": 0, "loss_rank_avg": 0.17695944011211395, "step": 4260, "valid_targets_mean": 1893.6, "valid_targets_min": 622 }, { "epoch": 4.16911045943304, "grad_norm": 0.8023347194519758, "learning_rate": 1.6844348506428624e-05, "loss": 0.1709, "loss_nan_ranks": 0, "loss_rank_avg": 0.1862003207206726, "step": 4265, "valid_targets_mean": 2379.9, "valid_targets_min": 996 }, { "epoch": 4.173998044965787, "grad_norm": 0.7189754762701044, "learning_rate": 1.679621639190405e-05, "loss": 0.182, "loss_nan_ranks": 0, "loss_rank_avg": 0.18278726935386658, "step": 4270, "valid_targets_mean": 2820.7, "valid_targets_min": 981 }, { "epoch": 4.178885630498534, "grad_norm": 0.7689815704124234, "learning_rate": 1.6748103314078795e-05, "loss": 0.1737, "loss_nan_ranks": 0, "loss_rank_avg": 0.15576958656311035, "step": 4275, "valid_targets_mean": 2550.9, "valid_targets_min": 830 }, { "epoch": 4.18377321603128, "grad_norm": 0.7790069715413338, "learning_rate": 1.6700009558838034e-05, "loss": 0.1785, "loss_nan_ranks": 0, "loss_rank_avg": 0.1859605610370636, "step": 4280, "valid_targets_mean": 2325.7, "valid_targets_min": 765 }, { "epoch": 4.188660801564027, "grad_norm": 0.7059772286515155, "learning_rate": 1.6651935411952117e-05, "loss": 0.1878, "loss_nan_ranks": 0, "loss_rank_avg": 0.18116068840026855, "step": 4285, "valid_targets_mean": 2637.1, "valid_targets_min": 981 }, { "epoch": 4.193548387096774, "grad_norm": 0.8478026456180225, "learning_rate": 1.6603881159074864e-05, "loss": 0.1696, "loss_nan_ranks": 0, "loss_rank_avg": 0.1635878086090088, "step": 4290, "valid_targets_mean": 2021.2, "valid_targets_min": 728 }, { "epoch": 4.198435972629521, "grad_norm": 0.7892671310342947, "learning_rate": 1.655584708574192e-05, "loss": 0.1728, "loss_nan_ranks": 0, "loss_rank_avg": 0.16756808757781982, "step": 4295, "valid_targets_mean": 2019.6, "valid_targets_min": 694 }, { "epoch": 4.203323558162268, "grad_norm": 0.7866619457000387, "learning_rate": 1.6507833477368994e-05, "loss": 0.1628, "loss_nan_ranks": 0, "loss_rank_avg": 0.1662808358669281, "step": 4300, "valid_targets_mean": 2019.4, "valid_targets_min": 824 }, { "epoch": 4.2082111436950145, "grad_norm": 0.8459519999111245, "learning_rate": 1.6459840619250217e-05, "loss": 0.1865, "loss_nan_ranks": 0, "loss_rank_avg": 0.1930123269557953, "step": 4305, "valid_targets_mean": 2161.1, "valid_targets_min": 817 }, { "epoch": 4.213098729227761, "grad_norm": 0.8021367267841367, "learning_rate": 1.6411868796556408e-05, "loss": 0.1787, "loss_nan_ranks": 0, "loss_rank_avg": 0.18006908893585205, "step": 4310, "valid_targets_mean": 2118.6, "valid_targets_min": 572 }, { "epoch": 4.217986314760508, "grad_norm": 0.8090359446901784, "learning_rate": 1.6363918294333395e-05, "loss": 0.162, "loss_nan_ranks": 0, "loss_rank_avg": 0.15488529205322266, "step": 4315, "valid_targets_mean": 1977.8, "valid_targets_min": 727 }, { "epoch": 4.222873900293255, "grad_norm": 0.6855591904703289, "learning_rate": 1.6315989397500332e-05, "loss": 0.1668, "loss_nan_ranks": 0, "loss_rank_avg": 0.16280516982078552, "step": 4320, "valid_targets_mean": 3256.6, "valid_targets_min": 958 }, { "epoch": 4.227761485826002, "grad_norm": 0.809105744787128, "learning_rate": 1.6268082390847983e-05, "loss": 0.1685, "loss_nan_ranks": 0, "loss_rank_avg": 0.15723910927772522, "step": 4325, "valid_targets_mean": 1953.2, "valid_targets_min": 746 }, { "epoch": 4.232649071358749, "grad_norm": 0.7131155432880343, "learning_rate": 1.6220197559037045e-05, "loss": 0.1744, "loss_nan_ranks": 0, "loss_rank_avg": 0.18179753422737122, "step": 4330, "valid_targets_mean": 2626.1, "valid_targets_min": 1086 }, { "epoch": 4.237536656891495, "grad_norm": 0.7455797655769655, "learning_rate": 1.617233518659647e-05, "loss": 0.1711, "loss_nan_ranks": 0, "loss_rank_avg": 0.16530537605285645, "step": 4335, "valid_targets_mean": 2392.8, "valid_targets_min": 770 }, { "epoch": 4.242424242424242, "grad_norm": 0.7439354451578698, "learning_rate": 1.6124495557921725e-05, "loss": 0.1703, "loss_nan_ranks": 0, "loss_rank_avg": 0.173561230301857, "step": 4340, "valid_targets_mean": 2214.4, "valid_targets_min": 671 }, { "epoch": 4.247311827956989, "grad_norm": 0.7373073806467637, "learning_rate": 1.6076678957273162e-05, "loss": 0.2026, "loss_nan_ranks": 0, "loss_rank_avg": 0.17753678560256958, "step": 4345, "valid_targets_mean": 2657.6, "valid_targets_min": 734 }, { "epoch": 4.252199413489736, "grad_norm": 0.7000837897806548, "learning_rate": 1.602888566877429e-05, "loss": 0.1781, "loss_nan_ranks": 0, "loss_rank_avg": 0.17242294549942017, "step": 4350, "valid_targets_mean": 2792.0, "valid_targets_min": 770 }, { "epoch": 4.257086999022483, "grad_norm": 0.7271682426991912, "learning_rate": 1.59811159764101e-05, "loss": 0.1721, "loss_nan_ranks": 0, "loss_rank_avg": 0.16193613409996033, "step": 4355, "valid_targets_mean": 2416.5, "valid_targets_min": 907 }, { "epoch": 4.2619745845552295, "grad_norm": 0.7944206346753406, "learning_rate": 1.593337016402539e-05, "loss": 0.1729, "loss_nan_ranks": 0, "loss_rank_avg": 0.17991730570793152, "step": 4360, "valid_targets_mean": 2064.8, "valid_targets_min": 655 }, { "epoch": 4.266862170087976, "grad_norm": 0.7010001037382477, "learning_rate": 1.5885648515323028e-05, "loss": 0.1805, "loss_nan_ranks": 0, "loss_rank_avg": 0.16409370303153992, "step": 4365, "valid_targets_mean": 2635.2, "valid_targets_min": 930 }, { "epoch": 4.271749755620723, "grad_norm": 0.6568280133407176, "learning_rate": 1.5837951313862352e-05, "loss": 0.184, "loss_nan_ranks": 0, "loss_rank_avg": 0.18202292919158936, "step": 4370, "valid_targets_mean": 3231.6, "valid_targets_min": 671 }, { "epoch": 4.27663734115347, "grad_norm": 0.8085208993831905, "learning_rate": 1.5790278843057395e-05, "loss": 0.1794, "loss_nan_ranks": 0, "loss_rank_avg": 0.18638502061367035, "step": 4375, "valid_targets_mean": 2588.2, "valid_targets_min": 665 }, { "epoch": 4.281524926686217, "grad_norm": 0.8087448136164485, "learning_rate": 1.5742631386175255e-05, "loss": 0.1752, "loss_nan_ranks": 0, "loss_rank_avg": 0.17984755337238312, "step": 4380, "valid_targets_mean": 2140.7, "valid_targets_min": 701 }, { "epoch": 4.286412512218964, "grad_norm": 0.7073051473557163, "learning_rate": 1.569500922633442e-05, "loss": 0.169, "loss_nan_ranks": 0, "loss_rank_avg": 0.16911262273788452, "step": 4385, "valid_targets_mean": 2626.2, "valid_targets_min": 694 }, { "epoch": 4.29130009775171, "grad_norm": 0.7422208850214889, "learning_rate": 1.5647412646503025e-05, "loss": 0.1685, "loss_nan_ranks": 0, "loss_rank_avg": 0.17553281784057617, "step": 4390, "valid_targets_mean": 2183.2, "valid_targets_min": 1272 }, { "epoch": 4.296187683284457, "grad_norm": 0.7592007757916336, "learning_rate": 1.5599841929497234e-05, "loss": 0.1819, "loss_nan_ranks": 0, "loss_rank_avg": 0.17773813009262085, "step": 4395, "valid_targets_mean": 2256.4, "valid_targets_min": 771 }, { "epoch": 4.301075268817204, "grad_norm": 0.7553316641615674, "learning_rate": 1.555229735797954e-05, "loss": 0.1887, "loss_nan_ranks": 0, "loss_rank_avg": 0.18115384876728058, "step": 4400, "valid_targets_mean": 2220.1, "valid_targets_min": 733 }, { "epoch": 4.305962854349951, "grad_norm": 0.7811092431468514, "learning_rate": 1.5504779214457064e-05, "loss": 0.1695, "loss_nan_ranks": 0, "loss_rank_avg": 0.17034941911697388, "step": 4405, "valid_targets_mean": 1985.4, "valid_targets_min": 872 }, { "epoch": 4.310850439882698, "grad_norm": 0.6751967572463863, "learning_rate": 1.5457287781279914e-05, "loss": 0.1739, "loss_nan_ranks": 0, "loss_rank_avg": 0.1524028480052948, "step": 4410, "valid_targets_mean": 2459.4, "valid_targets_min": 768 }, { "epoch": 4.3157380254154445, "grad_norm": 0.7006365562513612, "learning_rate": 1.5409823340639472e-05, "loss": 0.174, "loss_nan_ranks": 0, "loss_rank_avg": 0.1530303657054901, "step": 4415, "valid_targets_mean": 2240.3, "valid_targets_min": 809 }, { "epoch": 4.320625610948191, "grad_norm": 0.8127996699553531, "learning_rate": 1.5362386174566727e-05, "loss": 0.1674, "loss_nan_ranks": 0, "loss_rank_avg": 0.1497165858745575, "step": 4420, "valid_targets_mean": 1762.8, "valid_targets_min": 672 }, { "epoch": 4.325513196480938, "grad_norm": 0.7509544790056238, "learning_rate": 1.5314976564930616e-05, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.215011328458786, "step": 4425, "valid_targets_mean": 2781.2, "valid_targets_min": 870 }, { "epoch": 4.330400782013685, "grad_norm": 0.7344537959086179, "learning_rate": 1.526759479343634e-05, "loss": 0.1755, "loss_nan_ranks": 0, "loss_rank_avg": 0.1870063692331314, "step": 4430, "valid_targets_mean": 2725.8, "valid_targets_min": 1240 }, { "epoch": 4.335288367546432, "grad_norm": 0.672200316438301, "learning_rate": 1.5220241141623666e-05, "loss": 0.1661, "loss_nan_ranks": 0, "loss_rank_avg": 0.1690032184123993, "step": 4435, "valid_targets_mean": 3031.5, "valid_targets_min": 1266 }, { "epoch": 4.340175953079179, "grad_norm": 0.6666959910156269, "learning_rate": 1.517291589086531e-05, "loss": 0.1752, "loss_nan_ranks": 0, "loss_rank_avg": 0.15352541208267212, "step": 4440, "valid_targets_mean": 2541.2, "valid_targets_min": 749 }, { "epoch": 4.345063538611925, "grad_norm": 0.7100554914799727, "learning_rate": 1.512561932236519e-05, "loss": 0.1779, "loss_nan_ranks": 0, "loss_rank_avg": 0.16762804985046387, "step": 4445, "valid_targets_mean": 2549.6, "valid_targets_min": 978 }, { "epoch": 4.349951124144672, "grad_norm": 0.7579351582413887, "learning_rate": 1.507835171715683e-05, "loss": 0.1772, "loss_nan_ranks": 0, "loss_rank_avg": 0.19213947653770447, "step": 4450, "valid_targets_mean": 2302.4, "valid_targets_min": 893 }, { "epoch": 4.354838709677419, "grad_norm": 0.7076551024584983, "learning_rate": 1.503111335610164e-05, "loss": 0.1774, "loss_nan_ranks": 0, "loss_rank_avg": 0.16405513882637024, "step": 4455, "valid_targets_mean": 2656.4, "valid_targets_min": 662 }, { "epoch": 4.359726295210166, "grad_norm": 0.6577102500804493, "learning_rate": 1.4983904519887257e-05, "loss": 0.1773, "loss_nan_ranks": 0, "loss_rank_avg": 0.18623942136764526, "step": 4460, "valid_targets_mean": 3397.5, "valid_targets_min": 869 }, { "epoch": 4.364613880742913, "grad_norm": 0.8364738050383415, "learning_rate": 1.4936725489025907e-05, "loss": 0.1783, "loss_nan_ranks": 0, "loss_rank_avg": 0.18252325057983398, "step": 4465, "valid_targets_mean": 2765.1, "valid_targets_min": 740 }, { "epoch": 4.3695014662756595, "grad_norm": 0.7332207981929358, "learning_rate": 1.4889576543852679e-05, "loss": 0.1773, "loss_nan_ranks": 0, "loss_rank_avg": 0.18655236065387726, "step": 4470, "valid_targets_mean": 2426.7, "valid_targets_min": 759 }, { "epoch": 4.374389051808406, "grad_norm": 0.7291042324534501, "learning_rate": 1.4842457964523932e-05, "loss": 0.1743, "loss_nan_ranks": 0, "loss_rank_avg": 0.1768685281276703, "step": 4475, "valid_targets_mean": 2585.4, "valid_targets_min": 776 }, { "epoch": 4.379276637341153, "grad_norm": 0.7241032428052671, "learning_rate": 1.4795370031015562e-05, "loss": 0.1686, "loss_nan_ranks": 0, "loss_rank_avg": 0.15364965796470642, "step": 4480, "valid_targets_mean": 2301.1, "valid_targets_min": 968 }, { "epoch": 4.3841642228739, "grad_norm": 0.8029472975208416, "learning_rate": 1.4748313023121385e-05, "loss": 0.1766, "loss_nan_ranks": 0, "loss_rank_avg": 0.17943759262561798, "step": 4485, "valid_targets_mean": 2096.1, "valid_targets_min": 698 }, { "epoch": 4.389051808406647, "grad_norm": 0.7738811474250595, "learning_rate": 1.4701287220451463e-05, "loss": 0.182, "loss_nan_ranks": 0, "loss_rank_avg": 0.18864920735359192, "step": 4490, "valid_targets_mean": 2364.0, "valid_targets_min": 761 }, { "epoch": 4.393939393939394, "grad_norm": 0.8073103577600892, "learning_rate": 1.4654292902430424e-05, "loss": 0.1742, "loss_nan_ranks": 0, "loss_rank_avg": 0.1911054402589798, "step": 4495, "valid_targets_mean": 2996.8, "valid_targets_min": 912 }, { "epoch": 4.39882697947214, "grad_norm": 0.7781332848101631, "learning_rate": 1.4607330348295821e-05, "loss": 0.1762, "loss_nan_ranks": 0, "loss_rank_avg": 0.20065414905548096, "step": 4500, "valid_targets_mean": 2334.9, "valid_targets_min": 620 }, { "epoch": 4.403714565004887, "grad_norm": 0.8238449326675337, "learning_rate": 1.4560399837096478e-05, "loss": 0.1629, "loss_nan_ranks": 0, "loss_rank_avg": 0.1719534993171692, "step": 4505, "valid_targets_mean": 1942.7, "valid_targets_min": 1107 }, { "epoch": 4.408602150537634, "grad_norm": 0.7909535037694309, "learning_rate": 1.4513501647690804e-05, "loss": 0.1696, "loss_nan_ranks": 0, "loss_rank_avg": 0.15581440925598145, "step": 4510, "valid_targets_mean": 2048.7, "valid_targets_min": 680 }, { "epoch": 4.413489736070381, "grad_norm": 0.667844663877056, "learning_rate": 1.4466636058745179e-05, "loss": 0.1826, "loss_nan_ranks": 0, "loss_rank_avg": 0.16047389805316925, "step": 4515, "valid_targets_mean": 2790.1, "valid_targets_min": 697 }, { "epoch": 4.418377321603128, "grad_norm": 0.7179178500193523, "learning_rate": 1.4419803348732245e-05, "loss": 0.1828, "loss_nan_ranks": 0, "loss_rank_avg": 0.16572578251361847, "step": 4520, "valid_targets_mean": 2572.5, "valid_targets_min": 923 }, { "epoch": 4.4232649071358745, "grad_norm": 0.7482497307829565, "learning_rate": 1.4373003795929287e-05, "loss": 0.1781, "loss_nan_ranks": 0, "loss_rank_avg": 0.17924658954143524, "step": 4525, "valid_targets_mean": 2537.1, "valid_targets_min": 1124 }, { "epoch": 4.428152492668621, "grad_norm": 0.7983711495940576, "learning_rate": 1.4326237678416588e-05, "loss": 0.1709, "loss_nan_ranks": 0, "loss_rank_avg": 0.15910127758979797, "step": 4530, "valid_targets_mean": 2120.4, "valid_targets_min": 865 }, { "epoch": 4.433040078201368, "grad_norm": 0.7219070798034924, "learning_rate": 1.4279505274075743e-05, "loss": 0.165, "loss_nan_ranks": 0, "loss_rank_avg": 0.17049354314804077, "step": 4535, "valid_targets_mean": 2468.0, "valid_targets_min": 1040 }, { "epoch": 4.437927663734115, "grad_norm": 0.6820006015545326, "learning_rate": 1.423280686058804e-05, "loss": 0.1751, "loss_nan_ranks": 0, "loss_rank_avg": 0.17498445510864258, "step": 4540, "valid_targets_mean": 2878.1, "valid_targets_min": 814 }, { "epoch": 4.442815249266862, "grad_norm": 0.7956975533298152, "learning_rate": 1.4186142715432775e-05, "loss": 0.1618, "loss_nan_ranks": 0, "loss_rank_avg": 0.15380510687828064, "step": 4545, "valid_targets_mean": 1974.9, "valid_targets_min": 788 }, { "epoch": 4.447702834799609, "grad_norm": 0.6688865610533883, "learning_rate": 1.4139513115885635e-05, "loss": 0.1774, "loss_nan_ranks": 0, "loss_rank_avg": 0.18294396996498108, "step": 4550, "valid_targets_mean": 3151.7, "valid_targets_min": 1199 }, { "epoch": 4.452590420332355, "grad_norm": 0.7510655980124383, "learning_rate": 1.4092918339017046e-05, "loss": 0.188, "loss_nan_ranks": 0, "loss_rank_avg": 0.17913363873958588, "step": 4555, "valid_targets_mean": 2332.2, "valid_targets_min": 875 }, { "epoch": 4.457478005865102, "grad_norm": 0.7147653866732739, "learning_rate": 1.4046358661690515e-05, "loss": 0.1765, "loss_nan_ranks": 0, "loss_rank_avg": 0.15671703219413757, "step": 4560, "valid_targets_mean": 2355.0, "valid_targets_min": 648 }, { "epoch": 4.462365591397849, "grad_norm": 0.8146269315094486, "learning_rate": 1.3999834360560969e-05, "loss": 0.1769, "loss_nan_ranks": 0, "loss_rank_avg": 0.18449649214744568, "step": 4565, "valid_targets_mean": 2228.4, "valid_targets_min": 798 }, { "epoch": 4.467253176930596, "grad_norm": 0.8549012646003764, "learning_rate": 1.3953345712073172e-05, "loss": 0.1818, "loss_nan_ranks": 0, "loss_rank_avg": 0.20259252190589905, "step": 4570, "valid_targets_mean": 1910.8, "valid_targets_min": 698 }, { "epoch": 4.472140762463344, "grad_norm": 0.6930221111338045, "learning_rate": 1.3906892992460004e-05, "loss": 0.1805, "loss_nan_ranks": 0, "loss_rank_avg": 0.19013884663581848, "step": 4575, "valid_targets_mean": 2861.4, "valid_targets_min": 1011 }, { "epoch": 4.4770283479960895, "grad_norm": 0.8136412327729154, "learning_rate": 1.3860476477740883e-05, "loss": 0.1672, "loss_nan_ranks": 0, "loss_rank_avg": 0.1534624695777893, "step": 4580, "valid_targets_mean": 1744.6, "valid_targets_min": 650 }, { "epoch": 4.481915933528837, "grad_norm": 0.7069363998150793, "learning_rate": 1.3814096443720091e-05, "loss": 0.1769, "loss_nan_ranks": 0, "loss_rank_avg": 0.16891230642795563, "step": 4585, "valid_targets_mean": 2515.7, "valid_targets_min": 696 }, { "epoch": 4.486803519061583, "grad_norm": 0.801344597413106, "learning_rate": 1.3767753165985126e-05, "loss": 0.1663, "loss_nan_ranks": 0, "loss_rank_avg": 0.14025087654590607, "step": 4590, "valid_targets_mean": 1840.0, "valid_targets_min": 818 }, { "epoch": 4.491691104594331, "grad_norm": 0.7759235567696053, "learning_rate": 1.3721446919905121e-05, "loss": 0.1697, "loss_nan_ranks": 0, "loss_rank_avg": 0.16802477836608887, "step": 4595, "valid_targets_mean": 2318.0, "valid_targets_min": 698 }, { "epoch": 4.496578690127077, "grad_norm": 0.7746563734745292, "learning_rate": 1.3675177980629135e-05, "loss": 0.161, "loss_nan_ranks": 0, "loss_rank_avg": 0.17537719011306763, "step": 4600, "valid_targets_mean": 2127.3, "valid_targets_min": 625 }, { "epoch": 4.5014662756598245, "grad_norm": 0.692029862169816, "learning_rate": 1.3628946623084563e-05, "loss": 0.1765, "loss_nan_ranks": 0, "loss_rank_avg": 0.1666170358657837, "step": 4605, "valid_targets_mean": 2804.1, "valid_targets_min": 1352 }, { "epoch": 4.50635386119257, "grad_norm": 0.7747220358157921, "learning_rate": 1.3582753121975502e-05, "loss": 0.1754, "loss_nan_ranks": 0, "loss_rank_avg": 0.16754350066184998, "step": 4610, "valid_targets_mean": 2106.8, "valid_targets_min": 1041 }, { "epoch": 4.511241446725318, "grad_norm": 0.794400474753371, "learning_rate": 1.3536597751781082e-05, "loss": 0.1706, "loss_nan_ranks": 0, "loss_rank_avg": 0.15418118238449097, "step": 4615, "valid_targets_mean": 2122.1, "valid_targets_min": 623 }, { "epoch": 4.516129032258064, "grad_norm": 0.8630490069683876, "learning_rate": 1.3490480786753901e-05, "loss": 0.1765, "loss_nan_ranks": 0, "loss_rank_avg": 0.1692330241203308, "step": 4620, "valid_targets_mean": 1878.2, "valid_targets_min": 864 }, { "epoch": 4.521016617790812, "grad_norm": 0.6949929703480787, "learning_rate": 1.3444402500918314e-05, "loss": 0.1747, "loss_nan_ranks": 0, "loss_rank_avg": 0.19203145802021027, "step": 4625, "valid_targets_mean": 2929.6, "valid_targets_min": 1109 }, { "epoch": 4.525904203323558, "grad_norm": 0.7212230561742061, "learning_rate": 1.3398363168068871e-05, "loss": 0.1655, "loss_nan_ranks": 0, "loss_rank_avg": 0.1773679554462433, "step": 4630, "valid_targets_mean": 3018.6, "valid_targets_min": 852 }, { "epoch": 4.530791788856305, "grad_norm": 0.7491901926461985, "learning_rate": 1.3352363061768668e-05, "loss": 0.1865, "loss_nan_ranks": 0, "loss_rank_avg": 0.19477087259292603, "step": 4635, "valid_targets_mean": 2341.3, "valid_targets_min": 548 }, { "epoch": 4.535679374389051, "grad_norm": 0.7218327291631365, "learning_rate": 1.3306402455347693e-05, "loss": 0.1749, "loss_nan_ranks": 0, "loss_rank_avg": 0.15920904278755188, "step": 4640, "valid_targets_mean": 2138.7, "valid_targets_min": 749 }, { "epoch": 4.540566959921799, "grad_norm": 0.7886843070822219, "learning_rate": 1.3260481621901269e-05, "loss": 0.1691, "loss_nan_ranks": 0, "loss_rank_avg": 0.20281338691711426, "step": 4645, "valid_targets_mean": 2345.5, "valid_targets_min": 700 }, { "epoch": 4.545454545454545, "grad_norm": 0.7254460885818595, "learning_rate": 1.3214600834288351e-05, "loss": 0.1805, "loss_nan_ranks": 0, "loss_rank_avg": 0.18300187587738037, "step": 4650, "valid_targets_mean": 2600.0, "valid_targets_min": 818 }, { "epoch": 4.550342130987293, "grad_norm": 0.7303419088042947, "learning_rate": 1.3168760365129958e-05, "loss": 0.1746, "loss_nan_ranks": 0, "loss_rank_avg": 0.1488429307937622, "step": 4655, "valid_targets_mean": 2088.1, "valid_targets_min": 957 }, { "epoch": 4.555229716520039, "grad_norm": 0.8187576278617511, "learning_rate": 1.3122960486807551e-05, "loss": 0.1658, "loss_nan_ranks": 0, "loss_rank_avg": 0.1666831523180008, "step": 4660, "valid_targets_mean": 2028.4, "valid_targets_min": 734 }, { "epoch": 4.560117302052786, "grad_norm": 0.7689970727875466, "learning_rate": 1.3077201471461396e-05, "loss": 0.183, "loss_nan_ranks": 0, "loss_rank_avg": 0.19278375804424286, "step": 4665, "valid_targets_mean": 2721.1, "valid_targets_min": 1050 }, { "epoch": 4.565004887585533, "grad_norm": 0.7136026943772088, "learning_rate": 1.3031483590988932e-05, "loss": 0.1832, "loss_nan_ranks": 0, "loss_rank_avg": 0.18920962512493134, "step": 4670, "valid_targets_mean": 3069.2, "valid_targets_min": 703 }, { "epoch": 4.56989247311828, "grad_norm": 0.6768328311866438, "learning_rate": 1.2985807117043212e-05, "loss": 0.1732, "loss_nan_ranks": 0, "loss_rank_avg": 0.170124351978302, "step": 4675, "valid_targets_mean": 3036.4, "valid_targets_min": 750 }, { "epoch": 4.574780058651027, "grad_norm": 0.7065627099385119, "learning_rate": 1.2940172321031228e-05, "loss": 0.1766, "loss_nan_ranks": 0, "loss_rank_avg": 0.17484335601329803, "step": 4680, "valid_targets_mean": 2361.8, "valid_targets_min": 985 }, { "epoch": 4.579667644183774, "grad_norm": 0.7870866877498359, "learning_rate": 1.2894579474112336e-05, "loss": 0.1712, "loss_nan_ranks": 0, "loss_rank_avg": 0.17841269075870514, "step": 4685, "valid_targets_mean": 2178.9, "valid_targets_min": 673 }, { "epoch": 4.58455522971652, "grad_norm": 0.7992856974999708, "learning_rate": 1.2849028847196642e-05, "loss": 0.1832, "loss_nan_ranks": 0, "loss_rank_avg": 0.18455563485622406, "step": 4690, "valid_targets_mean": 2120.1, "valid_targets_min": 522 }, { "epoch": 4.589442815249267, "grad_norm": 0.7236365680919709, "learning_rate": 1.2803520710943345e-05, "loss": 0.1702, "loss_nan_ranks": 0, "loss_rank_avg": 0.1834551990032196, "step": 4695, "valid_targets_mean": 2806.9, "valid_targets_min": 683 }, { "epoch": 4.594330400782014, "grad_norm": 0.7328506697251148, "learning_rate": 1.2758055335759214e-05, "loss": 0.1762, "loss_nan_ranks": 0, "loss_rank_avg": 0.16841992735862732, "step": 4700, "valid_targets_mean": 2405.8, "valid_targets_min": 830 }, { "epoch": 4.599217986314761, "grad_norm": 0.7488482580131285, "learning_rate": 1.27126329917969e-05, "loss": 0.1752, "loss_nan_ranks": 0, "loss_rank_avg": 0.20795467495918274, "step": 4705, "valid_targets_mean": 2736.6, "valid_targets_min": 740 }, { "epoch": 4.604105571847508, "grad_norm": 0.701924815848274, "learning_rate": 1.2667253948953392e-05, "loss": 0.1818, "loss_nan_ranks": 0, "loss_rank_avg": 0.16952826082706451, "step": 4710, "valid_targets_mean": 2894.4, "valid_targets_min": 805 }, { "epoch": 4.6089931573802545, "grad_norm": 0.7638018479267547, "learning_rate": 1.262191847686837e-05, "loss": 0.171, "loss_nan_ranks": 0, "loss_rank_avg": 0.17446717619895935, "step": 4715, "valid_targets_mean": 2210.6, "valid_targets_min": 1220 }, { "epoch": 4.613880742913001, "grad_norm": 0.9146808729960212, "learning_rate": 1.2576626844922602e-05, "loss": 0.1796, "loss_nan_ranks": 0, "loss_rank_avg": 0.19167935848236084, "step": 4720, "valid_targets_mean": 2399.1, "valid_targets_min": 743 }, { "epoch": 4.618768328445748, "grad_norm": 0.7745900925140338, "learning_rate": 1.2531379322236403e-05, "loss": 0.1725, "loss_nan_ranks": 0, "loss_rank_avg": 0.17140185832977295, "step": 4725, "valid_targets_mean": 2393.5, "valid_targets_min": 850 }, { "epoch": 4.623655913978495, "grad_norm": 0.776866808386388, "learning_rate": 1.2486176177667963e-05, "loss": 0.178, "loss_nan_ranks": 0, "loss_rank_avg": 0.1710333526134491, "step": 4730, "valid_targets_mean": 2295.1, "valid_targets_min": 635 }, { "epoch": 4.628543499511242, "grad_norm": 0.9138199933637996, "learning_rate": 1.2441017679811777e-05, "loss": 0.1711, "loss_nan_ranks": 0, "loss_rank_avg": 0.17593233287334442, "step": 4735, "valid_targets_mean": 1879.2, "valid_targets_min": 661 }, { "epoch": 4.633431085043989, "grad_norm": 0.7080266048721636, "learning_rate": 1.2395904096997082e-05, "loss": 0.1688, "loss_nan_ranks": 0, "loss_rank_avg": 0.17759348452091217, "step": 4740, "valid_targets_mean": 2714.9, "valid_targets_min": 715 }, { "epoch": 4.638318670576735, "grad_norm": 0.7107351831118239, "learning_rate": 1.2350835697286185e-05, "loss": 0.1703, "loss_nan_ranks": 0, "loss_rank_avg": 0.1701585203409195, "step": 4745, "valid_targets_mean": 2465.2, "valid_targets_min": 836 }, { "epoch": 4.643206256109482, "grad_norm": 0.7110148275686181, "learning_rate": 1.2305812748472969e-05, "loss": 0.1729, "loss_nan_ranks": 0, "loss_rank_avg": 0.16965368390083313, "step": 4750, "valid_targets_mean": 2887.4, "valid_targets_min": 1056 }, { "epoch": 4.648093841642229, "grad_norm": 0.7808205504531988, "learning_rate": 1.2260835518081216e-05, "loss": 0.179, "loss_nan_ranks": 0, "loss_rank_avg": 0.1801660656929016, "step": 4755, "valid_targets_mean": 2264.4, "valid_targets_min": 537 }, { "epoch": 4.652981427174976, "grad_norm": 0.6736174438322065, "learning_rate": 1.2215904273363055e-05, "loss": 0.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.16034579277038574, "step": 4760, "valid_targets_mean": 2747.2, "valid_targets_min": 878 }, { "epoch": 4.657869012707723, "grad_norm": 0.8172833092442401, "learning_rate": 1.2171019281297397e-05, "loss": 0.1658, "loss_nan_ranks": 0, "loss_rank_avg": 0.18934208154678345, "step": 4765, "valid_targets_mean": 2011.7, "valid_targets_min": 689 }, { "epoch": 4.6627565982404695, "grad_norm": 0.7810540506761577, "learning_rate": 1.2126180808588281e-05, "loss": 0.181, "loss_nan_ranks": 0, "loss_rank_avg": 0.19872036576271057, "step": 4770, "valid_targets_mean": 2411.7, "valid_targets_min": 858 }, { "epoch": 4.667644183773216, "grad_norm": 0.7414123362578164, "learning_rate": 1.2081389121663361e-05, "loss": 0.1841, "loss_nan_ranks": 0, "loss_rank_avg": 0.19137006998062134, "step": 4775, "valid_targets_mean": 2429.5, "valid_targets_min": 996 }, { "epoch": 4.672531769305963, "grad_norm": 0.7992138573951394, "learning_rate": 1.2036644486672287e-05, "loss": 0.1756, "loss_nan_ranks": 0, "loss_rank_avg": 0.18999941647052765, "step": 4780, "valid_targets_mean": 2264.3, "valid_targets_min": 800 }, { "epoch": 4.67741935483871, "grad_norm": 0.7629820940559762, "learning_rate": 1.199194716948512e-05, "loss": 0.1815, "loss_nan_ranks": 0, "loss_rank_avg": 0.18513910472393036, "step": 4785, "valid_targets_mean": 2405.6, "valid_targets_min": 548 }, { "epoch": 4.682306940371457, "grad_norm": 0.712753687411961, "learning_rate": 1.1947297435690772e-05, "loss": 0.1849, "loss_nan_ranks": 0, "loss_rank_avg": 0.18980765342712402, "step": 4790, "valid_targets_mean": 2899.6, "valid_targets_min": 916 }, { "epoch": 4.687194525904204, "grad_norm": 0.7285016261064938, "learning_rate": 1.190269555059542e-05, "loss": 0.1787, "loss_nan_ranks": 0, "loss_rank_avg": 0.17685630917549133, "step": 4795, "valid_targets_mean": 2543.8, "valid_targets_min": 779 }, { "epoch": 4.69208211143695, "grad_norm": 0.7186549073765208, "learning_rate": 1.1858141779220902e-05, "loss": 0.1665, "loss_nan_ranks": 0, "loss_rank_avg": 0.17428386211395264, "step": 4800, "valid_targets_mean": 2633.2, "valid_targets_min": 781 }, { "epoch": 4.696969696969697, "grad_norm": 0.7081619736005064, "learning_rate": 1.1813636386303196e-05, "loss": 0.1697, "loss_nan_ranks": 0, "loss_rank_avg": 0.1797652244567871, "step": 4805, "valid_targets_mean": 2718.8, "valid_targets_min": 776 }, { "epoch": 4.701857282502444, "grad_norm": 0.8451059412061002, "learning_rate": 1.1769179636290801e-05, "loss": 0.171, "loss_nan_ranks": 0, "loss_rank_avg": 0.18409138917922974, "step": 4810, "valid_targets_mean": 2124.2, "valid_targets_min": 847 }, { "epoch": 4.706744868035191, "grad_norm": 0.8202631061205068, "learning_rate": 1.1724771793343192e-05, "loss": 0.17, "loss_nan_ranks": 0, "loss_rank_avg": 0.17531917989253998, "step": 4815, "valid_targets_mean": 2052.2, "valid_targets_min": 700 }, { "epoch": 4.711632453567938, "grad_norm": 0.6836107410471749, "learning_rate": 1.1680413121329243e-05, "loss": 0.1862, "loss_nan_ranks": 0, "loss_rank_avg": 0.17793884873390198, "step": 4820, "valid_targets_mean": 3199.6, "valid_targets_min": 1120 }, { "epoch": 4.7165200391006845, "grad_norm": 0.7484449202460228, "learning_rate": 1.1636103883825636e-05, "loss": 0.1932, "loss_nan_ranks": 0, "loss_rank_avg": 0.1955634206533432, "step": 4825, "valid_targets_mean": 2796.8, "valid_targets_min": 1038 }, { "epoch": 4.721407624633431, "grad_norm": 0.8765114876948064, "learning_rate": 1.1591844344115346e-05, "loss": 0.1737, "loss_nan_ranks": 0, "loss_rank_avg": 0.16911789774894714, "step": 4830, "valid_targets_mean": 1774.6, "valid_targets_min": 637 }, { "epoch": 4.726295210166178, "grad_norm": 0.730247866586368, "learning_rate": 1.1547634765186016e-05, "loss": 0.1701, "loss_nan_ranks": 0, "loss_rank_avg": 0.16497325897216797, "step": 4835, "valid_targets_mean": 2376.2, "valid_targets_min": 818 }, { "epoch": 4.731182795698925, "grad_norm": 0.8018221641880683, "learning_rate": 1.1503475409728448e-05, "loss": 0.1814, "loss_nan_ranks": 0, "loss_rank_avg": 0.17386886477470398, "step": 4840, "valid_targets_mean": 2089.1, "valid_targets_min": 1032 }, { "epoch": 4.736070381231672, "grad_norm": 0.7294276842415255, "learning_rate": 1.1459366540135019e-05, "loss": 0.1667, "loss_nan_ranks": 0, "loss_rank_avg": 0.1633351594209671, "step": 4845, "valid_targets_mean": 2460.2, "valid_targets_min": 870 }, { "epoch": 4.740957966764419, "grad_norm": 0.7012095976697436, "learning_rate": 1.1415308418498104e-05, "loss": 0.1773, "loss_nan_ranks": 0, "loss_rank_avg": 0.1733730584383011, "step": 4850, "valid_targets_mean": 2616.0, "valid_targets_min": 644 }, { "epoch": 4.745845552297165, "grad_norm": 0.6630187702111296, "learning_rate": 1.137130130660855e-05, "loss": 0.1829, "loss_nan_ranks": 0, "loss_rank_avg": 0.16590818762779236, "step": 4855, "valid_targets_mean": 3160.9, "valid_targets_min": 1147 }, { "epoch": 4.750733137829912, "grad_norm": 0.9413915512130215, "learning_rate": 1.1327345465954109e-05, "loss": 0.1788, "loss_nan_ranks": 0, "loss_rank_avg": 0.1672978401184082, "step": 4860, "valid_targets_mean": 1737.2, "valid_targets_min": 744 }, { "epoch": 4.755620723362659, "grad_norm": 0.7740192526311673, "learning_rate": 1.128344115771787e-05, "loss": 0.1653, "loss_nan_ranks": 0, "loss_rank_avg": 0.14710134267807007, "step": 4865, "valid_targets_mean": 2162.9, "valid_targets_min": 612 }, { "epoch": 4.760508308895406, "grad_norm": 0.7042101370968502, "learning_rate": 1.1239588642776736e-05, "loss": 0.178, "loss_nan_ranks": 0, "loss_rank_avg": 0.1820552498102188, "step": 4870, "valid_targets_mean": 2700.5, "valid_targets_min": 856 }, { "epoch": 4.765395894428153, "grad_norm": 0.846516777206178, "learning_rate": 1.1195788181699829e-05, "loss": 0.1713, "loss_nan_ranks": 0, "loss_rank_avg": 0.16076403856277466, "step": 4875, "valid_targets_mean": 1912.6, "valid_targets_min": 607 }, { "epoch": 4.7702834799608995, "grad_norm": 0.8117401631836421, "learning_rate": 1.1152040034747005e-05, "loss": 0.1709, "loss_nan_ranks": 0, "loss_rank_avg": 0.19138172268867493, "step": 4880, "valid_targets_mean": 2053.1, "valid_targets_min": 679 }, { "epoch": 4.775171065493646, "grad_norm": 0.8090125882585804, "learning_rate": 1.1108344461867256e-05, "loss": 0.1765, "loss_nan_ranks": 0, "loss_rank_avg": 0.18099914491176605, "step": 4885, "valid_targets_mean": 2086.2, "valid_targets_min": 875 }, { "epoch": 4.780058651026393, "grad_norm": 0.7869706404872734, "learning_rate": 1.1064701722697171e-05, "loss": 0.1669, "loss_nan_ranks": 0, "loss_rank_avg": 0.17875008285045624, "step": 4890, "valid_targets_mean": 2636.2, "valid_targets_min": 789 }, { "epoch": 4.78494623655914, "grad_norm": 0.8338533349319971, "learning_rate": 1.102111207655943e-05, "loss": 0.1645, "loss_nan_ranks": 0, "loss_rank_avg": 0.1614495813846588, "step": 4895, "valid_targets_mean": 2010.5, "valid_targets_min": 1178 }, { "epoch": 4.789833822091887, "grad_norm": 0.8181674038081255, "learning_rate": 1.0977575782461215e-05, "loss": 0.169, "loss_nan_ranks": 0, "loss_rank_avg": 0.16135358810424805, "step": 4900, "valid_targets_mean": 1836.6, "valid_targets_min": 704 }, { "epoch": 4.794721407624634, "grad_norm": 0.7134765702982729, "learning_rate": 1.0934093099092684e-05, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.18349812924861908, "step": 4905, "valid_targets_mean": 2678.9, "valid_targets_min": 1270 }, { "epoch": 4.79960899315738, "grad_norm": 0.7321067232072485, "learning_rate": 1.0890664284825488e-05, "loss": 0.1789, "loss_nan_ranks": 0, "loss_rank_avg": 0.1972254067659378, "step": 4910, "valid_targets_mean": 2744.4, "valid_targets_min": 991 }, { "epoch": 4.804496578690127, "grad_norm": 0.7586910224470423, "learning_rate": 1.0847289597711144e-05, "loss": 0.1887, "loss_nan_ranks": 0, "loss_rank_avg": 0.1841929405927658, "step": 4915, "valid_targets_mean": 2455.1, "valid_targets_min": 881 }, { "epoch": 4.809384164222874, "grad_norm": 0.7967660614928856, "learning_rate": 1.0803969295479577e-05, "loss": 0.1799, "loss_nan_ranks": 0, "loss_rank_avg": 0.16611838340759277, "step": 4920, "valid_targets_mean": 1992.2, "valid_targets_min": 699 }, { "epoch": 4.814271749755621, "grad_norm": 0.7051736092585311, "learning_rate": 1.076070363553754e-05, "loss": 0.1627, "loss_nan_ranks": 0, "loss_rank_avg": 0.14659056067466736, "step": 4925, "valid_targets_mean": 2598.4, "valid_targets_min": 904 }, { "epoch": 4.819159335288368, "grad_norm": 0.8074487953089629, "learning_rate": 1.071749287496712e-05, "loss": 0.1779, "loss_nan_ranks": 0, "loss_rank_avg": 0.18871314823627472, "step": 4930, "valid_targets_mean": 2446.9, "valid_targets_min": 917 }, { "epoch": 4.8240469208211145, "grad_norm": 0.7358191683646678, "learning_rate": 1.0674337270524195e-05, "loss": 0.1662, "loss_nan_ranks": 0, "loss_rank_avg": 0.15642912685871124, "step": 4935, "valid_targets_mean": 2261.7, "valid_targets_min": 659 }, { "epoch": 4.828934506353861, "grad_norm": 0.7772322735086833, "learning_rate": 1.06312370786369e-05, "loss": 0.1689, "loss_nan_ranks": 0, "loss_rank_avg": 0.16359858214855194, "step": 4940, "valid_targets_mean": 2106.1, "valid_targets_min": 706 }, { "epoch": 4.833822091886608, "grad_norm": 0.7984734484679462, "learning_rate": 1.0588192555404106e-05, "loss": 0.1854, "loss_nan_ranks": 0, "loss_rank_avg": 0.1786036491394043, "step": 4945, "valid_targets_mean": 1923.9, "valid_targets_min": 1242 }, { "epoch": 4.838709677419355, "grad_norm": 0.7509801685683009, "learning_rate": 1.0545203956593922e-05, "loss": 0.1676, "loss_nan_ranks": 0, "loss_rank_avg": 0.16603411734104156, "step": 4950, "valid_targets_mean": 2316.3, "valid_targets_min": 917 }, { "epoch": 4.843597262952102, "grad_norm": 0.6961656843543814, "learning_rate": 1.0502271537642144e-05, "loss": 0.1735, "loss_nan_ranks": 0, "loss_rank_avg": 0.17675796151161194, "step": 4955, "valid_targets_mean": 2698.9, "valid_targets_min": 825 }, { "epoch": 4.848484848484849, "grad_norm": 0.8051523733028211, "learning_rate": 1.0459395553650767e-05, "loss": 0.1716, "loss_nan_ranks": 0, "loss_rank_avg": 0.18461185693740845, "step": 4960, "valid_targets_mean": 1971.4, "valid_targets_min": 727 }, { "epoch": 4.853372434017595, "grad_norm": 0.8334702591345402, "learning_rate": 1.041657625938643e-05, "loss": 0.1942, "loss_nan_ranks": 0, "loss_rank_avg": 0.19902193546295166, "step": 4965, "valid_targets_mean": 2607.7, "valid_targets_min": 1300 }, { "epoch": 4.858260019550342, "grad_norm": 0.7868464417093073, "learning_rate": 1.0373813909278926e-05, "loss": 0.1807, "loss_nan_ranks": 0, "loss_rank_avg": 0.20459884405136108, "step": 4970, "valid_targets_mean": 2319.3, "valid_targets_min": 861 }, { "epoch": 4.863147605083089, "grad_norm": 0.757600709591517, "learning_rate": 1.0331108757419715e-05, "loss": 0.1774, "loss_nan_ranks": 0, "loss_rank_avg": 0.1869640350341797, "step": 4975, "valid_targets_mean": 2491.2, "valid_targets_min": 567 }, { "epoch": 4.868035190615836, "grad_norm": 0.7221664526957879, "learning_rate": 1.0288461057560361e-05, "loss": 0.1843, "loss_nan_ranks": 0, "loss_rank_avg": 0.17515313625335693, "step": 4980, "valid_targets_mean": 2669.4, "valid_targets_min": 1520 }, { "epoch": 4.872922776148583, "grad_norm": 0.7579422903647014, "learning_rate": 1.0245871063111077e-05, "loss": 0.1755, "loss_nan_ranks": 0, "loss_rank_avg": 0.1622183918952942, "step": 4985, "valid_targets_mean": 2357.6, "valid_targets_min": 912 }, { "epoch": 4.8778103616813295, "grad_norm": 0.8067790989051661, "learning_rate": 1.0203339027139167e-05, "loss": 0.185, "loss_nan_ranks": 0, "loss_rank_avg": 0.16633889079093933, "step": 4990, "valid_targets_mean": 1989.5, "valid_targets_min": 632 }, { "epoch": 4.882697947214076, "grad_norm": 0.7758521837897394, "learning_rate": 1.0160865202367556e-05, "loss": 0.1769, "loss_nan_ranks": 0, "loss_rank_avg": 0.1709386706352234, "step": 4995, "valid_targets_mean": 2203.2, "valid_targets_min": 829 }, { "epoch": 4.887585532746823, "grad_norm": 0.8248140895342541, "learning_rate": 1.0118449841173294e-05, "loss": 0.1699, "loss_nan_ranks": 0, "loss_rank_avg": 0.18402284383773804, "step": 5000, "valid_targets_mean": 2114.4, "valid_targets_min": 720 }, { "epoch": 4.89247311827957, "grad_norm": 0.6897458976588339, "learning_rate": 1.0076093195586043e-05, "loss": 0.1735, "loss_nan_ranks": 0, "loss_rank_avg": 0.16674119234085083, "step": 5005, "valid_targets_mean": 2625.1, "valid_targets_min": 708 }, { "epoch": 4.897360703812317, "grad_norm": 0.6687153559969188, "learning_rate": 1.0033795517286558e-05, "loss": 0.1746, "loss_nan_ranks": 0, "loss_rank_avg": 0.17733493447303772, "step": 5010, "valid_targets_mean": 2868.8, "valid_targets_min": 922 }, { "epoch": 4.902248289345064, "grad_norm": 0.8576695321729364, "learning_rate": 9.991557057605244e-06, "loss": 0.1859, "loss_nan_ranks": 0, "loss_rank_avg": 0.18968823552131653, "step": 5015, "valid_targets_mean": 1945.0, "valid_targets_min": 704 }, { "epoch": 4.9071358748778104, "grad_norm": 0.639640416335708, "learning_rate": 9.949378067520601e-06, "loss": 0.1762, "loss_nan_ranks": 0, "loss_rank_avg": 0.14256887137889862, "step": 5020, "valid_targets_mean": 2694.2, "valid_targets_min": 656 }, { "epoch": 4.912023460410557, "grad_norm": 0.6732914788931557, "learning_rate": 9.90725879765779e-06, "loss": 0.1771, "loss_nan_ranks": 0, "loss_rank_avg": 0.1720367670059204, "step": 5025, "valid_targets_mean": 3006.6, "valid_targets_min": 1307 }, { "epoch": 4.916911045943304, "grad_norm": 0.7100316647560853, "learning_rate": 9.865199498287118e-06, "loss": 0.1862, "loss_nan_ranks": 0, "loss_rank_avg": 0.16838201880455017, "step": 5030, "valid_targets_mean": 2566.2, "valid_targets_min": 826 }, { "epoch": 4.921798631476051, "grad_norm": 0.7460391948002998, "learning_rate": 9.823200419322523e-06, "loss": 0.1683, "loss_nan_ranks": 0, "loss_rank_avg": 0.16970403492450714, "step": 5035, "valid_targets_mean": 2189.6, "valid_targets_min": 737 }, { "epoch": 4.926686217008798, "grad_norm": 0.7470863844930459, "learning_rate": 9.781261810320151e-06, "loss": 0.1658, "loss_nan_ranks": 0, "loss_rank_avg": 0.17340749502182007, "step": 5040, "valid_targets_mean": 2428.0, "valid_targets_min": 647 }, { "epoch": 4.9315738025415445, "grad_norm": 0.7125845379627102, "learning_rate": 9.739383920476806e-06, "loss": 0.1699, "loss_nan_ranks": 0, "loss_rank_avg": 0.16167551279067993, "step": 5045, "valid_targets_mean": 2554.8, "valid_targets_min": 544 }, { "epoch": 4.936461388074291, "grad_norm": 0.7572669890789546, "learning_rate": 9.69756699862853e-06, "loss": 0.18, "loss_nan_ranks": 0, "loss_rank_avg": 0.22088664770126343, "step": 5050, "valid_targets_mean": 2523.8, "valid_targets_min": 944 }, { "epoch": 4.941348973607038, "grad_norm": 0.7472631938735368, "learning_rate": 9.65581129324909e-06, "loss": 0.176, "loss_nan_ranks": 0, "loss_rank_avg": 0.17298045754432678, "step": 5055, "valid_targets_mean": 2148.9, "valid_targets_min": 591 }, { "epoch": 4.946236559139785, "grad_norm": 0.7406653369418025, "learning_rate": 9.614117052448488e-06, "loss": 0.1645, "loss_nan_ranks": 0, "loss_rank_avg": 0.12865734100341797, "step": 5060, "valid_targets_mean": 2030.6, "valid_targets_min": 842 }, { "epoch": 4.951124144672532, "grad_norm": 0.7621843768822362, "learning_rate": 9.572484523971544e-06, "loss": 0.1709, "loss_nan_ranks": 0, "loss_rank_avg": 0.17717863619327545, "step": 5065, "valid_targets_mean": 2430.3, "valid_targets_min": 704 }, { "epoch": 4.956011730205279, "grad_norm": 0.7498657834356395, "learning_rate": 9.530913955196344e-06, "loss": 0.1754, "loss_nan_ranks": 0, "loss_rank_avg": 0.18062527477741241, "step": 5070, "valid_targets_mean": 2419.0, "valid_targets_min": 824 }, { "epoch": 4.9608993157380255, "grad_norm": 0.8141850556767372, "learning_rate": 9.489405593132846e-06, "loss": 0.1794, "loss_nan_ranks": 0, "loss_rank_avg": 0.15304099023342133, "step": 5075, "valid_targets_mean": 2178.5, "valid_targets_min": 780 }, { "epoch": 4.965786901270772, "grad_norm": 0.6380568455457596, "learning_rate": 9.447959684421374e-06, "loss": 0.1594, "loss_nan_ranks": 0, "loss_rank_avg": 0.16023944318294525, "step": 5080, "valid_targets_mean": 3038.6, "valid_targets_min": 1137 }, { "epoch": 4.970674486803519, "grad_norm": 0.7983753521526253, "learning_rate": 9.40657647533114e-06, "loss": 0.1881, "loss_nan_ranks": 0, "loss_rank_avg": 0.18773408234119415, "step": 5085, "valid_targets_mean": 2392.6, "valid_targets_min": 753 }, { "epoch": 4.975562072336266, "grad_norm": 0.7019559841529516, "learning_rate": 9.365256211758819e-06, "loss": 0.1703, "loss_nan_ranks": 0, "loss_rank_avg": 0.18119125068187714, "step": 5090, "valid_targets_mean": 2740.1, "valid_targets_min": 797 }, { "epoch": 4.980449657869013, "grad_norm": 0.8008073853070248, "learning_rate": 9.323999139227051e-06, "loss": 0.1809, "loss_nan_ranks": 0, "loss_rank_avg": 0.18562883138656616, "step": 5095, "valid_targets_mean": 2072.8, "valid_targets_min": 764 }, { "epoch": 4.9853372434017595, "grad_norm": 0.7313841730070882, "learning_rate": 9.282805502883007e-06, "loss": 0.1794, "loss_nan_ranks": 0, "loss_rank_avg": 0.1831430047750473, "step": 5100, "valid_targets_mean": 2517.4, "valid_targets_min": 754 }, { "epoch": 4.990224828934506, "grad_norm": 0.8078162384967679, "learning_rate": 9.241675547496938e-06, "loss": 0.1774, "loss_nan_ranks": 0, "loss_rank_avg": 0.17006579041481018, "step": 5105, "valid_targets_mean": 2003.2, "valid_targets_min": 714 }, { "epoch": 4.995112414467253, "grad_norm": 0.8091777933799764, "learning_rate": 9.200609517460675e-06, "loss": 0.1755, "loss_nan_ranks": 0, "loss_rank_avg": 0.18514806032180786, "step": 5110, "valid_targets_mean": 2168.2, "valid_targets_min": 680 }, { "epoch": 5.0, "grad_norm": 0.7870915330741979, "learning_rate": 9.159607656786222e-06, "loss": 0.1687, "loss_nan_ranks": 0, "loss_rank_avg": 0.16797024011611938, "step": 5115, "valid_targets_mean": 2128.8, "valid_targets_min": 887 }, { "epoch": 5.004887585532747, "grad_norm": 0.7747894970742039, "learning_rate": 9.1186702091043e-06, "loss": 0.1554, "loss_nan_ranks": 0, "loss_rank_avg": 0.16766156256198883, "step": 5120, "valid_targets_mean": 2120.5, "valid_targets_min": 675 }, { "epoch": 5.009775171065494, "grad_norm": 0.6475219132787013, "learning_rate": 9.077797417662888e-06, "loss": 0.1449, "loss_nan_ranks": 0, "loss_rank_avg": 0.16814623773097992, "step": 5125, "valid_targets_mean": 3438.9, "valid_targets_min": 621 }, { "epoch": 5.0146627565982405, "grad_norm": 0.6877209083156904, "learning_rate": 9.036989525325788e-06, "loss": 0.1553, "loss_nan_ranks": 0, "loss_rank_avg": 0.151102676987648, "step": 5130, "valid_targets_mean": 3217.8, "valid_targets_min": 768 }, { "epoch": 5.019550342130987, "grad_norm": 0.7324938421863219, "learning_rate": 8.996246774571159e-06, "loss": 0.1452, "loss_nan_ranks": 0, "loss_rank_avg": 0.12554004788398743, "step": 5135, "valid_targets_mean": 2168.3, "valid_targets_min": 1037 }, { "epoch": 5.024437927663734, "grad_norm": 0.7753610298141373, "learning_rate": 8.95556940749009e-06, "loss": 0.1553, "loss_nan_ranks": 0, "loss_rank_avg": 0.14286714792251587, "step": 5140, "valid_targets_mean": 2078.7, "valid_targets_min": 668 }, { "epoch": 5.029325513196481, "grad_norm": 0.7395423291733766, "learning_rate": 8.914957665785184e-06, "loss": 0.1575, "loss_nan_ranks": 0, "loss_rank_avg": 0.16619789600372314, "step": 5145, "valid_targets_mean": 2746.6, "valid_targets_min": 986 }, { "epoch": 5.034213098729228, "grad_norm": 0.6439026975349222, "learning_rate": 8.874411790769093e-06, "loss": 0.1516, "loss_nan_ranks": 0, "loss_rank_avg": 0.12593859434127808, "step": 5150, "valid_targets_mean": 2663.3, "valid_targets_min": 1334 }, { "epoch": 5.0391006842619745, "grad_norm": 0.7324203667912003, "learning_rate": 8.833932023363096e-06, "loss": 0.145, "loss_nan_ranks": 0, "loss_rank_avg": 0.16145989298820496, "step": 5155, "valid_targets_mean": 2840.1, "valid_targets_min": 1147 }, { "epoch": 5.043988269794721, "grad_norm": 1.2076159147090062, "learning_rate": 8.793518604095659e-06, "loss": 0.1641, "loss_nan_ranks": 0, "loss_rank_avg": 0.16184774041175842, "step": 5160, "valid_targets_mean": 2118.9, "valid_targets_min": 985 }, { "epoch": 5.048875855327468, "grad_norm": 0.8370647289954567, "learning_rate": 8.753171773101e-06, "loss": 0.1527, "loss_nan_ranks": 0, "loss_rank_avg": 0.15503370761871338, "step": 5165, "valid_targets_mean": 2071.8, "valid_targets_min": 741 }, { "epoch": 5.053763440860215, "grad_norm": 1.3707229780441046, "learning_rate": 8.712891770117693e-06, "loss": 0.1583, "loss_nan_ranks": 0, "loss_rank_avg": 0.1608889102935791, "step": 5170, "valid_targets_mean": 2661.7, "valid_targets_min": 807 }, { "epoch": 5.058651026392962, "grad_norm": 0.8818514323414521, "learning_rate": 8.672678834487228e-06, "loss": 0.1424, "loss_nan_ranks": 0, "loss_rank_avg": 0.1271866112947464, "step": 5175, "valid_targets_mean": 1782.8, "valid_targets_min": 933 }, { "epoch": 5.063538611925709, "grad_norm": 0.7996369140231598, "learning_rate": 8.632533205152553e-06, "loss": 0.1491, "loss_nan_ranks": 0, "loss_rank_avg": 0.14621879160404205, "step": 5180, "valid_targets_mean": 2618.7, "valid_targets_min": 771 }, { "epoch": 5.0684261974584555, "grad_norm": 0.7632406562623092, "learning_rate": 8.592455120656726e-06, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.15845827758312225, "step": 5185, "valid_targets_mean": 2956.1, "valid_targets_min": 636 }, { "epoch": 5.073313782991202, "grad_norm": 0.8154709547280357, "learning_rate": 8.552444819141413e-06, "loss": 0.1533, "loss_nan_ranks": 0, "loss_rank_avg": 0.15961962938308716, "step": 5190, "valid_targets_mean": 2535.6, "valid_targets_min": 727 }, { "epoch": 5.078201368523949, "grad_norm": 0.7508882761061626, "learning_rate": 8.512502538345568e-06, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.13347077369689941, "step": 5195, "valid_targets_mean": 2393.2, "valid_targets_min": 625 }, { "epoch": 5.083088954056696, "grad_norm": 0.7503877902892744, "learning_rate": 8.472628515603936e-06, "loss": 0.1626, "loss_nan_ranks": 0, "loss_rank_avg": 0.1839996576309204, "step": 5200, "valid_targets_mean": 3139.9, "valid_targets_min": 1167 }, { "epoch": 5.087976539589443, "grad_norm": 0.814409890229622, "learning_rate": 8.43282298784567e-06, "loss": 0.1506, "loss_nan_ranks": 0, "loss_rank_avg": 0.16277194023132324, "step": 5205, "valid_targets_mean": 2501.2, "valid_targets_min": 949 }, { "epoch": 5.0928641251221896, "grad_norm": 0.7086407404966241, "learning_rate": 8.393086191592963e-06, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.15189936757087708, "step": 5210, "valid_targets_mean": 3098.6, "valid_targets_min": 1159 }, { "epoch": 5.097751710654936, "grad_norm": 0.8089395622560438, "learning_rate": 8.353418362959564e-06, "loss": 0.1541, "loss_nan_ranks": 0, "loss_rank_avg": 0.1489260196685791, "step": 5215, "valid_targets_mean": 2491.1, "valid_targets_min": 644 }, { "epoch": 5.102639296187683, "grad_norm": 0.8056121720254122, "learning_rate": 8.313819737649483e-06, "loss": 0.1679, "loss_nan_ranks": 0, "loss_rank_avg": 0.15654730796813965, "step": 5220, "valid_targets_mean": 2591.2, "valid_targets_min": 801 }, { "epoch": 5.10752688172043, "grad_norm": 0.8044880648557395, "learning_rate": 8.274290550955468e-06, "loss": 0.1521, "loss_nan_ranks": 0, "loss_rank_avg": 0.13206225633621216, "step": 5225, "valid_targets_mean": 2005.5, "valid_targets_min": 1094 }, { "epoch": 5.112414467253177, "grad_norm": 0.7613818292118435, "learning_rate": 8.234831037757687e-06, "loss": 0.1502, "loss_nan_ranks": 0, "loss_rank_avg": 0.17657440900802612, "step": 5230, "valid_targets_mean": 2638.0, "valid_targets_min": 765 }, { "epoch": 5.117302052785924, "grad_norm": 0.6877071433658863, "learning_rate": 8.195441432522324e-06, "loss": 0.1448, "loss_nan_ranks": 0, "loss_rank_avg": 0.1490596979856491, "step": 5235, "valid_targets_mean": 3027.0, "valid_targets_min": 874 }, { "epoch": 5.1221896383186705, "grad_norm": 0.7403615217739022, "learning_rate": 8.156121969300168e-06, "loss": 0.1435, "loss_nan_ranks": 0, "loss_rank_avg": 0.1425008326768875, "step": 5240, "valid_targets_mean": 2339.8, "valid_targets_min": 659 }, { "epoch": 5.127077223851417, "grad_norm": 0.7526140740334464, "learning_rate": 8.116872881725213e-06, "loss": 0.1611, "loss_nan_ranks": 0, "loss_rank_avg": 0.1776733696460724, "step": 5245, "valid_targets_mean": 3384.4, "valid_targets_min": 1031 }, { "epoch": 5.131964809384164, "grad_norm": 0.7793267157176477, "learning_rate": 8.077694403013312e-06, "loss": 0.147, "loss_nan_ranks": 0, "loss_rank_avg": 0.1542745679616928, "step": 5250, "valid_targets_mean": 2364.7, "valid_targets_min": 712 }, { "epoch": 5.136852394916911, "grad_norm": 0.7971711756751064, "learning_rate": 8.038586765960735e-06, "loss": 0.1555, "loss_nan_ranks": 0, "loss_rank_avg": 0.1412791758775711, "step": 5255, "valid_targets_mean": 1963.4, "valid_targets_min": 641 }, { "epoch": 5.141739980449658, "grad_norm": 0.7033271354224208, "learning_rate": 7.999550202942833e-06, "loss": 0.1653, "loss_nan_ranks": 0, "loss_rank_avg": 0.16525672376155853, "step": 5260, "valid_targets_mean": 3219.7, "valid_targets_min": 809 }, { "epoch": 5.146627565982405, "grad_norm": 0.7247341620856336, "learning_rate": 7.960584945912649e-06, "loss": 0.1611, "loss_nan_ranks": 0, "loss_rank_avg": 0.16547167301177979, "step": 5265, "valid_targets_mean": 2777.9, "valid_targets_min": 744 }, { "epoch": 5.151515151515151, "grad_norm": 0.8520459168069531, "learning_rate": 7.921691226399492e-06, "loss": 0.1575, "loss_nan_ranks": 0, "loss_rank_avg": 0.15888334810733795, "step": 5270, "valid_targets_mean": 2529.7, "valid_targets_min": 816 }, { "epoch": 5.156402737047898, "grad_norm": 0.7059577585280569, "learning_rate": 7.882869275507648e-06, "loss": 0.1632, "loss_nan_ranks": 0, "loss_rank_avg": 0.13361497223377228, "step": 5275, "valid_targets_mean": 2845.0, "valid_targets_min": 704 }, { "epoch": 5.161290322580645, "grad_norm": 0.6859160374477156, "learning_rate": 7.844119323914918e-06, "loss": 0.1521, "loss_nan_ranks": 0, "loss_rank_avg": 0.14880457520484924, "step": 5280, "valid_targets_mean": 3074.0, "valid_targets_min": 764 }, { "epoch": 5.166177908113392, "grad_norm": 0.6951765797767238, "learning_rate": 7.805441601871292e-06, "loss": 0.1516, "loss_nan_ranks": 0, "loss_rank_avg": 0.1490635871887207, "step": 5285, "valid_targets_mean": 3103.2, "valid_targets_min": 1018 }, { "epoch": 5.171065493646139, "grad_norm": 0.7792674902926341, "learning_rate": 7.766836339197617e-06, "loss": 0.155, "loss_nan_ranks": 0, "loss_rank_avg": 0.1745825558900833, "step": 5290, "valid_targets_mean": 2414.8, "valid_targets_min": 972 }, { "epoch": 5.1759530791788855, "grad_norm": 0.7243392727575753, "learning_rate": 7.728303765284136e-06, "loss": 0.1587, "loss_nan_ranks": 0, "loss_rank_avg": 0.1535375863313675, "step": 5295, "valid_targets_mean": 2897.2, "valid_targets_min": 932 }, { "epoch": 5.180840664711632, "grad_norm": 0.7297677901128055, "learning_rate": 7.689844109089217e-06, "loss": 0.1495, "loss_nan_ranks": 0, "loss_rank_avg": 0.14912715554237366, "step": 5300, "valid_targets_mean": 2656.3, "valid_targets_min": 1004 }, { "epoch": 5.185728250244379, "grad_norm": 0.7467264254993835, "learning_rate": 7.651457599137929e-06, "loss": 0.1498, "loss_nan_ranks": 0, "loss_rank_avg": 0.14847451448440552, "step": 5305, "valid_targets_mean": 2904.3, "valid_targets_min": 638 }, { "epoch": 5.190615835777126, "grad_norm": 0.8720410023528405, "learning_rate": 7.613144463520732e-06, "loss": 0.1555, "loss_nan_ranks": 0, "loss_rank_avg": 0.1656719148159027, "step": 5310, "valid_targets_mean": 2167.3, "valid_targets_min": 734 }, { "epoch": 5.195503421309873, "grad_norm": 0.7908689871901836, "learning_rate": 7.574904929892093e-06, "loss": 0.1513, "loss_nan_ranks": 0, "loss_rank_avg": 0.16172878444194794, "step": 5315, "valid_targets_mean": 2394.0, "valid_targets_min": 898 }, { "epoch": 5.20039100684262, "grad_norm": 0.755139638023909, "learning_rate": 7.53673922546913e-06, "loss": 0.1367, "loss_nan_ranks": 0, "loss_rank_avg": 0.14658725261688232, "step": 5320, "valid_targets_mean": 2478.6, "valid_targets_min": 810 }, { "epoch": 5.205278592375366, "grad_norm": 0.8778718952166356, "learning_rate": 7.498647577030291e-06, "loss": 0.161, "loss_nan_ranks": 0, "loss_rank_avg": 0.14963701367378235, "step": 5325, "valid_targets_mean": 2121.1, "valid_targets_min": 635 }, { "epoch": 5.210166177908113, "grad_norm": 0.8376481931091295, "learning_rate": 7.460630210913964e-06, "loss": 0.1529, "loss_nan_ranks": 0, "loss_rank_avg": 0.14989005029201508, "step": 5330, "valid_targets_mean": 1952.4, "valid_targets_min": 648 }, { "epoch": 5.21505376344086, "grad_norm": 0.8652589359238804, "learning_rate": 7.422687353017173e-06, "loss": 0.1486, "loss_nan_ranks": 0, "loss_rank_avg": 0.15695667266845703, "step": 5335, "valid_targets_mean": 1941.1, "valid_targets_min": 795 }, { "epoch": 5.219941348973607, "grad_norm": 0.8041415349342634, "learning_rate": 7.384819228794222e-06, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.1654549539089203, "step": 5340, "valid_targets_mean": 2202.2, "valid_targets_min": 1217 }, { "epoch": 5.224828934506354, "grad_norm": 0.7245646950191174, "learning_rate": 7.347026063255338e-06, "loss": 0.147, "loss_nan_ranks": 0, "loss_rank_avg": 0.14550118148326874, "step": 5345, "valid_targets_mean": 2840.0, "valid_targets_min": 1225 }, { "epoch": 5.2297165200391005, "grad_norm": 0.761083682415506, "learning_rate": 7.309308080965345e-06, "loss": 0.1589, "loss_nan_ranks": 0, "loss_rank_avg": 0.15238893032073975, "step": 5350, "valid_targets_mean": 2448.1, "valid_targets_min": 953 }, { "epoch": 5.234604105571847, "grad_norm": 0.8141359878753163, "learning_rate": 7.271665506042349e-06, "loss": 0.1536, "loss_nan_ranks": 0, "loss_rank_avg": 0.1655212789773941, "step": 5355, "valid_targets_mean": 2414.3, "valid_targets_min": 750 }, { "epoch": 5.239491691104594, "grad_norm": 0.7925319949059126, "learning_rate": 7.234098562156382e-06, "loss": 0.1478, "loss_nan_ranks": 0, "loss_rank_avg": 0.14529694616794586, "step": 5360, "valid_targets_mean": 2259.9, "valid_targets_min": 796 }, { "epoch": 5.244379276637341, "grad_norm": 0.8281189537598208, "learning_rate": 7.196607472528083e-06, "loss": 0.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.15511846542358398, "step": 5365, "valid_targets_mean": 2057.9, "valid_targets_min": 696 }, { "epoch": 5.249266862170088, "grad_norm": 0.9202487657550533, "learning_rate": 7.1591924599273646e-06, "loss": 0.1623, "loss_nan_ranks": 0, "loss_rank_avg": 0.16870905458927155, "step": 5370, "valid_targets_mean": 2043.6, "valid_targets_min": 806 }, { "epoch": 5.254154447702835, "grad_norm": 0.7490177593952363, "learning_rate": 7.121853746672087e-06, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.1420806646347046, "step": 5375, "valid_targets_mean": 2500.4, "valid_targets_min": 1353 }, { "epoch": 5.259042033235581, "grad_norm": 0.7953194730901839, "learning_rate": 7.084591554626761e-06, "loss": 0.1596, "loss_nan_ranks": 0, "loss_rank_avg": 0.15275171399116516, "step": 5380, "valid_targets_mean": 2575.5, "valid_targets_min": 920 }, { "epoch": 5.263929618768328, "grad_norm": 0.8052676980006547, "learning_rate": 7.047406105201202e-06, "loss": 0.1584, "loss_nan_ranks": 0, "loss_rank_avg": 0.14699678122997284, "step": 5385, "valid_targets_mean": 2143.2, "valid_targets_min": 514 }, { "epoch": 5.268817204301075, "grad_norm": 0.8178962169352656, "learning_rate": 7.010297619349238e-06, "loss": 0.1477, "loss_nan_ranks": 0, "loss_rank_avg": 0.14148107171058655, "step": 5390, "valid_targets_mean": 1963.5, "valid_targets_min": 642 }, { "epoch": 5.273704789833822, "grad_norm": 0.7553088050684637, "learning_rate": 6.973266317567364e-06, "loss": 0.1657, "loss_nan_ranks": 0, "loss_rank_avg": 0.1751079261302948, "step": 5395, "valid_targets_mean": 2179.1, "valid_targets_min": 829 }, { "epoch": 5.278592375366569, "grad_norm": 0.7418479058847184, "learning_rate": 6.936312419893458e-06, "loss": 0.1552, "loss_nan_ranks": 0, "loss_rank_avg": 0.1365339756011963, "step": 5400, "valid_targets_mean": 2537.8, "valid_targets_min": 923 }, { "epoch": 5.2834799608993155, "grad_norm": 0.8557491666172627, "learning_rate": 6.899436145905474e-06, "loss": 0.16, "loss_nan_ranks": 0, "loss_rank_avg": 0.15646493434906006, "step": 5405, "valid_targets_mean": 2075.5, "valid_targets_min": 648 }, { "epoch": 5.288367546432062, "grad_norm": 0.8021756331273079, "learning_rate": 6.862637714720138e-06, "loss": 0.1409, "loss_nan_ranks": 0, "loss_rank_avg": 0.1329081803560257, "step": 5410, "valid_targets_mean": 1917.8, "valid_targets_min": 682 }, { "epoch": 5.293255131964809, "grad_norm": 0.7229260402895247, "learning_rate": 6.825917344991611e-06, "loss": 0.1584, "loss_nan_ranks": 0, "loss_rank_avg": 0.15381160378456116, "step": 5415, "valid_targets_mean": 2806.7, "valid_targets_min": 994 }, { "epoch": 5.298142717497556, "grad_norm": 0.8535602266976685, "learning_rate": 6.789275254910246e-06, "loss": 0.1464, "loss_nan_ranks": 0, "loss_rank_avg": 0.13848789036273956, "step": 5420, "valid_targets_mean": 1859.3, "valid_targets_min": 713 }, { "epoch": 5.303030303030303, "grad_norm": 0.8074188447585233, "learning_rate": 6.752711662201241e-06, "loss": 0.1486, "loss_nan_ranks": 0, "loss_rank_avg": 0.15609613060951233, "step": 5425, "valid_targets_mean": 2341.6, "valid_targets_min": 806 }, { "epoch": 5.30791788856305, "grad_norm": 0.877202839044622, "learning_rate": 6.716226784123383e-06, "loss": 0.1538, "loss_nan_ranks": 0, "loss_rank_avg": 0.16460809111595154, "step": 5430, "valid_targets_mean": 2276.0, "valid_targets_min": 662 }, { "epoch": 5.312805474095796, "grad_norm": 0.7588859531837344, "learning_rate": 6.6798208374677384e-06, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.16514082252979279, "step": 5435, "valid_targets_mean": 2550.6, "valid_targets_min": 761 }, { "epoch": 5.317693059628543, "grad_norm": 0.7981982898217473, "learning_rate": 6.643494038556355e-06, "loss": 0.1547, "loss_nan_ranks": 0, "loss_rank_avg": 0.17266137897968292, "step": 5440, "valid_targets_mean": 2877.4, "valid_targets_min": 1372 }, { "epoch": 5.32258064516129, "grad_norm": 0.7362910731569113, "learning_rate": 6.607246603241009e-06, "loss": 0.1509, "loss_nan_ranks": 0, "loss_rank_avg": 0.15483227372169495, "step": 5445, "valid_targets_mean": 2524.4, "valid_targets_min": 884 }, { "epoch": 5.327468230694037, "grad_norm": 0.7656377794863742, "learning_rate": 6.571078746901878e-06, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.14594011008739471, "step": 5450, "valid_targets_mean": 2367.2, "valid_targets_min": 768 }, { "epoch": 5.332355816226784, "grad_norm": 0.6850050225914522, "learning_rate": 6.53499068444631e-06, "loss": 0.1662, "loss_nan_ranks": 0, "loss_rank_avg": 0.1416652500629425, "step": 5455, "valid_targets_mean": 2953.6, "valid_targets_min": 704 }, { "epoch": 5.3372434017595305, "grad_norm": 0.7391512591400116, "learning_rate": 6.498982630307518e-06, "loss": 0.1539, "loss_nan_ranks": 0, "loss_rank_avg": 0.1710202693939209, "step": 5460, "valid_targets_mean": 2936.5, "valid_targets_min": 863 }, { "epoch": 5.342130987292277, "grad_norm": 0.7660416451265245, "learning_rate": 6.463054798443287e-06, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.16152888536453247, "step": 5465, "valid_targets_mean": 2735.8, "valid_targets_min": 1110 }, { "epoch": 5.347018572825024, "grad_norm": 0.8252295444761306, "learning_rate": 6.4272074023347606e-06, "loss": 0.1535, "loss_nan_ranks": 0, "loss_rank_avg": 0.15773028135299683, "step": 5470, "valid_targets_mean": 2095.6, "valid_targets_min": 893 }, { "epoch": 5.351906158357771, "grad_norm": 0.9055114549440841, "learning_rate": 6.391440654985106e-06, "loss": 0.1536, "loss_nan_ranks": 0, "loss_rank_avg": 0.17055881023406982, "step": 5475, "valid_targets_mean": 1950.2, "valid_targets_min": 684 }, { "epoch": 5.356793743890518, "grad_norm": 0.6588127218396698, "learning_rate": 6.355754768918301e-06, "loss": 0.1511, "loss_nan_ranks": 0, "loss_rank_avg": 0.13662315905094147, "step": 5480, "valid_targets_mean": 3307.9, "valid_targets_min": 747 }, { "epoch": 5.361681329423265, "grad_norm": 0.7472617276476732, "learning_rate": 6.32014995617785e-06, "loss": 0.1561, "loss_nan_ranks": 0, "loss_rank_avg": 0.15279489755630493, "step": 5485, "valid_targets_mean": 2531.1, "valid_targets_min": 645 }, { "epoch": 5.366568914956011, "grad_norm": 0.7945430057967098, "learning_rate": 6.284626428325504e-06, "loss": 0.1472, "loss_nan_ranks": 0, "loss_rank_avg": 0.13775640726089478, "step": 5490, "valid_targets_mean": 2237.1, "valid_targets_min": 793 }, { "epoch": 5.371456500488758, "grad_norm": 1.1165361040355197, "learning_rate": 6.249184396440053e-06, "loss": 0.1582, "loss_nan_ranks": 0, "loss_rank_avg": 0.15144461393356323, "step": 5495, "valid_targets_mean": 2468.8, "valid_targets_min": 615 }, { "epoch": 5.376344086021505, "grad_norm": 0.7782637843895414, "learning_rate": 6.2138240711160125e-06, "loss": 0.1661, "loss_nan_ranks": 0, "loss_rank_avg": 0.1696222573518753, "step": 5500, "valid_targets_mean": 2696.6, "valid_targets_min": 699 }, { "epoch": 5.381231671554252, "grad_norm": 0.7825515135644441, "learning_rate": 6.178545662462425e-06, "loss": 0.1579, "loss_nan_ranks": 0, "loss_rank_avg": 0.16258756816387177, "step": 5505, "valid_targets_mean": 2587.4, "valid_targets_min": 754 }, { "epoch": 5.386119257086999, "grad_norm": 0.8421569052905954, "learning_rate": 6.1433493801015865e-06, "loss": 0.1434, "loss_nan_ranks": 0, "loss_rank_avg": 0.13311320543289185, "step": 5510, "valid_targets_mean": 1930.4, "valid_targets_min": 617 }, { "epoch": 5.3910068426197455, "grad_norm": 0.8261937566397005, "learning_rate": 6.108235433167791e-06, "loss": 0.1553, "loss_nan_ranks": 0, "loss_rank_avg": 0.16040858626365662, "step": 5515, "valid_targets_mean": 2021.9, "valid_targets_min": 684 }, { "epoch": 5.395894428152492, "grad_norm": 0.7936724009453671, "learning_rate": 6.073204030306101e-06, "loss": 0.1465, "loss_nan_ranks": 0, "loss_rank_avg": 0.14740975201129913, "step": 5520, "valid_targets_mean": 2411.1, "valid_targets_min": 636 }, { "epoch": 5.400782013685239, "grad_norm": 0.8088963586124284, "learning_rate": 6.038255379671121e-06, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.15532401204109192, "step": 5525, "valid_targets_mean": 2203.5, "valid_targets_min": 678 }, { "epoch": 5.405669599217986, "grad_norm": 0.8249172911213923, "learning_rate": 6.003389688925736e-06, "loss": 0.1515, "loss_nan_ranks": 0, "loss_rank_avg": 0.13733899593353271, "step": 5530, "valid_targets_mean": 2478.9, "valid_targets_min": 738 }, { "epoch": 5.410557184750733, "grad_norm": 0.6793605880624324, "learning_rate": 5.968607165239897e-06, "loss": 0.1466, "loss_nan_ranks": 0, "loss_rank_avg": 0.14237245917320251, "step": 5535, "valid_targets_mean": 3130.7, "valid_targets_min": 1230 }, { "epoch": 5.41544477028348, "grad_norm": 0.9530584429559311, "learning_rate": 5.933908015289367e-06, "loss": 0.1615, "loss_nan_ranks": 0, "loss_rank_avg": 0.17519810795783997, "step": 5540, "valid_targets_mean": 1629.4, "valid_targets_min": 512 }, { "epoch": 5.420332355816226, "grad_norm": 0.7526914536401272, "learning_rate": 5.89929244525451e-06, "loss": 0.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.16908365488052368, "step": 5545, "valid_targets_mean": 2734.1, "valid_targets_min": 1191 }, { "epoch": 5.425219941348973, "grad_norm": 0.7626748112290224, "learning_rate": 5.864760660819073e-06, "loss": 0.1554, "loss_nan_ranks": 0, "loss_rank_avg": 0.16685664653778076, "step": 5550, "valid_targets_mean": 2915.1, "valid_targets_min": 1098 }, { "epoch": 5.43010752688172, "grad_norm": 0.8034530660024547, "learning_rate": 5.830312867168948e-06, "loss": 0.1482, "loss_nan_ranks": 0, "loss_rank_avg": 0.14739468693733215, "step": 5555, "valid_targets_mean": 2265.8, "valid_targets_min": 692 }, { "epoch": 5.434995112414467, "grad_norm": 0.7652321619302118, "learning_rate": 5.795949268990964e-06, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.14698611199855804, "step": 5560, "valid_targets_mean": 2454.2, "valid_targets_min": 717 }, { "epoch": 5.439882697947214, "grad_norm": 0.8333089448649366, "learning_rate": 5.7616700704716545e-06, "loss": 0.1625, "loss_nan_ranks": 0, "loss_rank_avg": 0.15633103251457214, "step": 5565, "valid_targets_mean": 2116.5, "valid_targets_min": 848 }, { "epoch": 5.4447702834799605, "grad_norm": 0.8009884901164667, "learning_rate": 5.727475475296047e-06, "loss": 0.1622, "loss_nan_ranks": 0, "loss_rank_avg": 0.15122680366039276, "step": 5570, "valid_targets_mean": 2134.5, "valid_targets_min": 900 }, { "epoch": 5.449657869012707, "grad_norm": 0.8124584053736166, "learning_rate": 5.693365686646501e-06, "loss": 0.157, "loss_nan_ranks": 0, "loss_rank_avg": 0.16159634292125702, "step": 5575, "valid_targets_mean": 2173.5, "valid_targets_min": 809 }, { "epoch": 5.454545454545454, "grad_norm": 0.7935256921202335, "learning_rate": 5.659340907201418e-06, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.16111275553703308, "step": 5580, "valid_targets_mean": 2267.2, "valid_targets_min": 701 }, { "epoch": 5.459433040078201, "grad_norm": 0.6835989696344518, "learning_rate": 5.625401339134093e-06, "loss": 0.1516, "loss_nan_ranks": 0, "loss_rank_avg": 0.14738526940345764, "step": 5585, "valid_targets_mean": 3000.6, "valid_targets_min": 879 }, { "epoch": 5.464320625610948, "grad_norm": 0.7930964833671504, "learning_rate": 5.591547184111514e-06, "loss": 0.1594, "loss_nan_ranks": 0, "loss_rank_avg": 0.1674892157316208, "step": 5590, "valid_targets_mean": 2696.9, "valid_targets_min": 687 }, { "epoch": 5.469208211143695, "grad_norm": 0.744501626898747, "learning_rate": 5.557778643293117e-06, "loss": 0.1618, "loss_nan_ranks": 0, "loss_rank_avg": 0.16441041231155396, "step": 5595, "valid_targets_mean": 2941.3, "valid_targets_min": 1195 }, { "epoch": 5.474095796676442, "grad_norm": 0.7910032892994638, "learning_rate": 5.524095917329668e-06, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.16341263055801392, "step": 5600, "valid_targets_mean": 2293.9, "valid_targets_min": 1001 }, { "epoch": 5.478983382209188, "grad_norm": 0.8189803335488413, "learning_rate": 5.490499206361992e-06, "loss": 0.1655, "loss_nan_ranks": 0, "loss_rank_avg": 0.1621970534324646, "step": 5605, "valid_targets_mean": 2192.6, "valid_targets_min": 1044 }, { "epoch": 5.483870967741936, "grad_norm": 0.8435168373600971, "learning_rate": 5.456988710019822e-06, "loss": 0.1571, "loss_nan_ranks": 0, "loss_rank_avg": 0.1423211395740509, "step": 5610, "valid_targets_mean": 1718.4, "valid_targets_min": 756 }, { "epoch": 5.488758553274682, "grad_norm": 0.8432435824638052, "learning_rate": 5.4235646274206185e-06, "loss": 0.1645, "loss_nan_ranks": 0, "loss_rank_avg": 0.15067586302757263, "step": 5615, "valid_targets_mean": 2142.1, "valid_targets_min": 632 }, { "epoch": 5.49364613880743, "grad_norm": 0.8434772077306247, "learning_rate": 5.3902271571683815e-06, "loss": 0.1661, "loss_nan_ranks": 0, "loss_rank_avg": 0.15619194507598877, "step": 5620, "valid_targets_mean": 2239.2, "valid_targets_min": 719 }, { "epoch": 5.4985337243401755, "grad_norm": 0.7932516543133425, "learning_rate": 5.356976497352442e-06, "loss": 0.1608, "loss_nan_ranks": 0, "loss_rank_avg": 0.14296786487102509, "step": 5625, "valid_targets_mean": 2430.8, "valid_targets_min": 878 }, { "epoch": 5.503421309872923, "grad_norm": 0.7340907560380051, "learning_rate": 5.323812845546334e-06, "loss": 0.158, "loss_nan_ranks": 0, "loss_rank_avg": 0.15341924130916595, "step": 5630, "valid_targets_mean": 2661.9, "valid_targets_min": 889 }, { "epoch": 5.508308895405669, "grad_norm": 0.9584349909909398, "learning_rate": 5.290736398806575e-06, "loss": 0.1611, "loss_nan_ranks": 0, "loss_rank_avg": 0.17308732867240906, "step": 5635, "valid_targets_mean": 1577.6, "valid_targets_min": 848 }, { "epoch": 5.513196480938417, "grad_norm": 0.8019713328945052, "learning_rate": 5.2577473536715275e-06, "loss": 0.1553, "loss_nan_ranks": 0, "loss_rank_avg": 0.16516554355621338, "step": 5640, "valid_targets_mean": 2460.1, "valid_targets_min": 1066 }, { "epoch": 5.518084066471163, "grad_norm": 0.8191884705772617, "learning_rate": 5.224845906160219e-06, "loss": 0.1692, "loss_nan_ranks": 0, "loss_rank_avg": 0.15267640352249146, "step": 5645, "valid_targets_mean": 2165.6, "valid_targets_min": 752 }, { "epoch": 5.5229716520039105, "grad_norm": 0.8330339846872703, "learning_rate": 5.1920322517711615e-06, "loss": 0.1552, "loss_nan_ranks": 0, "loss_rank_avg": 0.15274596214294434, "step": 5650, "valid_targets_mean": 2050.2, "valid_targets_min": 591 }, { "epoch": 5.527859237536656, "grad_norm": 0.7824632706097082, "learning_rate": 5.1593065854812294e-06, "loss": 0.1508, "loss_nan_ranks": 0, "loss_rank_avg": 0.1320272833108902, "step": 5655, "valid_targets_mean": 2084.6, "valid_targets_min": 789 }, { "epoch": 5.532746823069404, "grad_norm": 0.8015604744159438, "learning_rate": 5.1266691017444505e-06, "loss": 0.1525, "loss_nan_ranks": 0, "loss_rank_avg": 0.1577574610710144, "step": 5660, "valid_targets_mean": 2387.2, "valid_targets_min": 800 }, { "epoch": 5.53763440860215, "grad_norm": 0.7592693450999322, "learning_rate": 5.094119994490898e-06, "loss": 0.1595, "loss_nan_ranks": 0, "loss_rank_avg": 0.16440163552761078, "step": 5665, "valid_targets_mean": 2866.8, "valid_targets_min": 772 }, { "epoch": 5.542521994134898, "grad_norm": 0.7921173779072441, "learning_rate": 5.061659457125514e-06, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.15453504025936127, "step": 5670, "valid_targets_mean": 2380.8, "valid_targets_min": 1188 }, { "epoch": 5.547409579667644, "grad_norm": 0.8120586505606648, "learning_rate": 5.029287682526949e-06, "loss": 0.1542, "loss_nan_ranks": 0, "loss_rank_avg": 0.16854724287986755, "step": 5675, "valid_targets_mean": 2460.8, "valid_targets_min": 742 }, { "epoch": 5.552297165200391, "grad_norm": 0.8499742573768506, "learning_rate": 4.997004863046446e-06, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.1677948236465454, "step": 5680, "valid_targets_mean": 2218.1, "valid_targets_min": 1013 }, { "epoch": 5.557184750733137, "grad_norm": 0.8783081648919876, "learning_rate": 4.964811190506671e-06, "loss": 0.1716, "loss_nan_ranks": 0, "loss_rank_avg": 0.18013803660869598, "step": 5685, "valid_targets_mean": 2322.4, "valid_targets_min": 692 }, { "epoch": 5.562072336265885, "grad_norm": 0.7709090075615438, "learning_rate": 4.932706856200589e-06, "loss": 0.1511, "loss_nan_ranks": 0, "loss_rank_avg": 0.14455710351467133, "step": 5690, "valid_targets_mean": 2390.8, "valid_targets_min": 626 }, { "epoch": 5.566959921798632, "grad_norm": 0.8439698983111165, "learning_rate": 4.90069205089033e-06, "loss": 0.1532, "loss_nan_ranks": 0, "loss_rank_avg": 0.16360528767108917, "step": 5695, "valid_targets_mean": 2045.9, "valid_targets_min": 708 }, { "epoch": 5.571847507331379, "grad_norm": 0.8445073532119768, "learning_rate": 4.868766964806029e-06, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.16692796349525452, "step": 5700, "valid_targets_mean": 2184.8, "valid_targets_min": 970 }, { "epoch": 5.5767350928641255, "grad_norm": 0.7247679212006615, "learning_rate": 4.8369317876447365e-06, "loss": 0.1518, "loss_nan_ranks": 0, "loss_rank_avg": 0.15431565046310425, "step": 5705, "valid_targets_mean": 3089.9, "valid_targets_min": 1388 }, { "epoch": 5.581622678396872, "grad_norm": 0.7600528639537043, "learning_rate": 4.805186708569245e-06, "loss": 0.1563, "loss_nan_ranks": 0, "loss_rank_avg": 0.17368043959140778, "step": 5710, "valid_targets_mean": 2844.1, "valid_targets_min": 958 }, { "epoch": 5.586510263929619, "grad_norm": 0.7391855729545126, "learning_rate": 4.773531916207008e-06, "loss": 0.161, "loss_nan_ranks": 0, "loss_rank_avg": 0.13605889678001404, "step": 5715, "valid_targets_mean": 2471.4, "valid_targets_min": 992 }, { "epoch": 5.591397849462366, "grad_norm": 0.769129841502073, "learning_rate": 4.741967598649002e-06, "loss": 0.1519, "loss_nan_ranks": 0, "loss_rank_avg": 0.15731492638587952, "step": 5720, "valid_targets_mean": 2548.4, "valid_targets_min": 711 }, { "epoch": 5.596285434995113, "grad_norm": 1.1287691604840524, "learning_rate": 4.7104939434485884e-06, "loss": 0.1416, "loss_nan_ranks": 0, "loss_rank_avg": 0.1409187912940979, "step": 5725, "valid_targets_mean": 2582.1, "valid_targets_min": 892 }, { "epoch": 5.60117302052786, "grad_norm": 0.9156130590977292, "learning_rate": 4.679111137620442e-06, "loss": 0.1434, "loss_nan_ranks": 0, "loss_rank_avg": 0.1329200565814972, "step": 5730, "valid_targets_mean": 1692.3, "valid_targets_min": 591 }, { "epoch": 5.606060606060606, "grad_norm": 0.8263554263382872, "learning_rate": 4.64781936763939e-06, "loss": 0.1502, "loss_nan_ranks": 0, "loss_rank_avg": 0.14420738816261292, "step": 5735, "valid_targets_mean": 2274.1, "valid_targets_min": 830 }, { "epoch": 5.610948191593353, "grad_norm": 0.7412321177836615, "learning_rate": 4.616618819439353e-06, "loss": 0.1501, "loss_nan_ranks": 0, "loss_rank_avg": 0.1455959975719452, "step": 5740, "valid_targets_mean": 2443.1, "valid_targets_min": 875 }, { "epoch": 5.6158357771261, "grad_norm": 0.7056612270287848, "learning_rate": 4.585509678412208e-06, "loss": 0.1519, "loss_nan_ranks": 0, "loss_rank_avg": 0.15663772821426392, "step": 5745, "valid_targets_mean": 3141.4, "valid_targets_min": 1052 }, { "epoch": 5.620723362658847, "grad_norm": 0.8069910406282396, "learning_rate": 4.5544921294066935e-06, "loss": 0.1541, "loss_nan_ranks": 0, "loss_rank_avg": 0.14563411474227905, "step": 5750, "valid_targets_mean": 2318.9, "valid_targets_min": 1035 }, { "epoch": 5.625610948191594, "grad_norm": 0.8114201491577269, "learning_rate": 4.523566356727309e-06, "loss": 0.1546, "loss_nan_ranks": 0, "loss_rank_avg": 0.1693604439496994, "step": 5755, "valid_targets_mean": 2370.1, "valid_targets_min": 869 }, { "epoch": 5.6304985337243405, "grad_norm": 0.8443036168376865, "learning_rate": 4.492732544133236e-06, "loss": 0.158, "loss_nan_ranks": 0, "loss_rank_avg": 0.15634265542030334, "step": 5760, "valid_targets_mean": 1911.4, "valid_targets_min": 700 }, { "epoch": 5.635386119257087, "grad_norm": 0.787586816101732, "learning_rate": 4.461990874837227e-06, "loss": 0.1502, "loss_nan_ranks": 0, "loss_rank_avg": 0.15353325009346008, "step": 5765, "valid_targets_mean": 2510.8, "valid_targets_min": 762 }, { "epoch": 5.640273704789834, "grad_norm": 0.8265538830295129, "learning_rate": 4.431341531504536e-06, "loss": 0.1529, "loss_nan_ranks": 0, "loss_rank_avg": 0.17224039137363434, "step": 5770, "valid_targets_mean": 2606.2, "valid_targets_min": 897 }, { "epoch": 5.645161290322581, "grad_norm": 0.9987858614241965, "learning_rate": 4.400784696251801e-06, "loss": 0.1596, "loss_nan_ranks": 0, "loss_rank_avg": 0.1915130913257599, "step": 5775, "valid_targets_mean": 2068.2, "valid_targets_min": 1206 }, { "epoch": 5.650048875855328, "grad_norm": 0.8197168076239274, "learning_rate": 4.37032055064599e-06, "loss": 0.1472, "loss_nan_ranks": 0, "loss_rank_avg": 0.1514715850353241, "step": 5780, "valid_targets_mean": 2108.2, "valid_targets_min": 629 }, { "epoch": 5.654936461388075, "grad_norm": 0.7371445886865936, "learning_rate": 4.3399492757033235e-06, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.20320241153240204, "step": 5785, "valid_targets_mean": 2937.3, "valid_targets_min": 720 }, { "epoch": 5.659824046920821, "grad_norm": 0.860820707417868, "learning_rate": 4.309671051888187e-06, "loss": 0.1506, "loss_nan_ranks": 0, "loss_rank_avg": 0.14680787920951843, "step": 5790, "valid_targets_mean": 1897.9, "valid_targets_min": 534 }, { "epoch": 5.664711632453568, "grad_norm": 0.7425530568167907, "learning_rate": 4.27948605911205e-06, "loss": 0.173, "loss_nan_ranks": 0, "loss_rank_avg": 0.18525880575180054, "step": 5795, "valid_targets_mean": 2515.6, "valid_targets_min": 752 }, { "epoch": 5.669599217986315, "grad_norm": 0.7672403302530817, "learning_rate": 4.2493944767324245e-06, "loss": 0.1587, "loss_nan_ranks": 0, "loss_rank_avg": 0.17380796372890472, "step": 5800, "valid_targets_mean": 2673.0, "valid_targets_min": 701 }, { "epoch": 5.674486803519062, "grad_norm": 0.8190685848445297, "learning_rate": 4.2193964835517656e-06, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.1683279573917389, "step": 5805, "valid_targets_mean": 2120.9, "valid_targets_min": 965 }, { "epoch": 5.679374389051809, "grad_norm": 1.002164296776056, "learning_rate": 4.189492257816443e-06, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.14651206135749817, "step": 5810, "valid_targets_mean": 2480.2, "valid_targets_min": 740 }, { "epoch": 5.6842619745845555, "grad_norm": 0.8097394342502438, "learning_rate": 4.159681977215663e-06, "loss": 0.1575, "loss_nan_ranks": 0, "loss_rank_avg": 0.17866715788841248, "step": 5815, "valid_targets_mean": 2452.8, "valid_targets_min": 867 }, { "epoch": 5.689149560117302, "grad_norm": 0.8423732358599466, "learning_rate": 4.1299658188804015e-06, "loss": 0.158, "loss_nan_ranks": 0, "loss_rank_avg": 0.1501942276954651, "step": 5820, "valid_targets_mean": 2100.3, "valid_targets_min": 741 }, { "epoch": 5.694037145650049, "grad_norm": 0.7237945688434769, "learning_rate": 4.1003439593823865e-06, "loss": 0.1639, "loss_nan_ranks": 0, "loss_rank_avg": 0.15869738161563873, "step": 5825, "valid_targets_mean": 2729.0, "valid_targets_min": 986 }, { "epoch": 5.698924731182796, "grad_norm": 0.7467148363318494, "learning_rate": 4.070816574733003e-06, "loss": 0.1454, "loss_nan_ranks": 0, "loss_rank_avg": 0.14755885303020477, "step": 5830, "valid_targets_mean": 2749.3, "valid_targets_min": 980 }, { "epoch": 5.703812316715543, "grad_norm": 0.7867120070266118, "learning_rate": 4.041383840382294e-06, "loss": 0.1499, "loss_nan_ranks": 0, "loss_rank_avg": 0.161052405834198, "step": 5835, "valid_targets_mean": 2601.4, "valid_targets_min": 1062 }, { "epoch": 5.70869990224829, "grad_norm": 0.9049628718004302, "learning_rate": 4.01204593121789e-06, "loss": 0.1576, "loss_nan_ranks": 0, "loss_rank_avg": 0.15240147709846497, "step": 5840, "valid_targets_mean": 1931.8, "valid_targets_min": 722 }, { "epoch": 5.713587487781036, "grad_norm": 0.8698769453803369, "learning_rate": 3.982803021563961e-06, "loss": 0.1532, "loss_nan_ranks": 0, "loss_rank_avg": 0.14392434060573578, "step": 5845, "valid_targets_mean": 2359.8, "valid_targets_min": 790 }, { "epoch": 5.718475073313783, "grad_norm": 0.7228885339388987, "learning_rate": 3.953655285180223e-06, "loss": 0.148, "loss_nan_ranks": 0, "loss_rank_avg": 0.14013831317424774, "step": 5850, "valid_targets_mean": 2797.0, "valid_targets_min": 640 }, { "epoch": 5.72336265884653, "grad_norm": 0.7537686797769533, "learning_rate": 3.924602895260843e-06, "loss": 0.1486, "loss_nan_ranks": 0, "loss_rank_avg": 0.12795598804950714, "step": 5855, "valid_targets_mean": 2317.8, "valid_targets_min": 715 }, { "epoch": 5.728250244379277, "grad_norm": 0.7471691429860486, "learning_rate": 3.895646024433475e-06, "loss": 0.1483, "loss_nan_ranks": 0, "loss_rank_avg": 0.15418082475662231, "step": 5860, "valid_targets_mean": 2598.8, "valid_targets_min": 734 }, { "epoch": 5.733137829912024, "grad_norm": 0.7549943500132472, "learning_rate": 3.866784844758196e-06, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.1698361039161682, "step": 5865, "valid_targets_mean": 2571.3, "valid_targets_min": 1006 }, { "epoch": 5.7380254154447705, "grad_norm": 0.7902697956389423, "learning_rate": 3.838019527726478e-06, "loss": 0.1514, "loss_nan_ranks": 0, "loss_rank_avg": 0.15650413930416107, "step": 5870, "valid_targets_mean": 2332.9, "valid_targets_min": 748 }, { "epoch": 5.742913000977517, "grad_norm": 0.7626167489885958, "learning_rate": 3.8093502442602037e-06, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.1520456075668335, "step": 5875, "valid_targets_mean": 2732.3, "valid_targets_min": 851 }, { "epoch": 5.747800586510264, "grad_norm": 0.890203614110944, "learning_rate": 3.7807771647106073e-06, "loss": 0.1597, "loss_nan_ranks": 0, "loss_rank_avg": 0.16833049058914185, "step": 5880, "valid_targets_mean": 2514.6, "valid_targets_min": 1051 }, { "epoch": 5.752688172043011, "grad_norm": 0.7072501670025816, "learning_rate": 3.752300458857303e-06, "loss": 0.1538, "loss_nan_ranks": 0, "loss_rank_avg": 0.15029340982437134, "step": 5885, "valid_targets_mean": 3031.2, "valid_targets_min": 837 }, { "epoch": 5.757575757575758, "grad_norm": 0.7640980023033417, "learning_rate": 3.723920295907255e-06, "loss": 0.1622, "loss_nan_ranks": 0, "loss_rank_avg": 0.1618524044752121, "step": 5890, "valid_targets_mean": 2569.4, "valid_targets_min": 728 }, { "epoch": 5.762463343108505, "grad_norm": 0.7319035255044318, "learning_rate": 3.695636844493764e-06, "loss": 0.1636, "loss_nan_ranks": 0, "loss_rank_avg": 0.16255182027816772, "step": 5895, "valid_targets_mean": 3114.8, "valid_targets_min": 951 }, { "epoch": 5.767350928641251, "grad_norm": 0.8063750882434633, "learning_rate": 3.66745027267549e-06, "loss": 0.155, "loss_nan_ranks": 0, "loss_rank_avg": 0.1666271686553955, "step": 5900, "valid_targets_mean": 2507.8, "valid_targets_min": 986 }, { "epoch": 5.772238514173998, "grad_norm": 0.8345912032783375, "learning_rate": 3.6393607479354275e-06, "loss": 0.1516, "loss_nan_ranks": 0, "loss_rank_avg": 0.15384799242019653, "step": 5905, "valid_targets_mean": 1862.2, "valid_targets_min": 635 }, { "epoch": 5.777126099706745, "grad_norm": 0.7061819113437781, "learning_rate": 3.611368437179934e-06, "loss": 0.1607, "loss_nan_ranks": 0, "loss_rank_avg": 0.18276137113571167, "step": 5910, "valid_targets_mean": 3247.3, "valid_targets_min": 1489 }, { "epoch": 5.782013685239492, "grad_norm": 0.8167005148421289, "learning_rate": 3.583473506737727e-06, "loss": 0.1589, "loss_nan_ranks": 0, "loss_rank_avg": 0.1597469002008438, "step": 5915, "valid_targets_mean": 2362.9, "valid_targets_min": 759 }, { "epoch": 5.786901270772239, "grad_norm": 0.7711204073304082, "learning_rate": 3.555676122358884e-06, "loss": 0.1597, "loss_nan_ranks": 0, "loss_rank_avg": 0.1491527557373047, "step": 5920, "valid_targets_mean": 2585.6, "valid_targets_min": 1306 }, { "epoch": 5.7917888563049855, "grad_norm": 0.7283811601045469, "learning_rate": 3.5279764492138724e-06, "loss": 0.1473, "loss_nan_ranks": 0, "loss_rank_avg": 0.17027896642684937, "step": 5925, "valid_targets_mean": 3067.6, "valid_targets_min": 522 }, { "epoch": 5.796676441837732, "grad_norm": 0.7011679340720517, "learning_rate": 3.500374651892573e-06, "loss": 0.1603, "loss_nan_ranks": 0, "loss_rank_avg": 0.1561456024646759, "step": 5930, "valid_targets_mean": 2874.4, "valid_targets_min": 851 }, { "epoch": 5.801564027370479, "grad_norm": 0.9979178900846251, "learning_rate": 3.472870894403291e-06, "loss": 0.1679, "loss_nan_ranks": 0, "loss_rank_avg": 0.1694871187210083, "step": 5935, "valid_targets_mean": 2362.9, "valid_targets_min": 513 }, { "epoch": 5.806451612903226, "grad_norm": 0.8639990166797461, "learning_rate": 3.4454653401717896e-06, "loss": 0.1527, "loss_nan_ranks": 0, "loss_rank_avg": 0.12851397693157196, "step": 5940, "valid_targets_mean": 1915.4, "valid_targets_min": 746 }, { "epoch": 5.811339198435973, "grad_norm": 0.6986837988916482, "learning_rate": 3.4181581520403005e-06, "loss": 0.1518, "loss_nan_ranks": 0, "loss_rank_avg": 0.15324917435646057, "step": 5945, "valid_targets_mean": 3119.9, "valid_targets_min": 1011 }, { "epoch": 5.81622678396872, "grad_norm": 0.8313260438961377, "learning_rate": 3.390949492266569e-06, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.1447916030883789, "step": 5950, "valid_targets_mean": 2159.3, "valid_targets_min": 800 }, { "epoch": 5.821114369501466, "grad_norm": 0.885127583979189, "learning_rate": 3.363839522522916e-06, "loss": 0.1591, "loss_nan_ranks": 0, "loss_rank_avg": 0.15982311964035034, "step": 5955, "valid_targets_mean": 1842.9, "valid_targets_min": 607 }, { "epoch": 5.826001955034213, "grad_norm": 0.7808780924503399, "learning_rate": 3.336828403895227e-06, "loss": 0.1536, "loss_nan_ranks": 0, "loss_rank_avg": 0.1592644453048706, "step": 5960, "valid_targets_mean": 2727.3, "valid_targets_min": 1050 }, { "epoch": 5.83088954056696, "grad_norm": 0.685353500101023, "learning_rate": 3.309916296882021e-06, "loss": 0.1509, "loss_nan_ranks": 0, "loss_rank_avg": 0.1466306447982788, "step": 5965, "valid_targets_mean": 2775.5, "valid_targets_min": 627 }, { "epoch": 5.835777126099707, "grad_norm": 1.2671880923497407, "learning_rate": 3.2831033613935092e-06, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.15228471159934998, "step": 5970, "valid_targets_mean": 2204.8, "valid_targets_min": 1143 }, { "epoch": 5.840664711632454, "grad_norm": 0.7532578861942046, "learning_rate": 3.256389756750613e-06, "loss": 0.1512, "loss_nan_ranks": 0, "loss_rank_avg": 0.13797354698181152, "step": 5975, "valid_targets_mean": 2369.1, "valid_targets_min": 788 }, { "epoch": 5.8455522971652005, "grad_norm": 0.7743267560564064, "learning_rate": 3.229775641684063e-06, "loss": 0.1586, "loss_nan_ranks": 0, "loss_rank_avg": 0.16579267382621765, "step": 5980, "valid_targets_mean": 2343.3, "valid_targets_min": 888 }, { "epoch": 5.850439882697947, "grad_norm": 0.7015726455253567, "learning_rate": 3.203261174333403e-06, "loss": 0.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.14441198110580444, "step": 5985, "valid_targets_mean": 2980.8, "valid_targets_min": 807 }, { "epoch": 5.855327468230694, "grad_norm": 0.7070459951461793, "learning_rate": 3.1768465122460813e-06, "loss": 0.1549, "loss_nan_ranks": 0, "loss_rank_avg": 0.1486390233039856, "step": 5990, "valid_targets_mean": 2794.2, "valid_targets_min": 824 }, { "epoch": 5.860215053763441, "grad_norm": 0.7969197667556421, "learning_rate": 3.1505318123765137e-06, "loss": 0.1576, "loss_nan_ranks": 0, "loss_rank_avg": 0.16264227032661438, "step": 5995, "valid_targets_mean": 2405.8, "valid_targets_min": 1005 }, { "epoch": 5.865102639296188, "grad_norm": 0.7190738114648545, "learning_rate": 3.12431723108515e-06, "loss": 0.1601, "loss_nan_ranks": 0, "loss_rank_avg": 0.1532568335533142, "step": 6000, "valid_targets_mean": 2788.5, "valid_targets_min": 903 }, { "epoch": 5.869990224828935, "grad_norm": 0.7936029883530649, "learning_rate": 3.0982029241375343e-06, "loss": 0.1627, "loss_nan_ranks": 0, "loss_rank_avg": 0.16097313165664673, "step": 6005, "valid_targets_mean": 2423.9, "valid_targets_min": 911 }, { "epoch": 5.874877810361681, "grad_norm": 0.7946199748419005, "learning_rate": 3.0721890467033866e-06, "loss": 0.1469, "loss_nan_ranks": 0, "loss_rank_avg": 0.1583392471075058, "step": 6010, "valid_targets_mean": 2257.8, "valid_targets_min": 654 }, { "epoch": 5.879765395894428, "grad_norm": 0.8074320913746822, "learning_rate": 3.0462757533556784e-06, "loss": 0.1466, "loss_nan_ranks": 0, "loss_rank_avg": 0.13972869515419006, "step": 6015, "valid_targets_mean": 2338.6, "valid_targets_min": 708 }, { "epoch": 5.884652981427175, "grad_norm": 0.8929139568223418, "learning_rate": 3.020463198069721e-06, "loss": 0.1529, "loss_nan_ranks": 0, "loss_rank_avg": 0.16818490624427795, "step": 6020, "valid_targets_mean": 2117.4, "valid_targets_min": 727 }, { "epoch": 5.889540566959922, "grad_norm": 0.6713747500739194, "learning_rate": 2.994751534222251e-06, "loss": 0.1476, "loss_nan_ranks": 0, "loss_rank_avg": 0.1403338611125946, "step": 6025, "valid_targets_mean": 2784.2, "valid_targets_min": 1212 }, { "epoch": 5.894428152492669, "grad_norm": 0.7757304779081556, "learning_rate": 2.969140914590498e-06, "loss": 0.1488, "loss_nan_ranks": 0, "loss_rank_avg": 0.14841482043266296, "step": 6030, "valid_targets_mean": 2193.8, "valid_targets_min": 790 }, { "epoch": 5.8993157380254155, "grad_norm": 0.8629820125294086, "learning_rate": 2.943631491351311e-06, "loss": 0.1544, "loss_nan_ranks": 0, "loss_rank_avg": 0.15556024014949799, "step": 6035, "valid_targets_mean": 2002.3, "valid_targets_min": 1163 }, { "epoch": 5.904203323558162, "grad_norm": 0.8188534807515834, "learning_rate": 2.918223416080219e-06, "loss": 0.1502, "loss_nan_ranks": 0, "loss_rank_avg": 0.16173824667930603, "step": 6040, "valid_targets_mean": 2232.9, "valid_targets_min": 891 }, { "epoch": 5.909090909090909, "grad_norm": 0.8132660493437572, "learning_rate": 2.892916839750557e-06, "loss": 0.1405, "loss_nan_ranks": 0, "loss_rank_avg": 0.1494334191083908, "step": 6045, "valid_targets_mean": 2253.3, "valid_targets_min": 732 }, { "epoch": 5.913978494623656, "grad_norm": 0.654182287461871, "learning_rate": 2.8677119127325625e-06, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.15798476338386536, "step": 6050, "valid_targets_mean": 3594.9, "valid_targets_min": 1150 }, { "epoch": 5.918866080156403, "grad_norm": 0.6693246221511635, "learning_rate": 2.8426087847924643e-06, "loss": 0.1523, "loss_nan_ranks": 0, "loss_rank_avg": 0.13518929481506348, "step": 6055, "valid_targets_mean": 2902.4, "valid_targets_min": 1123 }, { "epoch": 5.92375366568915, "grad_norm": 0.8107053745570154, "learning_rate": 2.8176076050916255e-06, "loss": 0.1463, "loss_nan_ranks": 0, "loss_rank_avg": 0.15758317708969116, "step": 6060, "valid_targets_mean": 2398.6, "valid_targets_min": 711 }, { "epoch": 5.9286412512218964, "grad_norm": 0.9021761140325874, "learning_rate": 2.7927085221856185e-06, "loss": 0.1442, "loss_nan_ranks": 0, "loss_rank_avg": 0.15211939811706543, "step": 6065, "valid_targets_mean": 1915.1, "valid_targets_min": 619 }, { "epoch": 5.933528836754643, "grad_norm": 0.7392044459110118, "learning_rate": 2.7679116840233788e-06, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.1442590355873108, "step": 6070, "valid_targets_mean": 2682.1, "valid_targets_min": 837 }, { "epoch": 5.93841642228739, "grad_norm": 0.7909706387505339, "learning_rate": 2.7432172379463073e-06, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.1507616639137268, "step": 6075, "valid_targets_mean": 2728.3, "valid_targets_min": 1133 }, { "epoch": 5.943304007820137, "grad_norm": 0.6858517709489104, "learning_rate": 2.718625330687381e-06, "loss": 0.156, "loss_nan_ranks": 0, "loss_rank_avg": 0.1569923758506775, "step": 6080, "valid_targets_mean": 3103.2, "valid_targets_min": 698 }, { "epoch": 5.948191593352884, "grad_norm": 0.7282489397560563, "learning_rate": 2.6941361083703244e-06, "loss": 0.155, "loss_nan_ranks": 0, "loss_rank_avg": 0.15824103355407715, "step": 6085, "valid_targets_mean": 3084.2, "valid_targets_min": 1098 }, { "epoch": 5.9530791788856305, "grad_norm": 0.8200856694692574, "learning_rate": 2.6697497165086826e-06, "loss": 0.1461, "loss_nan_ranks": 0, "loss_rank_avg": 0.14971165359020233, "step": 6090, "valid_targets_mean": 1849.7, "valid_targets_min": 690 }, { "epoch": 5.957966764418377, "grad_norm": 0.8145406485221162, "learning_rate": 2.645466300005013e-06, "loss": 0.1554, "loss_nan_ranks": 0, "loss_rank_avg": 0.14848312735557556, "step": 6095, "valid_targets_mean": 2086.6, "valid_targets_min": 765 }, { "epoch": 5.962854349951124, "grad_norm": 0.7660068981755783, "learning_rate": 2.6212860031499942e-06, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.14158686995506287, "step": 6100, "valid_targets_mean": 2279.2, "valid_targets_min": 1033 }, { "epoch": 5.967741935483871, "grad_norm": 0.8064378082219088, "learning_rate": 2.597208969621561e-06, "loss": 0.1637, "loss_nan_ranks": 0, "loss_rank_avg": 0.14924579858779907, "step": 6105, "valid_targets_mean": 2187.1, "valid_targets_min": 777 }, { "epoch": 5.972629521016618, "grad_norm": 0.7501577303291025, "learning_rate": 2.5732353424840817e-06, "loss": 0.1564, "loss_nan_ranks": 0, "loss_rank_avg": 0.14925900101661682, "step": 6110, "valid_targets_mean": 2335.9, "valid_targets_min": 634 }, { "epoch": 5.977517106549365, "grad_norm": 0.7898048269613115, "learning_rate": 2.549365264187469e-06, "loss": 0.1528, "loss_nan_ranks": 0, "loss_rank_avg": 0.15726542472839355, "step": 6115, "valid_targets_mean": 2276.5, "valid_targets_min": 1190 }, { "epoch": 5.9824046920821115, "grad_norm": 0.7940500094930575, "learning_rate": 2.525598876566371e-06, "loss": 0.1486, "loss_nan_ranks": 0, "loss_rank_avg": 0.1534472405910492, "step": 6120, "valid_targets_mean": 2346.0, "valid_targets_min": 809 }, { "epoch": 5.987292277614858, "grad_norm": 0.882710433816707, "learning_rate": 2.5019363208393133e-06, "loss": 0.1646, "loss_nan_ranks": 0, "loss_rank_avg": 0.18637877702713013, "step": 6125, "valid_targets_mean": 1959.3, "valid_targets_min": 1010 }, { "epoch": 5.992179863147605, "grad_norm": 0.798333765699043, "learning_rate": 2.4783777376078443e-06, "loss": 0.1664, "loss_nan_ranks": 0, "loss_rank_avg": 0.15766102075576782, "step": 6130, "valid_targets_mean": 2160.6, "valid_targets_min": 1137 }, { "epoch": 5.997067448680352, "grad_norm": 0.8188870991896096, "learning_rate": 2.4549232668557154e-06, "loss": 0.1668, "loss_nan_ranks": 0, "loss_rank_avg": 0.15294690430164337, "step": 6135, "valid_targets_mean": 2066.3, "valid_targets_min": 733 }, { "epoch": 6.001955034213099, "grad_norm": 0.772371500976364, "learning_rate": 2.4315730479480614e-06, "loss": 0.1506, "loss_nan_ranks": 0, "loss_rank_avg": 0.14228251576423645, "step": 6140, "valid_targets_mean": 2113.5, "valid_targets_min": 941 }, { "epoch": 6.0068426197458455, "grad_norm": 0.6951812269111425, "learning_rate": 2.4083272196305483e-06, "loss": 0.146, "loss_nan_ranks": 0, "loss_rank_avg": 0.12359236180782318, "step": 6145, "valid_targets_mean": 2279.8, "valid_targets_min": 901 }, { "epoch": 6.011730205278592, "grad_norm": 0.7341125048499366, "learning_rate": 2.385185920028563e-06, "loss": 0.1344, "loss_nan_ranks": 0, "loss_rank_avg": 0.12021429091691971, "step": 6150, "valid_targets_mean": 2476.9, "valid_targets_min": 834 }, { "epoch": 6.016617790811339, "grad_norm": 0.8580978920271629, "learning_rate": 2.3621492866463845e-06, "loss": 0.1476, "loss_nan_ranks": 0, "loss_rank_avg": 0.14868280291557312, "step": 6155, "valid_targets_mean": 2026.8, "valid_targets_min": 776 }, { "epoch": 6.021505376344086, "grad_norm": 0.8292027396293019, "learning_rate": 2.3392174563663716e-06, "loss": 0.1455, "loss_nan_ranks": 0, "loss_rank_avg": 0.154433935880661, "step": 6160, "valid_targets_mean": 2073.4, "valid_targets_min": 610 }, { "epoch": 6.026392961876833, "grad_norm": 0.8083140379382482, "learning_rate": 2.3163905654481524e-06, "loss": 0.1393, "loss_nan_ranks": 0, "loss_rank_avg": 0.15254239737987518, "step": 6165, "valid_targets_mean": 2362.4, "valid_targets_min": 988 }, { "epoch": 6.03128054740958, "grad_norm": 0.711249329248669, "learning_rate": 2.293668749527809e-06, "loss": 0.1426, "loss_nan_ranks": 0, "loss_rank_avg": 0.13382339477539062, "step": 6170, "valid_targets_mean": 2892.4, "valid_targets_min": 761 }, { "epoch": 6.0361681329423265, "grad_norm": 0.7271334674837908, "learning_rate": 2.2710521436170807e-06, "loss": 0.1465, "loss_nan_ranks": 0, "loss_rank_avg": 0.15734508633613586, "step": 6175, "valid_targets_mean": 3120.2, "valid_targets_min": 1168 }, { "epoch": 6.041055718475073, "grad_norm": 0.8320574708134784, "learning_rate": 2.2485408821025435e-06, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.15673065185546875, "step": 6180, "valid_targets_mean": 2314.8, "valid_targets_min": 676 }, { "epoch": 6.04594330400782, "grad_norm": 0.7618387380481915, "learning_rate": 2.226135098744824e-06, "loss": 0.1469, "loss_nan_ranks": 0, "loss_rank_avg": 0.15294227004051208, "step": 6185, "valid_targets_mean": 2752.2, "valid_targets_min": 1263 }, { "epoch": 6.050830889540567, "grad_norm": 0.7682499575279256, "learning_rate": 2.2038349266778146e-06, "loss": 0.1508, "loss_nan_ranks": 0, "loss_rank_avg": 0.16213871538639069, "step": 6190, "valid_targets_mean": 2590.8, "valid_targets_min": 764 }, { "epoch": 6.055718475073314, "grad_norm": 0.835630554054457, "learning_rate": 2.1816404984078664e-06, "loss": 0.1431, "loss_nan_ranks": 0, "loss_rank_avg": 0.14952757954597473, "step": 6195, "valid_targets_mean": 2388.6, "valid_targets_min": 678 }, { "epoch": 6.0606060606060606, "grad_norm": 0.7123162200549785, "learning_rate": 2.1595519458129967e-06, "loss": 0.1377, "loss_nan_ranks": 0, "loss_rank_avg": 0.13014379143714905, "step": 6200, "valid_targets_mean": 2729.5, "valid_targets_min": 815 }, { "epoch": 6.065493646138807, "grad_norm": 0.8818566517853015, "learning_rate": 2.1375694001421343e-06, "loss": 0.1493, "loss_nan_ranks": 0, "loss_rank_avg": 0.15553683042526245, "step": 6205, "valid_targets_mean": 1978.7, "valid_targets_min": 761 }, { "epoch": 6.070381231671554, "grad_norm": 0.7715315446565182, "learning_rate": 2.115692992014304e-06, "loss": 0.1596, "loss_nan_ranks": 0, "loss_rank_avg": 0.15126900374889374, "step": 6210, "valid_targets_mean": 2411.3, "valid_targets_min": 1339 }, { "epoch": 6.075268817204301, "grad_norm": 0.8184332591539848, "learning_rate": 2.0939228514178735e-06, "loss": 0.1431, "loss_nan_ranks": 0, "loss_rank_avg": 0.146785169839859, "step": 6215, "valid_targets_mean": 2621.6, "valid_targets_min": 892 }, { "epoch": 6.080156402737048, "grad_norm": 0.8703651745159651, "learning_rate": 2.0722591077097844e-06, "loss": 0.1442, "loss_nan_ranks": 0, "loss_rank_avg": 0.14825935661792755, "step": 6220, "valid_targets_mean": 1934.5, "valid_targets_min": 621 }, { "epoch": 6.085043988269795, "grad_norm": 0.8574526478965231, "learning_rate": 2.0507018896147525e-06, "loss": 0.139, "loss_nan_ranks": 0, "loss_rank_avg": 0.1470494568347931, "step": 6225, "valid_targets_mean": 2009.9, "valid_targets_min": 591 }, { "epoch": 6.0899315738025415, "grad_norm": 0.8481048091940785, "learning_rate": 2.0292513252245507e-06, "loss": 0.1512, "loss_nan_ranks": 0, "loss_rank_avg": 0.15715302526950836, "step": 6230, "valid_targets_mean": 2249.1, "valid_targets_min": 750 }, { "epoch": 6.094819159335288, "grad_norm": 0.8473826531669545, "learning_rate": 2.0079075419971937e-06, "loss": 0.1385, "loss_nan_ranks": 0, "loss_rank_avg": 0.15390710532665253, "step": 6235, "valid_targets_mean": 2229.1, "valid_targets_min": 659 }, { "epoch": 6.099706744868035, "grad_norm": 0.813390106542457, "learning_rate": 1.986670666756234e-06, "loss": 0.1407, "loss_nan_ranks": 0, "loss_rank_avg": 0.1278359740972519, "step": 6240, "valid_targets_mean": 2046.5, "valid_targets_min": 814 }, { "epoch": 6.104594330400782, "grad_norm": 0.8400309752046771, "learning_rate": 1.9655408256899713e-06, "loss": 0.1385, "loss_nan_ranks": 0, "loss_rank_avg": 0.15281391143798828, "step": 6245, "valid_targets_mean": 2291.9, "valid_targets_min": 733 }, { "epoch": 6.109481915933529, "grad_norm": 0.7250372273390747, "learning_rate": 1.944518144350709e-06, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.1458112895488739, "step": 6250, "valid_targets_mean": 2883.2, "valid_targets_min": 804 }, { "epoch": 6.114369501466276, "grad_norm": 0.8632663254658965, "learning_rate": 1.9236027476540276e-06, "loss": 0.1397, "loss_nan_ranks": 0, "loss_rank_avg": 0.14336003363132477, "step": 6255, "valid_targets_mean": 2101.6, "valid_targets_min": 817 }, { "epoch": 6.119257086999022, "grad_norm": 0.7798497119811234, "learning_rate": 1.9027947598780127e-06, "loss": 0.127, "loss_nan_ranks": 0, "loss_rank_avg": 0.14085283875465393, "step": 6260, "valid_targets_mean": 2175.4, "valid_targets_min": 714 }, { "epoch": 6.124144672531769, "grad_norm": 0.8683686286891048, "learning_rate": 1.8820943046625429e-06, "loss": 0.144, "loss_nan_ranks": 0, "loss_rank_avg": 0.12134305387735367, "step": 6265, "valid_targets_mean": 1859.7, "valid_targets_min": 776 }, { "epoch": 6.129032258064516, "grad_norm": 0.8639340556226129, "learning_rate": 1.861501505008545e-06, "loss": 0.1397, "loss_nan_ranks": 0, "loss_rank_avg": 0.14260660111904144, "step": 6270, "valid_targets_mean": 2105.2, "valid_targets_min": 905 }, { "epoch": 6.133919843597263, "grad_norm": 0.7652388086076658, "learning_rate": 1.8410164832772536e-06, "loss": 0.1365, "loss_nan_ranks": 0, "loss_rank_avg": 0.1462109088897705, "step": 6275, "valid_targets_mean": 2521.6, "valid_targets_min": 689 }, { "epoch": 6.13880742913001, "grad_norm": 0.8599010636007501, "learning_rate": 1.8206393611895045e-06, "loss": 0.1552, "loss_nan_ranks": 0, "loss_rank_avg": 0.15619584918022156, "step": 6280, "valid_targets_mean": 2249.8, "valid_targets_min": 1113 }, { "epoch": 6.1436950146627565, "grad_norm": 0.8398925161179197, "learning_rate": 1.8003702598249861e-06, "loss": 0.1447, "loss_nan_ranks": 0, "loss_rank_avg": 0.14089694619178772, "step": 6285, "valid_targets_mean": 2057.7, "valid_targets_min": 1225 }, { "epoch": 6.148582600195503, "grad_norm": 0.9006101111923522, "learning_rate": 1.780209299621547e-06, "loss": 0.1417, "loss_nan_ranks": 0, "loss_rank_avg": 0.1570209264755249, "step": 6290, "valid_targets_mean": 2732.9, "valid_targets_min": 922 }, { "epoch": 6.15347018572825, "grad_norm": 0.7691620511866091, "learning_rate": 1.7601566003744631e-06, "loss": 0.1364, "loss_nan_ranks": 0, "loss_rank_avg": 0.1531471312046051, "step": 6295, "valid_targets_mean": 2870.6, "valid_targets_min": 947 }, { "epoch": 6.158357771260997, "grad_norm": 0.6860071399944331, "learning_rate": 1.740212281235727e-06, "loss": 0.1378, "loss_nan_ranks": 0, "loss_rank_avg": 0.13493847846984863, "step": 6300, "valid_targets_mean": 3376.0, "valid_targets_min": 753 }, { "epoch": 6.163245356793744, "grad_norm": 0.7541769441863807, "learning_rate": 1.7203764607133377e-06, "loss": 0.155, "loss_nan_ranks": 0, "loss_rank_avg": 0.15232732892036438, "step": 6305, "valid_targets_mean": 2786.0, "valid_targets_min": 671 }, { "epoch": 6.168132942326491, "grad_norm": 0.7651389425645014, "learning_rate": 1.7006492566706233e-06, "loss": 0.1424, "loss_nan_ranks": 0, "loss_rank_avg": 0.13763144612312317, "step": 6310, "valid_targets_mean": 2695.4, "valid_targets_min": 1083 }, { "epoch": 6.173020527859237, "grad_norm": 0.8366808292024842, "learning_rate": 1.6810307863254927e-06, "loss": 0.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.14807304739952087, "step": 6315, "valid_targets_mean": 2219.9, "valid_targets_min": 827 }, { "epoch": 6.177908113391984, "grad_norm": 0.8457539648171782, "learning_rate": 1.6615211662497822e-06, "loss": 0.1458, "loss_nan_ranks": 0, "loss_rank_avg": 0.1576795130968094, "step": 6320, "valid_targets_mean": 2348.2, "valid_targets_min": 757 }, { "epoch": 6.182795698924731, "grad_norm": 0.80734473246753, "learning_rate": 1.6421205123685392e-06, "loss": 0.1507, "loss_nan_ranks": 0, "loss_rank_avg": 0.13625971972942352, "step": 6325, "valid_targets_mean": 2120.9, "valid_targets_min": 806 }, { "epoch": 6.187683284457478, "grad_norm": 0.9804288667902588, "learning_rate": 1.6228289399593334e-06, "loss": 0.1473, "loss_nan_ranks": 0, "loss_rank_avg": 0.14446699619293213, "step": 6330, "valid_targets_mean": 1873.2, "valid_targets_min": 888 }, { "epoch": 6.192570869990225, "grad_norm": 0.7529261993671538, "learning_rate": 1.603646563651604e-06, "loss": 0.1455, "loss_nan_ranks": 0, "loss_rank_avg": 0.14811274409294128, "step": 6335, "valid_targets_mean": 2624.8, "valid_targets_min": 796 }, { "epoch": 6.1974584555229715, "grad_norm": 0.7758608591461221, "learning_rate": 1.5845734974259207e-06, "loss": 0.1509, "loss_nan_ranks": 0, "loss_rank_avg": 0.13113583624362946, "step": 6340, "valid_targets_mean": 2221.9, "valid_targets_min": 900 }, { "epoch": 6.202346041055718, "grad_norm": 0.7977758438125597, "learning_rate": 1.5656098546133658e-06, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.15472404658794403, "step": 6345, "valid_targets_mean": 2333.7, "valid_targets_min": 777 }, { "epoch": 6.207233626588465, "grad_norm": 0.7496625060594996, "learning_rate": 1.5467557478948148e-06, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.15827788412570953, "step": 6350, "valid_targets_mean": 2944.5, "valid_targets_min": 659 }, { "epoch": 6.212121212121212, "grad_norm": 0.7617727567525714, "learning_rate": 1.5280112893002908e-06, "loss": 0.1433, "loss_nan_ranks": 0, "loss_rank_avg": 0.13309329748153687, "step": 6355, "valid_targets_mean": 2364.3, "valid_targets_min": 988 }, { "epoch": 6.217008797653959, "grad_norm": 0.7687353152394582, "learning_rate": 1.5093765902083069e-06, "loss": 0.1404, "loss_nan_ranks": 0, "loss_rank_avg": 0.15288090705871582, "step": 6360, "valid_targets_mean": 2643.9, "valid_targets_min": 697 }, { "epoch": 6.221896383186706, "grad_norm": 0.8946465205196672, "learning_rate": 1.4908517613451778e-06, "loss": 0.1476, "loss_nan_ranks": 0, "loss_rank_avg": 0.14633601903915405, "step": 6365, "valid_targets_mean": 2086.7, "valid_targets_min": 607 }, { "epoch": 6.226783968719452, "grad_norm": 0.8280125163578745, "learning_rate": 1.472436912784374e-06, "loss": 0.1444, "loss_nan_ranks": 0, "loss_rank_avg": 0.13586950302124023, "step": 6370, "valid_targets_mean": 2219.1, "valid_targets_min": 1104 }, { "epoch": 6.231671554252199, "grad_norm": 0.9360214005794244, "learning_rate": 1.4541321539458775e-06, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.14993751049041748, "step": 6375, "valid_targets_mean": 1659.2, "valid_targets_min": 686 }, { "epoch": 6.236559139784946, "grad_norm": 0.762660547954432, "learning_rate": 1.4359375935955222e-06, "loss": 0.1484, "loss_nan_ranks": 0, "loss_rank_avg": 0.1589202582836151, "step": 6380, "valid_targets_mean": 2716.4, "valid_targets_min": 668 }, { "epoch": 6.241446725317693, "grad_norm": 0.8996541456011813, "learning_rate": 1.4178533398443507e-06, "loss": 0.1459, "loss_nan_ranks": 0, "loss_rank_avg": 0.14994928240776062, "step": 6385, "valid_targets_mean": 1683.6, "valid_targets_min": 731 }, { "epoch": 6.24633431085044, "grad_norm": 0.7402483966290739, "learning_rate": 1.3998795001479605e-06, "loss": 0.1401, "loss_nan_ranks": 0, "loss_rank_avg": 0.15734237432479858, "step": 6390, "valid_targets_mean": 2690.1, "valid_targets_min": 776 }, { "epoch": 6.2512218963831865, "grad_norm": 0.8314893917101926, "learning_rate": 1.3820161813058786e-06, "loss": 0.1452, "loss_nan_ranks": 0, "loss_rank_avg": 0.1409616619348526, "step": 6395, "valid_targets_mean": 1984.4, "valid_targets_min": 617 }, { "epoch": 6.256109481915933, "grad_norm": 0.7192255814903107, "learning_rate": 1.3642634894609308e-06, "loss": 0.1453, "loss_nan_ranks": 0, "loss_rank_avg": 0.14671871066093445, "step": 6400, "valid_targets_mean": 2923.3, "valid_targets_min": 567 }, { "epoch": 6.26099706744868, "grad_norm": 0.7999646416770593, "learning_rate": 1.3466215300985996e-06, "loss": 0.1406, "loss_nan_ranks": 0, "loss_rank_avg": 0.13374221324920654, "step": 6405, "valid_targets_mean": 2253.6, "valid_targets_min": 701 }, { "epoch": 6.265884652981427, "grad_norm": 0.7701307733257204, "learning_rate": 1.3290904080464007e-06, "loss": 0.1466, "loss_nan_ranks": 0, "loss_rank_avg": 0.15439356863498688, "step": 6410, "valid_targets_mean": 2676.4, "valid_targets_min": 869 }, { "epoch": 6.270772238514174, "grad_norm": 0.717925366016105, "learning_rate": 1.3116702274732585e-06, "loss": 0.1441, "loss_nan_ranks": 0, "loss_rank_avg": 0.1328277885913849, "step": 6415, "valid_targets_mean": 2629.2, "valid_targets_min": 888 }, { "epoch": 6.275659824046921, "grad_norm": 0.8180028485476835, "learning_rate": 1.2943610918888893e-06, "loss": 0.1385, "loss_nan_ranks": 0, "loss_rank_avg": 0.15177467465400696, "step": 6420, "valid_targets_mean": 2332.1, "valid_targets_min": 680 }, { "epoch": 6.280547409579667, "grad_norm": 0.8165966121783467, "learning_rate": 1.277163104143191e-06, "loss": 0.1394, "loss_nan_ranks": 0, "loss_rank_avg": 0.14720627665519714, "step": 6425, "valid_targets_mean": 2315.4, "valid_targets_min": 934 }, { "epoch": 6.285434995112414, "grad_norm": 0.8235251951027993, "learning_rate": 1.2600763664256288e-06, "loss": 0.1512, "loss_nan_ranks": 0, "loss_rank_avg": 0.15732279419898987, "step": 6430, "valid_targets_mean": 2338.2, "valid_targets_min": 719 }, { "epoch": 6.290322580645161, "grad_norm": 0.8537813636704863, "learning_rate": 1.2431009802646177e-06, "loss": 0.1495, "loss_nan_ranks": 0, "loss_rank_avg": 0.15671692788600922, "step": 6435, "valid_targets_mean": 2427.2, "valid_targets_min": 614 }, { "epoch": 6.295210166177908, "grad_norm": 0.7787776965511892, "learning_rate": 1.2262370465269368e-06, "loss": 0.1413, "loss_nan_ranks": 0, "loss_rank_avg": 0.14795002341270447, "step": 6440, "valid_targets_mean": 2533.7, "valid_targets_min": 867 }, { "epoch": 6.300097751710655, "grad_norm": 0.7466171619616006, "learning_rate": 1.2094846654171133e-06, "loss": 0.1438, "loss_nan_ranks": 0, "loss_rank_avg": 0.1360429972410202, "step": 6445, "valid_targets_mean": 2684.0, "valid_targets_min": 930 }, { "epoch": 6.3049853372434015, "grad_norm": 0.8453955068732553, "learning_rate": 1.1928439364768418e-06, "loss": 0.1434, "loss_nan_ranks": 0, "loss_rank_avg": 0.1500052511692047, "step": 6450, "valid_targets_mean": 2271.9, "valid_targets_min": 656 }, { "epoch": 6.309872922776148, "grad_norm": 0.7381224772665309, "learning_rate": 1.176314958584388e-06, "loss": 0.1472, "loss_nan_ranks": 0, "loss_rank_avg": 0.1459953933954239, "step": 6455, "valid_targets_mean": 2728.8, "valid_targets_min": 945 }, { "epoch": 6.314760508308895, "grad_norm": 0.7664923578206903, "learning_rate": 1.1598978299539886e-06, "loss": 0.1374, "loss_nan_ranks": 0, "loss_rank_avg": 0.11979406327009201, "step": 6460, "valid_targets_mean": 2113.8, "valid_targets_min": 740 }, { "epoch": 6.319648093841642, "grad_norm": 0.774864233400857, "learning_rate": 1.143592648135292e-06, "loss": 0.1475, "loss_nan_ranks": 0, "loss_rank_avg": 0.13750594854354858, "step": 6465, "valid_targets_mean": 2761.6, "valid_targets_min": 847 }, { "epoch": 6.324535679374389, "grad_norm": 0.887880805842084, "learning_rate": 1.1273995100127478e-06, "loss": 0.1547, "loss_nan_ranks": 0, "loss_rank_avg": 0.1429017186164856, "step": 6470, "valid_targets_mean": 1817.9, "valid_targets_min": 739 }, { "epoch": 6.329423264907136, "grad_norm": 0.7426599652356065, "learning_rate": 1.1113185118050662e-06, "loss": 0.1451, "loss_nan_ranks": 0, "loss_rank_avg": 0.1407342255115509, "step": 6475, "valid_targets_mean": 2687.5, "valid_targets_min": 830 }, { "epoch": 6.334310850439882, "grad_norm": 0.8069295804769829, "learning_rate": 1.0953497490646204e-06, "loss": 0.1356, "loss_nan_ranks": 0, "loss_rank_avg": 0.1433069258928299, "step": 6480, "valid_targets_mean": 2190.9, "valid_targets_min": 635 }, { "epoch": 6.339198435972629, "grad_norm": 0.7177391118014483, "learning_rate": 1.0794933166768828e-06, "loss": 0.1408, "loss_nan_ranks": 0, "loss_rank_avg": 0.1430281698703766, "step": 6485, "valid_targets_mean": 3095.9, "valid_targets_min": 770 }, { "epoch": 6.344086021505376, "grad_norm": 0.7687796424872444, "learning_rate": 1.063749308859876e-06, "loss": 0.1395, "loss_nan_ranks": 0, "loss_rank_avg": 0.13334771990776062, "step": 6490, "valid_targets_mean": 2388.4, "valid_targets_min": 966 }, { "epoch": 6.348973607038123, "grad_norm": 0.7612117876020217, "learning_rate": 1.0481178191635876e-06, "loss": 0.1404, "loss_nan_ranks": 0, "loss_rank_avg": 0.1389297991991043, "step": 6495, "valid_targets_mean": 2652.2, "valid_targets_min": 777 }, { "epoch": 6.35386119257087, "grad_norm": 0.7514521694555615, "learning_rate": 1.0325989404694424e-06, "loss": 0.1563, "loss_nan_ranks": 0, "loss_rank_avg": 0.16383954882621765, "step": 6500, "valid_targets_mean": 2935.7, "valid_targets_min": 1179 }, { "epoch": 6.3587487781036165, "grad_norm": 0.8203426377026969, "learning_rate": 1.017192764989734e-06, "loss": 0.15, "loss_nan_ranks": 0, "loss_rank_avg": 0.15453344583511353, "step": 6505, "valid_targets_mean": 2347.6, "valid_targets_min": 721 }, { "epoch": 6.363636363636363, "grad_norm": 0.8292620788591387, "learning_rate": 1.001899384267071e-06, "loss": 0.1476, "loss_nan_ranks": 0, "loss_rank_avg": 0.15466228127479553, "step": 6510, "valid_targets_mean": 2221.9, "valid_targets_min": 750 }, { "epoch": 6.36852394916911, "grad_norm": 0.829931504832341, "learning_rate": 9.867188891738544e-07, "loss": 0.1325, "loss_nan_ranks": 0, "loss_rank_avg": 0.13335032761096954, "step": 6515, "valid_targets_mean": 2455.7, "valid_targets_min": 1143 }, { "epoch": 6.373411534701857, "grad_norm": 0.7012016461939861, "learning_rate": 9.716513699117148e-07, "loss": 0.1406, "loss_nan_ranks": 0, "loss_rank_avg": 0.12033946067094803, "step": 6520, "valid_targets_mean": 2587.4, "valid_targets_min": 1035 }, { "epoch": 6.378299120234604, "grad_norm": 0.7608167779950807, "learning_rate": 9.56696916010995e-07, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.15372420847415924, "step": 6525, "valid_targets_mean": 2700.6, "valid_targets_min": 1255 }, { "epoch": 6.383186705767351, "grad_norm": 0.7875236266722555, "learning_rate": 9.418556163302073e-07, "loss": 0.1376, "loss_nan_ranks": 0, "loss_rank_avg": 0.1496465802192688, "step": 6530, "valid_targets_mean": 2373.9, "valid_targets_min": 950 }, { "epoch": 6.388074291300097, "grad_norm": 0.9345295844327403, "learning_rate": 9.271275590555073e-07, "loss": 0.1383, "loss_nan_ranks": 0, "loss_rank_avg": 0.13679920136928558, "step": 6535, "valid_targets_mean": 2371.4, "valid_targets_min": 744 }, { "epoch": 6.392961876832844, "grad_norm": 0.8165642457777276, "learning_rate": 9.125128317001653e-07, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.14877143502235413, "step": 6540, "valid_targets_mean": 2413.6, "valid_targets_min": 692 }, { "epoch": 6.397849462365591, "grad_norm": 0.8293551530994266, "learning_rate": 8.980115211040607e-07, "loss": 0.1359, "loss_nan_ranks": 0, "loss_rank_avg": 0.12983205914497375, "step": 6545, "valid_targets_mean": 1852.1, "valid_targets_min": 635 }, { "epoch": 6.402737047898338, "grad_norm": 0.8185584829200172, "learning_rate": 8.836237134331527e-07, "loss": 0.1485, "loss_nan_ranks": 0, "loss_rank_avg": 0.1399831473827362, "step": 6550, "valid_targets_mean": 2156.9, "valid_targets_min": 878 }, { "epoch": 6.407624633431085, "grad_norm": 0.8752733032904388, "learning_rate": 8.693494941789748e-07, "loss": 0.1352, "loss_nan_ranks": 0, "loss_rank_avg": 0.14943121373653412, "step": 6555, "valid_targets_mean": 2125.4, "valid_targets_min": 791 }, { "epoch": 6.4125122189638315, "grad_norm": 0.771428128135249, "learning_rate": 8.551889481581255e-07, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.13312771916389465, "step": 6560, "valid_targets_mean": 2736.9, "valid_targets_min": 1206 }, { "epoch": 6.417399804496578, "grad_norm": 0.8363887006600691, "learning_rate": 8.411421595117519e-07, "loss": 0.1368, "loss_nan_ranks": 0, "loss_rank_avg": 0.1484169363975525, "step": 6565, "valid_targets_mean": 2258.8, "valid_targets_min": 612 }, { "epoch": 6.422287390029325, "grad_norm": 0.841896164198332, "learning_rate": 8.272092117050778e-07, "loss": 0.1485, "loss_nan_ranks": 0, "loss_rank_avg": 0.14031308889389038, "step": 6570, "valid_targets_mean": 2081.2, "valid_targets_min": 741 }, { "epoch": 6.427174975562072, "grad_norm": 0.8344208378276725, "learning_rate": 8.133901875268813e-07, "loss": 0.142, "loss_nan_ranks": 0, "loss_rank_avg": 0.16051240265369415, "step": 6575, "valid_targets_mean": 2340.0, "valid_targets_min": 793 }, { "epoch": 6.432062561094819, "grad_norm": 0.739011240056262, "learning_rate": 7.996851690890195e-07, "loss": 0.1514, "loss_nan_ranks": 0, "loss_rank_avg": 0.1327826976776123, "step": 6580, "valid_targets_mean": 2467.3, "valid_targets_min": 1040 }, { "epoch": 6.436950146627566, "grad_norm": 0.8388926850354799, "learning_rate": 7.860942378259251e-07, "loss": 0.1429, "loss_nan_ranks": 0, "loss_rank_avg": 0.13930006325244904, "step": 6585, "valid_targets_mean": 2314.1, "valid_targets_min": 687 }, { "epoch": 6.441837732160312, "grad_norm": 0.736849529441786, "learning_rate": 7.726174744941351e-07, "loss": 0.1434, "loss_nan_ranks": 0, "loss_rank_avg": 0.1561793088912964, "step": 6590, "valid_targets_mean": 3114.3, "valid_targets_min": 1144 }, { "epoch": 6.446725317693059, "grad_norm": 0.7374996366190613, "learning_rate": 7.592549591718091e-07, "loss": 0.1466, "loss_nan_ranks": 0, "loss_rank_avg": 0.14413076639175415, "step": 6595, "valid_targets_mean": 3133.8, "valid_targets_min": 1182 }, { "epoch": 6.451612903225806, "grad_norm": 0.8220802356280166, "learning_rate": 7.460067712582519e-07, "loss": 0.1426, "loss_nan_ranks": 0, "loss_rank_avg": 0.1294611543416977, "step": 6600, "valid_targets_mean": 2196.5, "valid_targets_min": 712 }, { "epoch": 6.456500488758553, "grad_norm": 0.7893984126724283, "learning_rate": 7.328729894734388e-07, "loss": 0.1505, "loss_nan_ranks": 0, "loss_rank_avg": 0.1567493975162506, "step": 6605, "valid_targets_mean": 2438.6, "valid_targets_min": 703 }, { "epoch": 6.4613880742913, "grad_norm": 0.8117586298458785, "learning_rate": 7.198536918575527e-07, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.1428253948688507, "step": 6610, "valid_targets_mean": 2303.7, "valid_targets_min": 632 }, { "epoch": 6.4662756598240465, "grad_norm": 0.7826755426811578, "learning_rate": 7.069489557705145e-07, "loss": 0.1477, "loss_nan_ranks": 0, "loss_rank_avg": 0.15663695335388184, "step": 6615, "valid_targets_mean": 2520.6, "valid_targets_min": 655 }, { "epoch": 6.471163245356793, "grad_norm": 0.8284462615884153, "learning_rate": 6.941588578915315e-07, "loss": 0.1491, "loss_nan_ranks": 0, "loss_rank_avg": 0.1673087477684021, "step": 6620, "valid_targets_mean": 2560.1, "valid_targets_min": 1093 }, { "epoch": 6.476050830889541, "grad_norm": 0.6413200188770708, "learning_rate": 6.814834742186361e-07, "loss": 0.148, "loss_nan_ranks": 0, "loss_rank_avg": 0.14878563582897186, "step": 6625, "valid_targets_mean": 4005.8, "valid_targets_min": 696 }, { "epoch": 6.480938416422287, "grad_norm": 0.7615467726204301, "learning_rate": 6.689228800682301e-07, "loss": 0.1464, "loss_nan_ranks": 0, "loss_rank_avg": 0.14344452321529388, "step": 6630, "valid_targets_mean": 2507.8, "valid_targets_min": 899 }, { "epoch": 6.485826001955035, "grad_norm": 0.7837667879512825, "learning_rate": 6.564771500746525e-07, "loss": 0.1442, "loss_nan_ranks": 0, "loss_rank_avg": 0.13829047977924347, "step": 6635, "valid_targets_mean": 2337.0, "valid_targets_min": 800 }, { "epoch": 6.490713587487781, "grad_norm": 0.7681966736659308, "learning_rate": 6.441463581897167e-07, "loss": 0.1438, "loss_nan_ranks": 0, "loss_rank_avg": 0.1388791799545288, "step": 6640, "valid_targets_mean": 2536.2, "valid_targets_min": 960 }, { "epoch": 6.495601173020528, "grad_norm": 0.7657991833749364, "learning_rate": 6.319305776822848e-07, "loss": 0.1542, "loss_nan_ranks": 0, "loss_rank_avg": 0.13757102191448212, "step": 6645, "valid_targets_mean": 2367.8, "valid_targets_min": 720 }, { "epoch": 6.500488758553274, "grad_norm": 0.8617641880740021, "learning_rate": 6.198298811378278e-07, "loss": 0.1459, "loss_nan_ranks": 0, "loss_rank_avg": 0.1516299545764923, "step": 6650, "valid_targets_mean": 2099.6, "valid_targets_min": 627 }, { "epoch": 6.505376344086022, "grad_norm": 0.8509825074669289, "learning_rate": 6.078443404579948e-07, "loss": 0.1506, "loss_nan_ranks": 0, "loss_rank_avg": 0.160349503159523, "step": 6655, "valid_targets_mean": 2118.5, "valid_targets_min": 764 }, { "epoch": 6.510263929618768, "grad_norm": 0.7385237771877197, "learning_rate": 5.959740268601843e-07, "loss": 0.1421, "loss_nan_ranks": 0, "loss_rank_avg": 0.14553092420101166, "step": 6660, "valid_targets_mean": 2765.1, "valid_targets_min": 799 }, { "epoch": 6.515151515151516, "grad_norm": 0.7414225190431922, "learning_rate": 5.842190108771206e-07, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.158996120095253, "step": 6665, "valid_targets_mean": 2852.4, "valid_targets_min": 1218 }, { "epoch": 6.5200391006842615, "grad_norm": 0.9920100082894623, "learning_rate": 5.725793623564379e-07, "loss": 0.1446, "loss_nan_ranks": 0, "loss_rank_avg": 0.143795907497406, "step": 6670, "valid_targets_mean": 2288.8, "valid_targets_min": 981 }, { "epoch": 6.524926686217009, "grad_norm": 0.7440670427532977, "learning_rate": 5.610551504602657e-07, "loss": 0.1561, "loss_nan_ranks": 0, "loss_rank_avg": 0.1507560908794403, "step": 6675, "valid_targets_mean": 2652.2, "valid_targets_min": 921 }, { "epoch": 6.529814271749755, "grad_norm": 0.8286332715981629, "learning_rate": 5.496464436648108e-07, "loss": 0.1426, "loss_nan_ranks": 0, "loss_rank_avg": 0.13288316130638123, "step": 6680, "valid_targets_mean": 1858.8, "valid_targets_min": 777 }, { "epoch": 6.534701857282503, "grad_norm": 0.8232783710376684, "learning_rate": 5.383533097599558e-07, "loss": 0.1412, "loss_nan_ranks": 0, "loss_rank_avg": 0.13944336771965027, "step": 6685, "valid_targets_mean": 2516.9, "valid_targets_min": 925 }, { "epoch": 6.539589442815249, "grad_norm": 0.7654399610127802, "learning_rate": 5.271758158488638e-07, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.13826604187488556, "step": 6690, "valid_targets_mean": 2636.9, "valid_targets_min": 902 }, { "epoch": 6.5444770283479965, "grad_norm": 0.8184911988154895, "learning_rate": 5.161140283475608e-07, "loss": 0.1411, "loss_nan_ranks": 0, "loss_rank_avg": 0.1462034285068512, "step": 6695, "valid_targets_mean": 2207.8, "valid_targets_min": 710 }, { "epoch": 6.549364613880742, "grad_norm": 0.7337833239715681, "learning_rate": 5.051680129845605e-07, "loss": 0.1366, "loss_nan_ranks": 0, "loss_rank_avg": 0.12600910663604736, "step": 6700, "valid_targets_mean": 2454.8, "valid_targets_min": 864 }, { "epoch": 6.55425219941349, "grad_norm": 0.8445779401373558, "learning_rate": 4.94337834800458e-07, "loss": 0.144, "loss_nan_ranks": 0, "loss_rank_avg": 0.1528075784444809, "step": 6705, "valid_targets_mean": 2297.4, "valid_targets_min": 716 }, { "epoch": 6.559139784946236, "grad_norm": 0.7101947557300763, "learning_rate": 4.836235581475523e-07, "loss": 0.1381, "loss_nan_ranks": 0, "loss_rank_avg": 0.12695491313934326, "step": 6710, "valid_targets_mean": 2736.0, "valid_targets_min": 801 }, { "epoch": 6.564027370478984, "grad_norm": 0.8639233831130482, "learning_rate": 4.7302524668946916e-07, "loss": 0.1365, "loss_nan_ranks": 0, "loss_rank_avg": 0.14430125057697296, "step": 6715, "valid_targets_mean": 2032.4, "valid_targets_min": 846 }, { "epoch": 6.568914956011731, "grad_norm": 0.7461099525991259, "learning_rate": 4.6254296340076497e-07, "loss": 0.1361, "loss_nan_ranks": 0, "loss_rank_avg": 0.13411906361579895, "step": 6720, "valid_targets_mean": 2808.7, "valid_targets_min": 648 }, { "epoch": 6.573802541544477, "grad_norm": 0.7989702744987931, "learning_rate": 4.521767705665747e-07, "loss": 0.1408, "loss_nan_ranks": 0, "loss_rank_avg": 0.15190516412258148, "step": 6725, "valid_targets_mean": 2514.4, "valid_targets_min": 740 }, { "epoch": 6.578690127077224, "grad_norm": 0.8220944285398598, "learning_rate": 4.419267297822205e-07, "loss": 0.1471, "loss_nan_ranks": 0, "loss_rank_avg": 0.1572040170431137, "step": 6730, "valid_targets_mean": 2357.9, "valid_targets_min": 790 }, { "epoch": 6.583577712609971, "grad_norm": 0.6585139462243008, "learning_rate": 4.317929019528566e-07, "loss": 0.1451, "loss_nan_ranks": 0, "loss_rank_avg": 0.13705238699913025, "step": 6735, "valid_targets_mean": 3228.4, "valid_targets_min": 752 }, { "epoch": 6.588465298142718, "grad_norm": 0.8169152817627165, "learning_rate": 4.217753472931141e-07, "loss": 0.1393, "loss_nan_ranks": 0, "loss_rank_avg": 0.139057457447052, "step": 6740, "valid_targets_mean": 2172.5, "valid_targets_min": 640 }, { "epoch": 6.593352883675465, "grad_norm": 0.7809355920094504, "learning_rate": 4.118741253267322e-07, "loss": 0.1459, "loss_nan_ranks": 0, "loss_rank_avg": 0.14593061804771423, "step": 6745, "valid_targets_mean": 2661.4, "valid_targets_min": 780 }, { "epoch": 6.5982404692082115, "grad_norm": 0.7768920952770774, "learning_rate": 4.020892948862032e-07, "loss": 0.1566, "loss_nan_ranks": 0, "loss_rank_avg": 0.13564547896385193, "step": 6750, "valid_targets_mean": 2473.9, "valid_targets_min": 537 }, { "epoch": 6.603128054740958, "grad_norm": 0.7722557323473561, "learning_rate": 3.9242091411243245e-07, "loss": 0.1459, "loss_nan_ranks": 0, "loss_rank_avg": 0.1392875760793686, "step": 6755, "valid_targets_mean": 2471.2, "valid_targets_min": 790 }, { "epoch": 6.608015640273705, "grad_norm": 0.7539682369302184, "learning_rate": 3.8286904045438553e-07, "loss": 0.1434, "loss_nan_ranks": 0, "loss_rank_avg": 0.1369071751832962, "step": 6760, "valid_targets_mean": 2399.9, "valid_targets_min": 610 }, { "epoch": 6.612903225806452, "grad_norm": 0.6424299073579681, "learning_rate": 3.73433730668753e-07, "loss": 0.1472, "loss_nan_ranks": 0, "loss_rank_avg": 0.13768397271633148, "step": 6765, "valid_targets_mean": 3869.8, "valid_targets_min": 1204 }, { "epoch": 6.617790811339199, "grad_norm": 0.6880284888599075, "learning_rate": 3.641150408196037e-07, "loss": 0.1459, "loss_nan_ranks": 0, "loss_rank_avg": 0.12130261957645416, "step": 6770, "valid_targets_mean": 2982.4, "valid_targets_min": 815 }, { "epoch": 6.622678396871946, "grad_norm": 0.8219148218793978, "learning_rate": 3.5491302627806314e-07, "loss": 0.1421, "loss_nan_ranks": 0, "loss_rank_avg": 0.15362417697906494, "step": 6775, "valid_targets_mean": 2819.4, "valid_targets_min": 919 }, { "epoch": 6.627565982404692, "grad_norm": 0.7921515154766982, "learning_rate": 3.4582774172197576e-07, "loss": 0.1461, "loss_nan_ranks": 0, "loss_rank_avg": 0.13740390539169312, "step": 6780, "valid_targets_mean": 2345.8, "valid_targets_min": 790 }, { "epoch": 6.632453567937439, "grad_norm": 0.7739946089387783, "learning_rate": 3.368592411355831e-07, "loss": 0.1392, "loss_nan_ranks": 0, "loss_rank_avg": 0.1267765611410141, "step": 6785, "valid_targets_mean": 2384.4, "valid_targets_min": 771 }, { "epoch": 6.637341153470186, "grad_norm": 0.7562090861343093, "learning_rate": 3.2800757780920846e-07, "loss": 0.1443, "loss_nan_ranks": 0, "loss_rank_avg": 0.1409822702407837, "step": 6790, "valid_targets_mean": 2635.0, "valid_targets_min": 594 }, { "epoch": 6.642228739002933, "grad_norm": 0.8014153886361279, "learning_rate": 3.192728043389237e-07, "loss": 0.15, "loss_nan_ranks": 0, "loss_rank_avg": 0.15787863731384277, "step": 6795, "valid_targets_mean": 2474.6, "valid_targets_min": 1065 }, { "epoch": 6.64711632453568, "grad_norm": 0.8105759791663855, "learning_rate": 3.106549726262542e-07, "loss": 0.1445, "loss_nan_ranks": 0, "loss_rank_avg": 0.15971817076206207, "step": 6800, "valid_targets_mean": 2614.4, "valid_targets_min": 1129 }, { "epoch": 6.6520039100684265, "grad_norm": 0.7732426818990713, "learning_rate": 3.0215413387787e-07, "loss": 0.1406, "loss_nan_ranks": 0, "loss_rank_avg": 0.1353302150964737, "step": 6805, "valid_targets_mean": 2363.2, "valid_targets_min": 725 }, { "epoch": 6.656891495601173, "grad_norm": 0.6933846730883887, "learning_rate": 2.937703386052637e-07, "loss": 0.1379, "loss_nan_ranks": 0, "loss_rank_avg": 0.12826628983020782, "step": 6810, "valid_targets_mean": 3215.6, "valid_targets_min": 821 }, { "epoch": 6.66177908113392, "grad_norm": 0.8557865157908506, "learning_rate": 2.8550363662447347e-07, "loss": 0.1435, "loss_nan_ranks": 0, "loss_rank_avg": 0.1560901701450348, "step": 6815, "valid_targets_mean": 2224.4, "valid_targets_min": 803 }, { "epoch": 6.666666666666667, "grad_norm": 0.8732910114888374, "learning_rate": 2.77354077055767e-07, "loss": 0.1431, "loss_nan_ranks": 0, "loss_rank_avg": 0.145709827542305, "step": 6820, "valid_targets_mean": 2143.8, "valid_targets_min": 729 }, { "epoch": 6.671554252199414, "grad_norm": 0.780368314719552, "learning_rate": 2.6932170832336016e-07, "loss": 0.1399, "loss_nan_ranks": 0, "loss_rank_avg": 0.14553119242191315, "step": 6825, "valid_targets_mean": 2521.6, "valid_targets_min": 934 }, { "epoch": 6.676441837732161, "grad_norm": 0.7148221396324418, "learning_rate": 2.614065781551345e-07, "loss": 0.1503, "loss_nan_ranks": 0, "loss_rank_avg": 0.1638277769088745, "step": 6830, "valid_targets_mean": 3283.7, "valid_targets_min": 1090 }, { "epoch": 6.681329423264907, "grad_norm": 0.7948993329236099, "learning_rate": 2.5360873358234004e-07, "loss": 0.1419, "loss_nan_ranks": 0, "loss_rank_avg": 0.14200204610824585, "step": 6835, "valid_targets_mean": 2449.1, "valid_targets_min": 738 }, { "epoch": 6.686217008797654, "grad_norm": 0.7070697581069597, "learning_rate": 2.459282209393243e-07, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.1273440271615982, "step": 6840, "valid_targets_mean": 2714.1, "valid_targets_min": 793 }, { "epoch": 6.691104594330401, "grad_norm": 0.804428556746242, "learning_rate": 2.3836508586325246e-07, "loss": 0.134, "loss_nan_ranks": 0, "loss_rank_avg": 0.13834835588932037, "step": 6845, "valid_targets_mean": 2142.0, "valid_targets_min": 684 }, { "epoch": 6.695992179863148, "grad_norm": 0.8003383717639464, "learning_rate": 2.309193732938453e-07, "loss": 0.135, "loss_nan_ranks": 0, "loss_rank_avg": 0.15829630196094513, "step": 6850, "valid_targets_mean": 2366.2, "valid_targets_min": 744 }, { "epoch": 6.700879765395895, "grad_norm": 0.8634766410996613, "learning_rate": 2.235911274730973e-07, "loss": 0.1436, "loss_nan_ranks": 0, "loss_rank_avg": 0.16072383522987366, "step": 6855, "valid_targets_mean": 2273.4, "valid_targets_min": 680 }, { "epoch": 6.7057673509286415, "grad_norm": 0.8555538490006295, "learning_rate": 2.1638039194503246e-07, "loss": 0.1477, "loss_nan_ranks": 0, "loss_rank_avg": 0.15848436951637268, "step": 6860, "valid_targets_mean": 2117.4, "valid_targets_min": 718 }, { "epoch": 6.710654936461388, "grad_norm": 0.8279297269051833, "learning_rate": 2.0928720955542436e-07, "loss": 0.1427, "loss_nan_ranks": 0, "loss_rank_avg": 0.14095677435398102, "step": 6865, "valid_targets_mean": 2048.8, "valid_targets_min": 754 }, { "epoch": 6.715542521994135, "grad_norm": 0.7949216593255324, "learning_rate": 2.0231162245156088e-07, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.15973398089408875, "step": 6870, "valid_targets_mean": 2616.4, "valid_targets_min": 898 }, { "epoch": 6.720430107526882, "grad_norm": 0.7776529385814106, "learning_rate": 1.9545367208197995e-07, "loss": 0.1435, "loss_nan_ranks": 0, "loss_rank_avg": 0.13128122687339783, "step": 6875, "valid_targets_mean": 2468.4, "valid_targets_min": 773 }, { "epoch": 6.725317693059629, "grad_norm": 0.7470593281900991, "learning_rate": 1.887133991962342e-07, "loss": 0.1472, "loss_nan_ranks": 0, "loss_rank_avg": 0.13984917104244232, "step": 6880, "valid_targets_mean": 2672.4, "valid_targets_min": 918 }, { "epoch": 6.730205278592376, "grad_norm": 0.8327481491216713, "learning_rate": 1.8209084384464005e-07, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.14572235941886902, "step": 6885, "valid_targets_mean": 2151.9, "valid_targets_min": 812 }, { "epoch": 6.735092864125122, "grad_norm": 0.7666404720709251, "learning_rate": 1.7558604537804224e-07, "loss": 0.1429, "loss_nan_ranks": 0, "loss_rank_avg": 0.1454159915447235, "step": 6890, "valid_targets_mean": 2545.7, "valid_targets_min": 759 }, { "epoch": 6.739980449657869, "grad_norm": 0.7742410628801816, "learning_rate": 1.6919904244758311e-07, "loss": 0.1486, "loss_nan_ranks": 0, "loss_rank_avg": 0.15060219168663025, "step": 6895, "valid_targets_mean": 2724.8, "valid_targets_min": 826 }, { "epoch": 6.744868035190616, "grad_norm": 0.8696550747312377, "learning_rate": 1.6292987300446705e-07, "loss": 0.1423, "loss_nan_ranks": 0, "loss_rank_avg": 0.14360955357551575, "step": 6900, "valid_targets_mean": 1997.2, "valid_targets_min": 688 }, { "epoch": 6.749755620723363, "grad_norm": 0.669193884708062, "learning_rate": 1.5677857429974296e-07, "loss": 0.1462, "loss_nan_ranks": 0, "loss_rank_avg": 0.12194126844406128, "step": 6905, "valid_targets_mean": 2778.8, "valid_targets_min": 753 }, { "epoch": 6.75464320625611, "grad_norm": 0.8129272991005836, "learning_rate": 1.507451828840756e-07, "loss": 0.1381, "loss_nan_ranks": 0, "loss_rank_avg": 0.12596674263477325, "step": 6910, "valid_targets_mean": 2184.9, "valid_targets_min": 533 }, { "epoch": 6.7595307917888565, "grad_norm": 0.8272536163498828, "learning_rate": 1.4482973460753446e-07, "loss": 0.1525, "loss_nan_ranks": 0, "loss_rank_avg": 0.16095013916492462, "step": 6915, "valid_targets_mean": 2635.4, "valid_targets_min": 1072 }, { "epoch": 6.764418377321603, "grad_norm": 0.8546760713602463, "learning_rate": 1.3903226461937424e-07, "loss": 0.1398, "loss_nan_ranks": 0, "loss_rank_avg": 0.1363896131515503, "step": 6920, "valid_targets_mean": 2176.2, "valid_targets_min": 663 }, { "epoch": 6.76930596285435, "grad_norm": 0.7403266010437409, "learning_rate": 1.3335280736783028e-07, "loss": 0.1459, "loss_nan_ranks": 0, "loss_rank_avg": 0.15206800401210785, "step": 6925, "valid_targets_mean": 2854.7, "valid_targets_min": 1169 }, { "epoch": 6.774193548387097, "grad_norm": 0.7772690818458694, "learning_rate": 1.2779139659991224e-07, "loss": 0.135, "loss_nan_ranks": 0, "loss_rank_avg": 0.1384185254573822, "step": 6930, "valid_targets_mean": 2430.2, "valid_targets_min": 708 }, { "epoch": 6.779081133919844, "grad_norm": 0.8678197977791959, "learning_rate": 1.2234806536120857e-07, "loss": 0.1488, "loss_nan_ranks": 0, "loss_rank_avg": 0.1501295566558838, "step": 6935, "valid_targets_mean": 1968.8, "valid_targets_min": 832 }, { "epoch": 6.783968719452591, "grad_norm": 1.006053072526263, "learning_rate": 1.1702284599568014e-07, "loss": 0.145, "loss_nan_ranks": 0, "loss_rank_avg": 0.15837866067886353, "step": 6940, "valid_targets_mean": 1922.8, "valid_targets_min": 692 }, { "epoch": 6.788856304985337, "grad_norm": 0.7781597084300925, "learning_rate": 1.1181577014547807e-07, "loss": 0.144, "loss_nan_ranks": 0, "loss_rank_avg": 0.14804880321025848, "step": 6945, "valid_targets_mean": 2636.6, "valid_targets_min": 874 }, { "epoch": 6.793743890518084, "grad_norm": 0.7361777760679318, "learning_rate": 1.0672686875074834e-07, "loss": 0.1425, "loss_nan_ranks": 0, "loss_rank_avg": 0.12848952412605286, "step": 6950, "valid_targets_mean": 2487.4, "valid_targets_min": 880 }, { "epoch": 6.798631476050831, "grad_norm": 0.9048873371832021, "learning_rate": 1.0175617204945421e-07, "loss": 0.1473, "loss_nan_ranks": 0, "loss_rank_avg": 0.1462620347738266, "step": 6955, "valid_targets_mean": 1957.2, "valid_targets_min": 802 }, { "epoch": 6.803519061583578, "grad_norm": 0.8115943754772563, "learning_rate": 9.690370957718965e-08, "loss": 0.1342, "loss_nan_ranks": 0, "loss_rank_avg": 0.14204561710357666, "step": 6960, "valid_targets_mean": 2568.1, "valid_targets_min": 692 }, { "epoch": 6.808406647116325, "grad_norm": 0.7847252093602829, "learning_rate": 9.216951016701281e-08, "loss": 0.1462, "loss_nan_ranks": 0, "loss_rank_avg": 0.1391274333000183, "step": 6965, "valid_targets_mean": 2426.6, "valid_targets_min": 820 }, { "epoch": 6.8132942326490715, "grad_norm": 0.7599174927993604, "learning_rate": 8.755360194926399e-08, "loss": 0.1344, "loss_nan_ranks": 0, "loss_rank_avg": 0.15206477046012878, "step": 6970, "valid_targets_mean": 2830.7, "valid_targets_min": 847 }, { "epoch": 6.818181818181818, "grad_norm": 0.7366744359812574, "learning_rate": 8.30560123514057e-08, "loss": 0.1405, "loss_nan_ranks": 0, "loss_rank_avg": 0.14298483729362488, "step": 6975, "valid_targets_mean": 2676.4, "valid_targets_min": 1298 }, { "epoch": 6.823069403714565, "grad_norm": 0.7873925943117703, "learning_rate": 7.867676809786284e-08, "loss": 0.1449, "loss_nan_ranks": 0, "loss_rank_avg": 0.14373791217803955, "step": 6980, "valid_targets_mean": 2348.8, "valid_targets_min": 737 }, { "epoch": 6.827956989247312, "grad_norm": 0.7786043991826431, "learning_rate": 7.441589520984726e-08, "loss": 0.1604, "loss_nan_ranks": 0, "loss_rank_avg": 0.1594143807888031, "step": 6985, "valid_targets_mean": 2935.5, "valid_targets_min": 921 }, { "epoch": 6.832844574780059, "grad_norm": 0.7362339661403121, "learning_rate": 7.027341900523122e-08, "loss": 0.1398, "loss_nan_ranks": 0, "loss_rank_avg": 0.1562596559524536, "step": 6990, "valid_targets_mean": 3039.9, "valid_targets_min": 1045 }, { "epoch": 6.837732160312806, "grad_norm": 0.8183556025387007, "learning_rate": 6.624936409836524e-08, "loss": 0.1482, "loss_nan_ranks": 0, "loss_rank_avg": 0.15503844618797302, "step": 6995, "valid_targets_mean": 2337.7, "valid_targets_min": 727 }, { "epoch": 6.842619745845552, "grad_norm": 0.7856265162452774, "learning_rate": 6.23437543999561e-08, "loss": 0.1539, "loss_nan_ranks": 0, "loss_rank_avg": 0.1516461968421936, "step": 7000, "valid_targets_mean": 2516.7, "valid_targets_min": 1013 }, { "epoch": 6.847507331378299, "grad_norm": 0.7797885305733583, "learning_rate": 5.855661311691574e-08, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.16110171377658844, "step": 7005, "valid_targets_mean": 2726.2, "valid_targets_min": 990 }, { "epoch": 6.852394916911046, "grad_norm": 0.8996911264100806, "learning_rate": 5.4887962752216975e-08, "loss": 0.1373, "loss_nan_ranks": 0, "loss_rank_avg": 0.14116908609867096, "step": 7010, "valid_targets_mean": 2133.9, "valid_targets_min": 967 }, { "epoch": 6.857282502443793, "grad_norm": 0.7855480605188909, "learning_rate": 5.1337825104775805e-08, "loss": 0.1477, "loss_nan_ranks": 0, "loss_rank_avg": 0.13040246069431305, "step": 7015, "valid_targets_mean": 2354.3, "valid_targets_min": 815 }, { "epoch": 6.86217008797654, "grad_norm": 0.778868414355739, "learning_rate": 4.790622126930489e-08, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.16201795637607574, "step": 7020, "valid_targets_mean": 2563.2, "valid_targets_min": 1043 }, { "epoch": 6.8670576735092865, "grad_norm": 0.8949061085156262, "learning_rate": 4.459317163619803e-08, "loss": 0.1387, "loss_nan_ranks": 0, "loss_rank_avg": 0.1284133791923523, "step": 7025, "valid_targets_mean": 1841.8, "valid_targets_min": 958 }, { "epoch": 6.871945259042033, "grad_norm": 0.9097660526010823, "learning_rate": 4.13986958914081e-08, "loss": 0.1411, "loss_nan_ranks": 0, "loss_rank_avg": 0.15148180723190308, "step": 7030, "valid_targets_mean": 1931.8, "valid_targets_min": 679 }, { "epoch": 6.87683284457478, "grad_norm": 0.8079953101764225, "learning_rate": 3.832281301632712e-08, "loss": 0.1431, "loss_nan_ranks": 0, "loss_rank_avg": 0.1472192108631134, "step": 7035, "valid_targets_mean": 2672.9, "valid_targets_min": 670 }, { "epoch": 6.881720430107527, "grad_norm": 0.8377820814625377, "learning_rate": 3.536554128767522e-08, "loss": 0.1405, "loss_nan_ranks": 0, "loss_rank_avg": 0.11620961874723434, "step": 7040, "valid_targets_mean": 1944.7, "valid_targets_min": 917 }, { "epoch": 6.886608015640274, "grad_norm": 0.9780072356339135, "learning_rate": 3.252689827739186e-08, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.13305175304412842, "step": 7045, "valid_targets_mean": 1505.8, "valid_targets_min": 921 }, { "epoch": 6.891495601173021, "grad_norm": 0.7630678184839079, "learning_rate": 2.980690085253368e-08, "loss": 0.1486, "loss_nan_ranks": 0, "loss_rank_avg": 0.14864769577980042, "step": 7050, "valid_targets_mean": 2593.9, "valid_targets_min": 625 }, { "epoch": 6.896383186705767, "grad_norm": 0.7665055215312272, "learning_rate": 2.7205565175167925e-08, "loss": 0.1484, "loss_nan_ranks": 0, "loss_rank_avg": 0.14561477303504944, "step": 7055, "valid_targets_mean": 3042.3, "valid_targets_min": 963 }, { "epoch": 6.901270772238514, "grad_norm": 0.7931423401009772, "learning_rate": 2.472290670228361e-08, "loss": 0.143, "loss_nan_ranks": 0, "loss_rank_avg": 0.14829900860786438, "step": 7060, "valid_targets_mean": 2566.6, "valid_targets_min": 672 }, { "epoch": 6.906158357771261, "grad_norm": 0.7348681150492757, "learning_rate": 2.2358940185698285e-08, "loss": 0.145, "loss_nan_ranks": 0, "loss_rank_avg": 0.15821123123168945, "step": 7065, "valid_targets_mean": 3052.2, "valid_targets_min": 1009 }, { "epoch": 6.911045943304008, "grad_norm": 0.7851239048108627, "learning_rate": 2.0113679671960317e-08, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.15088459849357605, "step": 7070, "valid_targets_mean": 2557.6, "valid_targets_min": 514 }, { "epoch": 6.915933528836755, "grad_norm": 0.7257205703096241, "learning_rate": 1.7987138502284508e-08, "loss": 0.1451, "loss_nan_ranks": 0, "loss_rank_avg": 0.14671635627746582, "step": 7075, "valid_targets_mean": 2951.8, "valid_targets_min": 1216 }, { "epoch": 6.9208211143695015, "grad_norm": 0.7158651863598146, "learning_rate": 1.5979329312456603e-08, "loss": 0.1498, "loss_nan_ranks": 0, "loss_rank_avg": 0.156073197722435, "step": 7080, "valid_targets_mean": 3083.7, "valid_targets_min": 987 }, { "epoch": 6.925708699902248, "grad_norm": 0.7570891695989537, "learning_rate": 1.4090264032760037e-08, "loss": 0.1387, "loss_nan_ranks": 0, "loss_rank_avg": 0.133244588971138, "step": 7085, "valid_targets_mean": 2580.4, "valid_targets_min": 832 }, { "epoch": 6.930596285434995, "grad_norm": 0.8832686071227391, "learning_rate": 1.2319953887918179e-08, "loss": 0.142, "loss_nan_ranks": 0, "loss_rank_avg": 0.13915324211120605, "step": 7090, "valid_targets_mean": 2498.4, "valid_targets_min": 632 }, { "epoch": 6.935483870967742, "grad_norm": 0.7469142291910154, "learning_rate": 1.0668409397009972e-08, "loss": 0.1439, "loss_nan_ranks": 0, "loss_rank_avg": 0.13527530431747437, "step": 7095, "valid_targets_mean": 3218.7, "valid_targets_min": 794 }, { "epoch": 6.940371456500489, "grad_norm": 0.7764886081432477, "learning_rate": 9.135640373418853e-09, "loss": 0.1391, "loss_nan_ranks": 0, "loss_rank_avg": 0.15149667859077454, "step": 7100, "valid_targets_mean": 2654.7, "valid_targets_min": 1291 }, { "epoch": 6.945259042033236, "grad_norm": 0.792380332907017, "learning_rate": 7.721655924770588e-09, "loss": 0.142, "loss_nan_ranks": 0, "loss_rank_avg": 0.14253517985343933, "step": 7105, "valid_targets_mean": 2680.3, "valid_targets_min": 1109 }, { "epoch": 6.9501466275659824, "grad_norm": 0.8708382788168486, "learning_rate": 6.426464452879977e-09, "loss": 0.1543, "loss_nan_ranks": 0, "loss_rank_avg": 0.15370717644691467, "step": 7110, "valid_targets_mean": 1872.2, "valid_targets_min": 824 }, { "epoch": 6.955034213098729, "grad_norm": 0.7697531302927278, "learning_rate": 5.250073653702004e-09, "loss": 0.1465, "loss_nan_ranks": 0, "loss_rank_avg": 0.14434030652046204, "step": 7115, "valid_targets_mean": 2634.2, "valid_targets_min": 882 }, { "epoch": 6.959921798631476, "grad_norm": 0.909840589624624, "learning_rate": 4.192490517285208e-09, "loss": 0.1411, "loss_nan_ranks": 0, "loss_rank_avg": 0.1433998942375183, "step": 7120, "valid_targets_mean": 1897.3, "valid_targets_min": 721 }, { "epoch": 6.964809384164223, "grad_norm": 0.880665464777133, "learning_rate": 3.2537213277228364e-09, "loss": 0.1438, "loss_nan_ranks": 0, "loss_rank_avg": 0.15554025769233704, "step": 7125, "valid_targets_mean": 2096.7, "valid_targets_min": 754 }, { "epoch": 6.96969696969697, "grad_norm": 0.7411591407393181, "learning_rate": 2.4337716631328555e-09, "loss": 0.1394, "loss_nan_ranks": 0, "loss_rank_avg": 0.13086152076721191, "step": 7130, "valid_targets_mean": 2635.5, "valid_targets_min": 826 }, { "epoch": 6.9745845552297165, "grad_norm": 0.8057506293460369, "learning_rate": 1.732646395606885e-09, "loss": 0.1429, "loss_nan_ranks": 0, "loss_rank_avg": 0.14949795603752136, "step": 7135, "valid_targets_mean": 2405.2, "valid_targets_min": 748 }, { "epoch": 6.979472140762463, "grad_norm": 0.8097660910794996, "learning_rate": 1.1503496911924316e-09, "loss": 0.1471, "loss_nan_ranks": 0, "loss_rank_avg": 0.134006530046463, "step": 7140, "valid_targets_mean": 2312.4, "valid_targets_min": 997 }, { "epoch": 6.98435972629521, "grad_norm": 0.7666411016932615, "learning_rate": 6.868850098618041e-10, "loss": 0.1485, "loss_nan_ranks": 0, "loss_rank_avg": 0.1432676464319229, "step": 7145, "valid_targets_mean": 2855.9, "valid_targets_min": 763 }, { "epoch": 6.989247311827957, "grad_norm": 0.8085737681168628, "learning_rate": 3.4225510549656947e-10, "loss": 0.1442, "loss_nan_ranks": 0, "loss_rank_avg": 0.13285693526268005, "step": 7150, "valid_targets_mean": 2373.7, "valid_targets_min": 684 }, { "epoch": 6.994134897360704, "grad_norm": 0.6798769668315741, "learning_rate": 1.1646202586756973e-10, "loss": 0.1453, "loss_nan_ranks": 0, "loss_rank_avg": 0.15072640776634216, "step": 7155, "valid_targets_mean": 3628.1, "valid_targets_min": 1272 }, { "epoch": 6.999022482893451, "grad_norm": 0.8430786453318077, "learning_rate": 9.507112626039316e-12, "loss": 0.1443, "loss_nan_ranks": 0, "loss_rank_avg": 0.11695080995559692, "step": 7160, "valid_targets_mean": 2002.8, "valid_targets_min": 715 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.1567835956811905, "step": 7161, "total_flos": 1242507420499968.0, "train_loss": 0.2217263549632857, "train_runtime": 30173.9773, "train_samples_per_second": 3.796, "train_steps_per_second": 0.237, "valid_targets_mean": 1853.1, "valid_targets_min": 622 } ], "logging_steps": 5, "max_steps": 7161, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 200, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1242507420499968.0, "train_batch_size": 1, "trial_name": null, "trial_params": null }