a1-stack_junit / trainer_state.json
EtashGuha's picture
Upload folder using huggingface_hub
c4e38ec verified
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 4606,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.007598784194528876,
"grad_norm": 16.54100795724015,
"learning_rate": 3.4707158351409984e-07,
"loss": 0.6415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6890859603881836,
"step": 5,
"valid_targets_mean": 4029.6,
"valid_targets_min": 742
},
{
"epoch": 0.015197568389057751,
"grad_norm": 17.760320126405695,
"learning_rate": 7.809110629067245e-07,
"loss": 0.6735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6768203973770142,
"step": 10,
"valid_targets_mean": 4724.0,
"valid_targets_min": 333
},
{
"epoch": 0.022796352583586626,
"grad_norm": 14.700502278309516,
"learning_rate": 1.2147505422993492e-06,
"loss": 0.6621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6386404633522034,
"step": 15,
"valid_targets_mean": 4853.7,
"valid_targets_min": 1059
},
{
"epoch": 0.030395136778115502,
"grad_norm": 12.016024137339164,
"learning_rate": 1.6485900216919743e-06,
"loss": 0.6268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6092511415481567,
"step": 20,
"valid_targets_mean": 5505.4,
"valid_targets_min": 2608
},
{
"epoch": 0.037993920972644375,
"grad_norm": 7.202624222295684,
"learning_rate": 2.0824295010845986e-06,
"loss": 0.5318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4805890917778015,
"step": 25,
"valid_targets_mean": 4894.8,
"valid_targets_min": 746
},
{
"epoch": 0.04559270516717325,
"grad_norm": 5.248039681477442,
"learning_rate": 2.516268980477224e-06,
"loss": 0.5034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5152153372764587,
"step": 30,
"valid_targets_mean": 4687.7,
"valid_targets_min": 1705
},
{
"epoch": 0.05319148936170213,
"grad_norm": 2.714176181066118,
"learning_rate": 2.950108459869848e-06,
"loss": 0.4815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4753047823905945,
"step": 35,
"valid_targets_mean": 4859.7,
"valid_targets_min": 456
},
{
"epoch": 0.060790273556231005,
"grad_norm": 1.7777692231211755,
"learning_rate": 3.383947939262473e-06,
"loss": 0.4372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4611857831478119,
"step": 40,
"valid_targets_mean": 4217.9,
"valid_targets_min": 741
},
{
"epoch": 0.06838905775075987,
"grad_norm": 1.3787959870798525,
"learning_rate": 3.817787418655098e-06,
"loss": 0.4164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4521799385547638,
"step": 45,
"valid_targets_mean": 3577.2,
"valid_targets_min": 525
},
{
"epoch": 0.07598784194528875,
"grad_norm": 1.0709482777091444,
"learning_rate": 4.251626898047723e-06,
"loss": 0.4129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45762407779693604,
"step": 50,
"valid_targets_mean": 4046.8,
"valid_targets_min": 847
},
{
"epoch": 0.08358662613981763,
"grad_norm": 0.8316164594444523,
"learning_rate": 4.685466377440348e-06,
"loss": 0.3775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38839221000671387,
"step": 55,
"valid_targets_mean": 5905.9,
"valid_targets_min": 1232
},
{
"epoch": 0.0911854103343465,
"grad_norm": 0.7446660666424425,
"learning_rate": 5.1193058568329725e-06,
"loss": 0.3891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34218358993530273,
"step": 60,
"valid_targets_mean": 4599.2,
"valid_targets_min": 554
},
{
"epoch": 0.09878419452887538,
"grad_norm": 0.8425007884341953,
"learning_rate": 5.5531453362255974e-06,
"loss": 0.3781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36715853214263916,
"step": 65,
"valid_targets_mean": 4719.6,
"valid_targets_min": 590
},
{
"epoch": 0.10638297872340426,
"grad_norm": 0.6619149306280321,
"learning_rate": 5.986984815618222e-06,
"loss": 0.3861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3819279968738556,
"step": 70,
"valid_targets_mean": 4757.8,
"valid_targets_min": 881
},
{
"epoch": 0.11398176291793313,
"grad_norm": 0.5731111234637317,
"learning_rate": 6.420824295010846e-06,
"loss": 0.3629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3706345558166504,
"step": 75,
"valid_targets_mean": 5672.5,
"valid_targets_min": 1128
},
{
"epoch": 0.12158054711246201,
"grad_norm": 0.6080686326455707,
"learning_rate": 6.854663774403471e-06,
"loss": 0.3312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38144651055336,
"step": 80,
"valid_targets_mean": 4179.6,
"valid_targets_min": 814
},
{
"epoch": 0.12917933130699089,
"grad_norm": 0.6499495432455763,
"learning_rate": 7.288503253796096e-06,
"loss": 0.3446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3940460979938507,
"step": 85,
"valid_targets_mean": 4595.6,
"valid_targets_min": 583
},
{
"epoch": 0.13677811550151975,
"grad_norm": 0.4843533852497594,
"learning_rate": 7.722342733188721e-06,
"loss": 0.332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3182428181171417,
"step": 90,
"valid_targets_mean": 5585.4,
"valid_targets_min": 740
},
{
"epoch": 0.14437689969604864,
"grad_norm": 0.6242189491842878,
"learning_rate": 8.156182212581345e-06,
"loss": 0.3316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3119521737098694,
"step": 95,
"valid_targets_mean": 5690.2,
"valid_targets_min": 792
},
{
"epoch": 0.1519756838905775,
"grad_norm": 0.5346923069880523,
"learning_rate": 8.59002169197397e-06,
"loss": 0.3313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31788039207458496,
"step": 100,
"valid_targets_mean": 4587.9,
"valid_targets_min": 767
},
{
"epoch": 0.1595744680851064,
"grad_norm": 0.5073268077298685,
"learning_rate": 9.023861171366595e-06,
"loss": 0.3194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3051730990409851,
"step": 105,
"valid_targets_mean": 5143.8,
"valid_targets_min": 823
},
{
"epoch": 0.16717325227963525,
"grad_norm": 0.5467162692473684,
"learning_rate": 9.457700650759219e-06,
"loss": 0.3018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32401126623153687,
"step": 110,
"valid_targets_mean": 5420.0,
"valid_targets_min": 674
},
{
"epoch": 0.17477203647416414,
"grad_norm": 0.5541588789236693,
"learning_rate": 9.891540130151845e-06,
"loss": 0.3334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3607725501060486,
"step": 115,
"valid_targets_mean": 5116.0,
"valid_targets_min": 569
},
{
"epoch": 0.182370820668693,
"grad_norm": 0.5403092031436869,
"learning_rate": 1.032537960954447e-05,
"loss": 0.2937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.290938138961792,
"step": 120,
"valid_targets_mean": 4455.6,
"valid_targets_min": 1819
},
{
"epoch": 0.1899696048632219,
"grad_norm": 0.5924655899271373,
"learning_rate": 1.0759219088937095e-05,
"loss": 0.3343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31885042786598206,
"step": 125,
"valid_targets_mean": 3642.6,
"valid_targets_min": 401
},
{
"epoch": 0.19756838905775076,
"grad_norm": 0.49980402806514684,
"learning_rate": 1.119305856832972e-05,
"loss": 0.2857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2728749215602875,
"step": 130,
"valid_targets_mean": 4462.3,
"valid_targets_min": 585
},
{
"epoch": 0.20516717325227962,
"grad_norm": 0.5224338478901207,
"learning_rate": 1.1626898047722344e-05,
"loss": 0.2962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29036590456962585,
"step": 135,
"valid_targets_mean": 4953.9,
"valid_targets_min": 901
},
{
"epoch": 0.2127659574468085,
"grad_norm": 0.5647977318046398,
"learning_rate": 1.2060737527114967e-05,
"loss": 0.2992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30531400442123413,
"step": 140,
"valid_targets_mean": 3919.9,
"valid_targets_min": 797
},
{
"epoch": 0.22036474164133737,
"grad_norm": 0.5768676708119788,
"learning_rate": 1.2494577006507593e-05,
"loss": 0.3144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3926551342010498,
"step": 145,
"valid_targets_mean": 4445.3,
"valid_targets_min": 595
},
{
"epoch": 0.22796352583586627,
"grad_norm": 0.46004731662025494,
"learning_rate": 1.2928416485900217e-05,
"loss": 0.2964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23685210943222046,
"step": 150,
"valid_targets_mean": 4963.2,
"valid_targets_min": 1646
},
{
"epoch": 0.23556231003039513,
"grad_norm": 0.6456923331623713,
"learning_rate": 1.3362255965292842e-05,
"loss": 0.2947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32530516386032104,
"step": 155,
"valid_targets_mean": 3147.6,
"valid_targets_min": 713
},
{
"epoch": 0.24316109422492402,
"grad_norm": 0.5132446277120045,
"learning_rate": 1.3796095444685466e-05,
"loss": 0.2866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3017147481441498,
"step": 160,
"valid_targets_mean": 5447.2,
"valid_targets_min": 662
},
{
"epoch": 0.2507598784194529,
"grad_norm": 0.5526604062654956,
"learning_rate": 1.4229934924078092e-05,
"loss": 0.2781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2687798738479614,
"step": 165,
"valid_targets_mean": 4341.5,
"valid_targets_min": 756
},
{
"epoch": 0.25835866261398177,
"grad_norm": 0.5293460369161004,
"learning_rate": 1.4663774403470716e-05,
"loss": 0.2804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28431305289268494,
"step": 170,
"valid_targets_mean": 6130.4,
"valid_targets_min": 1724
},
{
"epoch": 0.26595744680851063,
"grad_norm": 0.5138145073678304,
"learning_rate": 1.5097613882863342e-05,
"loss": 0.2892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29994410276412964,
"step": 175,
"valid_targets_mean": 4394.1,
"valid_targets_min": 589
},
{
"epoch": 0.2735562310030395,
"grad_norm": 0.5043230432581788,
"learning_rate": 1.5531453362255964e-05,
"loss": 0.2841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2635194659233093,
"step": 180,
"valid_targets_mean": 4637.4,
"valid_targets_min": 588
},
{
"epoch": 0.2811550151975684,
"grad_norm": 0.5633614566403176,
"learning_rate": 1.5965292841648592e-05,
"loss": 0.2694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.349490761756897,
"step": 185,
"valid_targets_mean": 5181.4,
"valid_targets_min": 1743
},
{
"epoch": 0.2887537993920973,
"grad_norm": 0.5633432190899903,
"learning_rate": 1.6399132321041216e-05,
"loss": 0.2859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28400588035583496,
"step": 190,
"valid_targets_mean": 4035.6,
"valid_targets_min": 1318
},
{
"epoch": 0.29635258358662614,
"grad_norm": 0.48584306761961266,
"learning_rate": 1.6832971800433843e-05,
"loss": 0.2778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2302139550447464,
"step": 195,
"valid_targets_mean": 5217.0,
"valid_targets_min": 1825
},
{
"epoch": 0.303951367781155,
"grad_norm": 0.5423337122654377,
"learning_rate": 1.7266811279826464e-05,
"loss": 0.265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2699054479598999,
"step": 200,
"valid_targets_mean": 4060.4,
"valid_targets_min": 824
},
{
"epoch": 0.31155015197568386,
"grad_norm": 0.583883380975703,
"learning_rate": 1.770065075921909e-05,
"loss": 0.263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28162840008735657,
"step": 205,
"valid_targets_mean": 4595.1,
"valid_targets_min": 446
},
{
"epoch": 0.3191489361702128,
"grad_norm": 0.5187106940915953,
"learning_rate": 1.8134490238611715e-05,
"loss": 0.2586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25653451681137085,
"step": 210,
"valid_targets_mean": 4721.1,
"valid_targets_min": 885
},
{
"epoch": 0.32674772036474165,
"grad_norm": 0.5079241607768279,
"learning_rate": 1.856832971800434e-05,
"loss": 0.2524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.257007360458374,
"step": 215,
"valid_targets_mean": 5210.9,
"valid_targets_min": 784
},
{
"epoch": 0.3343465045592705,
"grad_norm": 0.6159525490464162,
"learning_rate": 1.9002169197396964e-05,
"loss": 0.2707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3035469651222229,
"step": 220,
"valid_targets_mean": 4253.7,
"valid_targets_min": 670
},
{
"epoch": 0.34194528875379937,
"grad_norm": 0.618048775817979,
"learning_rate": 1.9436008676789588e-05,
"loss": 0.2914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3232946991920471,
"step": 225,
"valid_targets_mean": 3915.6,
"valid_targets_min": 686
},
{
"epoch": 0.3495440729483283,
"grad_norm": 0.4988454732686451,
"learning_rate": 1.9869848156182215e-05,
"loss": 0.2604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2464175820350647,
"step": 230,
"valid_targets_mean": 4478.2,
"valid_targets_min": 1934
},
{
"epoch": 0.35714285714285715,
"grad_norm": 0.5788630961414701,
"learning_rate": 2.030368763557484e-05,
"loss": 0.2697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25093919038772583,
"step": 235,
"valid_targets_mean": 4403.9,
"valid_targets_min": 2002
},
{
"epoch": 0.364741641337386,
"grad_norm": 0.5727233609316779,
"learning_rate": 2.0737527114967463e-05,
"loss": 0.2787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2930532693862915,
"step": 240,
"valid_targets_mean": 3878.2,
"valid_targets_min": 683
},
{
"epoch": 0.3723404255319149,
"grad_norm": 0.507643333171839,
"learning_rate": 2.117136659436009e-05,
"loss": 0.2612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26503849029541016,
"step": 245,
"valid_targets_mean": 5116.3,
"valid_targets_min": 1771
},
{
"epoch": 0.3799392097264438,
"grad_norm": 0.5575549222120635,
"learning_rate": 2.160520607375271e-05,
"loss": 0.239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24154013395309448,
"step": 250,
"valid_targets_mean": 4581.1,
"valid_targets_min": 446
},
{
"epoch": 0.38753799392097266,
"grad_norm": 0.5133849867561285,
"learning_rate": 2.203904555314534e-05,
"loss": 0.2536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2547852694988251,
"step": 255,
"valid_targets_mean": 4651.8,
"valid_targets_min": 434
},
{
"epoch": 0.3951367781155015,
"grad_norm": 0.46783460540928934,
"learning_rate": 2.2472885032537963e-05,
"loss": 0.2714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23877258598804474,
"step": 260,
"valid_targets_mean": 5490.8,
"valid_targets_min": 1221
},
{
"epoch": 0.4027355623100304,
"grad_norm": 0.5446072363730794,
"learning_rate": 2.290672451193059e-05,
"loss": 0.2643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23716062307357788,
"step": 265,
"valid_targets_mean": 4415.1,
"valid_targets_min": 567
},
{
"epoch": 0.41033434650455924,
"grad_norm": 0.5076237944415188,
"learning_rate": 2.334056399132321e-05,
"loss": 0.2406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2342528998851776,
"step": 270,
"valid_targets_mean": 4982.2,
"valid_targets_min": 867
},
{
"epoch": 0.41793313069908816,
"grad_norm": 0.5204833234773354,
"learning_rate": 2.3774403470715835e-05,
"loss": 0.2722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24817609786987305,
"step": 275,
"valid_targets_mean": 4886.1,
"valid_targets_min": 1124
},
{
"epoch": 0.425531914893617,
"grad_norm": 1.1929428353263904,
"learning_rate": 2.4208242950108462e-05,
"loss": 0.2534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2741398513317108,
"step": 280,
"valid_targets_mean": 5717.5,
"valid_targets_min": 863
},
{
"epoch": 0.4331306990881459,
"grad_norm": 0.585914448752194,
"learning_rate": 2.464208242950109e-05,
"loss": 0.2498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27346092462539673,
"step": 285,
"valid_targets_mean": 4714.8,
"valid_targets_min": 738
},
{
"epoch": 0.44072948328267475,
"grad_norm": 0.6700936401277653,
"learning_rate": 2.507592190889371e-05,
"loss": 0.2714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3218214511871338,
"step": 290,
"valid_targets_mean": 3352.8,
"valid_targets_min": 665
},
{
"epoch": 0.44832826747720367,
"grad_norm": 0.5819949812246825,
"learning_rate": 2.5509761388286335e-05,
"loss": 0.2454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24475443363189697,
"step": 295,
"valid_targets_mean": 5024.5,
"valid_targets_min": 1008
},
{
"epoch": 0.45592705167173253,
"grad_norm": 0.5564851893611434,
"learning_rate": 2.5943600867678962e-05,
"loss": 0.2715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25335440039634705,
"step": 300,
"valid_targets_mean": 4271.6,
"valid_targets_min": 495
},
{
"epoch": 0.4635258358662614,
"grad_norm": 0.6776311836920197,
"learning_rate": 2.637744034707159e-05,
"loss": 0.2637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26621827483177185,
"step": 305,
"valid_targets_mean": 4792.2,
"valid_targets_min": 585
},
{
"epoch": 0.47112462006079026,
"grad_norm": 0.5014128476072633,
"learning_rate": 2.681127982646421e-05,
"loss": 0.2433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23652535676956177,
"step": 310,
"valid_targets_mean": 5203.9,
"valid_targets_min": 631
},
{
"epoch": 0.4787234042553192,
"grad_norm": 0.5471285546055437,
"learning_rate": 2.7245119305856834e-05,
"loss": 0.2392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2725940942764282,
"step": 315,
"valid_targets_mean": 4777.1,
"valid_targets_min": 1762
},
{
"epoch": 0.48632218844984804,
"grad_norm": 0.5215837029470914,
"learning_rate": 2.7678958785249462e-05,
"loss": 0.2357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2674940228462219,
"step": 320,
"valid_targets_mean": 4912.2,
"valid_targets_min": 1286
},
{
"epoch": 0.4939209726443769,
"grad_norm": 0.5545464098953832,
"learning_rate": 2.8112798264642082e-05,
"loss": 0.2555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27066224813461304,
"step": 325,
"valid_targets_mean": 4713.8,
"valid_targets_min": 581
},
{
"epoch": 0.5015197568389058,
"grad_norm": 0.5291981229160326,
"learning_rate": 2.854663774403471e-05,
"loss": 0.2646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27261027693748474,
"step": 330,
"valid_targets_mean": 5018.4,
"valid_targets_min": 825
},
{
"epoch": 0.5091185410334347,
"grad_norm": 0.5927074347019183,
"learning_rate": 2.8980477223427334e-05,
"loss": 0.249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23593679070472717,
"step": 335,
"valid_targets_mean": 4369.9,
"valid_targets_min": 852
},
{
"epoch": 0.5167173252279635,
"grad_norm": 0.5613566212263488,
"learning_rate": 2.941431670281996e-05,
"loss": 0.246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25743183493614197,
"step": 340,
"valid_targets_mean": 4878.5,
"valid_targets_min": 736
},
{
"epoch": 0.5243161094224924,
"grad_norm": 0.43333351737553155,
"learning_rate": 2.9848156182212582e-05,
"loss": 0.2418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22708739340305328,
"step": 345,
"valid_targets_mean": 5272.6,
"valid_targets_min": 2600
},
{
"epoch": 0.5319148936170213,
"grad_norm": 0.5349091750560264,
"learning_rate": 3.028199566160521e-05,
"loss": 0.2484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2423931062221527,
"step": 350,
"valid_targets_mean": 4710.4,
"valid_targets_min": 1708
},
{
"epoch": 0.5395136778115501,
"grad_norm": 0.552342573882699,
"learning_rate": 3.0715835140997834e-05,
"loss": 0.2515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2209261655807495,
"step": 355,
"valid_targets_mean": 4220.2,
"valid_targets_min": 498
},
{
"epoch": 0.547112462006079,
"grad_norm": 0.47358599117445827,
"learning_rate": 3.114967462039046e-05,
"loss": 0.2431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22403742372989655,
"step": 360,
"valid_targets_mean": 5009.1,
"valid_targets_min": 826
},
{
"epoch": 0.5547112462006079,
"grad_norm": 0.5508791979851065,
"learning_rate": 3.158351409978308e-05,
"loss": 0.271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2744586765766144,
"step": 365,
"valid_targets_mean": 4221.0,
"valid_targets_min": 658
},
{
"epoch": 0.5623100303951368,
"grad_norm": 0.4880656851972933,
"learning_rate": 3.2017353579175706e-05,
"loss": 0.257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2102406919002533,
"step": 370,
"valid_targets_mean": 5021.4,
"valid_targets_min": 422
},
{
"epoch": 0.5699088145896657,
"grad_norm": 0.5066085991817625,
"learning_rate": 3.2451193058568337e-05,
"loss": 0.2493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.220636785030365,
"step": 375,
"valid_targets_mean": 4511.9,
"valid_targets_min": 904
},
{
"epoch": 0.5775075987841946,
"grad_norm": 0.7189915330518424,
"learning_rate": 3.288503253796096e-05,
"loss": 0.2561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2566250264644623,
"step": 380,
"valid_targets_mean": 4385.5,
"valid_targets_min": 551
},
{
"epoch": 0.5851063829787234,
"grad_norm": 0.548460587196264,
"learning_rate": 3.331887201735358e-05,
"loss": 0.259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23478102684020996,
"step": 385,
"valid_targets_mean": 4521.1,
"valid_targets_min": 940
},
{
"epoch": 0.5927051671732523,
"grad_norm": 0.7285447421019886,
"learning_rate": 3.375271149674621e-05,
"loss": 0.2528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2555179297924042,
"step": 390,
"valid_targets_mean": 3723.9,
"valid_targets_min": 409
},
{
"epoch": 0.6003039513677811,
"grad_norm": 0.5544467667445715,
"learning_rate": 3.418655097613883e-05,
"loss": 0.2459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2515088617801666,
"step": 395,
"valid_targets_mean": 4729.4,
"valid_targets_min": 791
},
{
"epoch": 0.60790273556231,
"grad_norm": 0.53995409546225,
"learning_rate": 3.462039045553146e-05,
"loss": 0.2477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23457960784435272,
"step": 400,
"valid_targets_mean": 5069.6,
"valid_targets_min": 489
},
{
"epoch": 0.6155015197568389,
"grad_norm": 0.9196646418934739,
"learning_rate": 3.505422993492408e-05,
"loss": 0.2449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23785921931266785,
"step": 405,
"valid_targets_mean": 4393.4,
"valid_targets_min": 829
},
{
"epoch": 0.6231003039513677,
"grad_norm": 0.6099790951053485,
"learning_rate": 3.5488069414316705e-05,
"loss": 0.2363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23619459569454193,
"step": 410,
"valid_targets_mean": 3865.0,
"valid_targets_min": 1002
},
{
"epoch": 0.6306990881458967,
"grad_norm": 0.5925560150305617,
"learning_rate": 3.592190889370933e-05,
"loss": 0.2534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24648156762123108,
"step": 415,
"valid_targets_mean": 5077.6,
"valid_targets_min": 1028
},
{
"epoch": 0.6382978723404256,
"grad_norm": 0.5334746742630121,
"learning_rate": 3.635574837310195e-05,
"loss": 0.2337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21448864042758942,
"step": 420,
"valid_targets_mean": 4616.1,
"valid_targets_min": 574
},
{
"epoch": 0.6458966565349544,
"grad_norm": 0.5167724016109878,
"learning_rate": 3.678958785249458e-05,
"loss": 0.2433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.230168879032135,
"step": 425,
"valid_targets_mean": 4870.9,
"valid_targets_min": 921
},
{
"epoch": 0.6534954407294833,
"grad_norm": 0.5454984899416742,
"learning_rate": 3.722342733188721e-05,
"loss": 0.2439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.262331485748291,
"step": 430,
"valid_targets_mean": 5432.7,
"valid_targets_min": 933
},
{
"epoch": 0.6610942249240122,
"grad_norm": 0.7273049295570767,
"learning_rate": 3.765726681127983e-05,
"loss": 0.2398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25644373893737793,
"step": 435,
"valid_targets_mean": 3536.0,
"valid_targets_min": 710
},
{
"epoch": 0.668693009118541,
"grad_norm": 0.5453606831740409,
"learning_rate": 3.8091106290672456e-05,
"loss": 0.2312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24661529064178467,
"step": 440,
"valid_targets_mean": 4021.8,
"valid_targets_min": 599
},
{
"epoch": 0.6762917933130699,
"grad_norm": 0.5397724365767885,
"learning_rate": 3.852494577006508e-05,
"loss": 0.2536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2421499490737915,
"step": 445,
"valid_targets_mean": 4597.5,
"valid_targets_min": 370
},
{
"epoch": 0.6838905775075987,
"grad_norm": 0.5764238756332084,
"learning_rate": 3.8958785249457704e-05,
"loss": 0.2261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2172556221485138,
"step": 450,
"valid_targets_mean": 5077.4,
"valid_targets_min": 1299
},
{
"epoch": 0.6914893617021277,
"grad_norm": 0.5511870862131859,
"learning_rate": 3.939262472885033e-05,
"loss": 0.2546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23796507716178894,
"step": 455,
"valid_targets_mean": 3540.4,
"valid_targets_min": 781
},
{
"epoch": 0.6990881458966566,
"grad_norm": 0.5240137590905279,
"learning_rate": 3.982646420824295e-05,
"loss": 0.2749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3238080143928528,
"step": 460,
"valid_targets_mean": 6050.4,
"valid_targets_min": 921
},
{
"epoch": 0.7066869300911854,
"grad_norm": 0.504788443919895,
"learning_rate": 3.999994829970777e-05,
"loss": 0.2519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2535270154476166,
"step": 465,
"valid_targets_mean": 4623.6,
"valid_targets_min": 642
},
{
"epoch": 0.7142857142857143,
"grad_norm": 0.6552382106268326,
"learning_rate": 3.999963235444541e-05,
"loss": 0.249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23992504179477692,
"step": 470,
"valid_targets_mean": 5108.4,
"valid_targets_min": 702
},
{
"epoch": 0.7218844984802432,
"grad_norm": 0.5338400861286152,
"learning_rate": 3.999902919083712e-05,
"loss": 0.2426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2298986315727234,
"step": 475,
"valid_targets_mean": 4551.4,
"valid_targets_min": 827
},
{
"epoch": 0.729483282674772,
"grad_norm": 0.4717163253476549,
"learning_rate": 3.999813881754504e-05,
"loss": 0.2367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22416530549526215,
"step": 480,
"valid_targets_mean": 5166.6,
"valid_targets_min": 2461
},
{
"epoch": 0.7370820668693009,
"grad_norm": 0.46569192135259724,
"learning_rate": 3.999696124735598e-05,
"loss": 0.2388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20350381731987,
"step": 485,
"valid_targets_mean": 5345.7,
"valid_targets_min": 1890
},
{
"epoch": 0.7446808510638298,
"grad_norm": 0.42173419222407094,
"learning_rate": 3.999549649718124e-05,
"loss": 0.2325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21917913854122162,
"step": 490,
"valid_targets_mean": 6391.4,
"valid_targets_min": 3738
},
{
"epoch": 0.7522796352583586,
"grad_norm": 0.5432626540059464,
"learning_rate": 3.999374458805636e-05,
"loss": 0.2436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2308879792690277,
"step": 495,
"valid_targets_mean": 4123.1,
"valid_targets_min": 597
},
{
"epoch": 0.7598784194528876,
"grad_norm": 0.5137145588974806,
"learning_rate": 3.999170554514082e-05,
"loss": 0.2331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23714055120944977,
"step": 500,
"valid_targets_mean": 4805.9,
"valid_targets_min": 605
},
{
"epoch": 0.7674772036474165,
"grad_norm": 0.49268000212812557,
"learning_rate": 3.998937939771771e-05,
"loss": 0.2222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24276787042617798,
"step": 505,
"valid_targets_mean": 4071.9,
"valid_targets_min": 790
},
{
"epoch": 0.7750759878419453,
"grad_norm": 0.6202296018779553,
"learning_rate": 3.998676617919322e-05,
"loss": 0.2437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27594321966171265,
"step": 510,
"valid_targets_mean": 3380.7,
"valid_targets_min": 440
},
{
"epoch": 0.7826747720364742,
"grad_norm": 0.4863803507783552,
"learning_rate": 3.9983865927096276e-05,
"loss": 0.2384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24749267101287842,
"step": 515,
"valid_targets_mean": 5073.1,
"valid_targets_min": 777
},
{
"epoch": 0.790273556231003,
"grad_norm": 0.5836827968647129,
"learning_rate": 3.998067868307792e-05,
"loss": 0.2272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23861373960971832,
"step": 520,
"valid_targets_mean": 5020.6,
"valid_targets_min": 570
},
{
"epoch": 0.7978723404255319,
"grad_norm": 0.5231558404449659,
"learning_rate": 3.9977204492910744e-05,
"loss": 0.233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22653838992118835,
"step": 525,
"valid_targets_mean": 4575.4,
"valid_targets_min": 565
},
{
"epoch": 0.8054711246200608,
"grad_norm": 0.5430934870471972,
"learning_rate": 3.997344340648822e-05,
"loss": 0.2358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22603115439414978,
"step": 530,
"valid_targets_mean": 4679.3,
"valid_targets_min": 937
},
{
"epoch": 0.8130699088145896,
"grad_norm": 0.5286884499015065,
"learning_rate": 3.996939547782399e-05,
"loss": 0.2352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22073689103126526,
"step": 535,
"valid_targets_mean": 4476.1,
"valid_targets_min": 718
},
{
"epoch": 0.8206686930091185,
"grad_norm": 0.5785998410503295,
"learning_rate": 3.996506076505109e-05,
"loss": 0.2497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2660371661186218,
"step": 540,
"valid_targets_mean": 4106.3,
"valid_targets_min": 487
},
{
"epoch": 0.8282674772036475,
"grad_norm": 0.6951317726718936,
"learning_rate": 3.996043933042112e-05,
"loss": 0.2367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24442562460899353,
"step": 545,
"valid_targets_mean": 4844.5,
"valid_targets_min": 834
},
{
"epoch": 0.8358662613981763,
"grad_norm": 0.43506966442749545,
"learning_rate": 3.995553124030334e-05,
"loss": 0.2214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20776590704917908,
"step": 550,
"valid_targets_mean": 4980.6,
"valid_targets_min": 465
},
{
"epoch": 0.8434650455927052,
"grad_norm": 0.4706049122050459,
"learning_rate": 3.9950336565183725e-05,
"loss": 0.2308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27285271883010864,
"step": 555,
"valid_targets_mean": 5395.9,
"valid_targets_min": 990
},
{
"epoch": 0.851063829787234,
"grad_norm": 0.49091088519408277,
"learning_rate": 3.994485537966394e-05,
"loss": 0.221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2088671624660492,
"step": 560,
"valid_targets_mean": 4588.9,
"valid_targets_min": 930
},
{
"epoch": 0.8586626139817629,
"grad_norm": 0.5986083125056836,
"learning_rate": 3.993908776246029e-05,
"loss": 0.2397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24598953127861023,
"step": 565,
"valid_targets_mean": 3864.4,
"valid_targets_min": 694
},
{
"epoch": 0.8662613981762918,
"grad_norm": 0.5161879038146385,
"learning_rate": 3.993303379640256e-05,
"loss": 0.2433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24257272481918335,
"step": 570,
"valid_targets_mean": 3828.1,
"valid_targets_min": 714
},
{
"epoch": 0.8738601823708206,
"grad_norm": 0.4991892963677317,
"learning_rate": 3.992669356843287e-05,
"loss": 0.218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2508493661880493,
"step": 575,
"valid_targets_mean": 4322.0,
"valid_targets_min": 1183
},
{
"epoch": 0.8814589665653495,
"grad_norm": 0.46377204664593574,
"learning_rate": 3.992006716960437e-05,
"loss": 0.2293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2126588225364685,
"step": 580,
"valid_targets_mean": 4726.4,
"valid_targets_min": 771
},
{
"epoch": 0.8890577507598785,
"grad_norm": 0.4484638597015378,
"learning_rate": 3.9913154695079983e-05,
"loss": 0.2479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2277049422264099,
"step": 585,
"valid_targets_mean": 5441.6,
"valid_targets_min": 672
},
{
"epoch": 0.8966565349544073,
"grad_norm": 0.473975742493428,
"learning_rate": 3.9905956244131e-05,
"loss": 0.2406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2310577630996704,
"step": 590,
"valid_targets_mean": 4966.7,
"valid_targets_min": 171
},
{
"epoch": 0.9042553191489362,
"grad_norm": 0.5269660383414424,
"learning_rate": 3.989847192013569e-05,
"loss": 0.2439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20536382496356964,
"step": 595,
"valid_targets_mean": 4305.1,
"valid_targets_min": 818
},
{
"epoch": 0.9118541033434651,
"grad_norm": 0.5290469023785411,
"learning_rate": 3.9890701830577784e-05,
"loss": 0.2519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19890496134757996,
"step": 600,
"valid_targets_mean": 3980.8,
"valid_targets_min": 911
},
{
"epoch": 0.9194528875379939,
"grad_norm": 0.44803784041894573,
"learning_rate": 3.9882646087044944e-05,
"loss": 0.2219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2399585247039795,
"step": 605,
"valid_targets_mean": 5333.2,
"valid_targets_min": 280
},
{
"epoch": 0.9270516717325228,
"grad_norm": 0.4328101297576573,
"learning_rate": 3.987430480522717e-05,
"loss": 0.2227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21868915855884552,
"step": 610,
"valid_targets_mean": 5678.4,
"valid_targets_min": 1871
},
{
"epoch": 0.9346504559270516,
"grad_norm": 0.49304307903824257,
"learning_rate": 3.986567810491511e-05,
"loss": 0.2557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2420819252729416,
"step": 615,
"valid_targets_mean": 4536.2,
"valid_targets_min": 809
},
{
"epoch": 0.9422492401215805,
"grad_norm": 0.5700813425381566,
"learning_rate": 3.9856766109998376e-05,
"loss": 0.2407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21311193704605103,
"step": 620,
"valid_targets_mean": 4451.4,
"valid_targets_min": 593
},
{
"epoch": 0.9498480243161094,
"grad_norm": 0.6294683305416847,
"learning_rate": 3.9847568948463754e-05,
"loss": 0.2508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20918530225753784,
"step": 625,
"valid_targets_mean": 4797.4,
"valid_targets_min": 847
},
{
"epoch": 0.9574468085106383,
"grad_norm": 0.49380029688075006,
"learning_rate": 3.983808675239333e-05,
"loss": 0.2399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2152310311794281,
"step": 630,
"valid_targets_mean": 4176.9,
"valid_targets_min": 692
},
{
"epoch": 0.9650455927051672,
"grad_norm": 0.5200102205973911,
"learning_rate": 3.9828319657962655e-05,
"loss": 0.2211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2529393136501312,
"step": 635,
"valid_targets_mean": 4521.0,
"valid_targets_min": 1069
},
{
"epoch": 0.9726443768996961,
"grad_norm": 0.5009014898507517,
"learning_rate": 3.981826780543873e-05,
"loss": 0.2398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2124088704586029,
"step": 640,
"valid_targets_mean": 4639.8,
"valid_targets_min": 268
},
{
"epoch": 0.9802431610942249,
"grad_norm": 0.47854286438275906,
"learning_rate": 3.980793133917805e-05,
"loss": 0.2284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22133532166481018,
"step": 645,
"valid_targets_mean": 4939.1,
"valid_targets_min": 1059
},
{
"epoch": 0.9878419452887538,
"grad_norm": 0.44229863697562477,
"learning_rate": 3.979731040762446e-05,
"loss": 0.2596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20959582924842834,
"step": 650,
"valid_targets_mean": 5179.6,
"valid_targets_min": 805
},
{
"epoch": 0.9954407294832827,
"grad_norm": 0.4641726376092792,
"learning_rate": 3.97864051633071e-05,
"loss": 0.2249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22157493233680725,
"step": 655,
"valid_targets_mean": 4819.9,
"valid_targets_min": 646
},
{
"epoch": 1.0030395136778116,
"grad_norm": 0.7931644284514437,
"learning_rate": 3.977521576283815e-05,
"loss": 0.2343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19440427422523499,
"step": 660,
"valid_targets_mean": 4668.7,
"valid_targets_min": 915
},
{
"epoch": 1.0106382978723405,
"grad_norm": 0.48788029210277306,
"learning_rate": 3.9763742366910626e-05,
"loss": 0.206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1956978291273117,
"step": 665,
"valid_targets_mean": 4805.8,
"valid_targets_min": 694
},
{
"epoch": 1.0182370820668694,
"grad_norm": 0.5298990414713055,
"learning_rate": 3.975198514029604e-05,
"loss": 0.2228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2972638010978699,
"step": 670,
"valid_targets_mean": 4853.2,
"valid_targets_min": 512
},
{
"epoch": 1.0258358662613982,
"grad_norm": 0.5473369439399378,
"learning_rate": 3.9739944251842054e-05,
"loss": 0.2088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21648220717906952,
"step": 675,
"valid_targets_mean": 5254.8,
"valid_targets_min": 1077
},
{
"epoch": 1.033434650455927,
"grad_norm": 0.8965405989782883,
"learning_rate": 3.9727619874470066e-05,
"loss": 0.2229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24239912629127502,
"step": 680,
"valid_targets_mean": 4575.9,
"valid_targets_min": 847
},
{
"epoch": 1.041033434650456,
"grad_norm": 0.45053643384905995,
"learning_rate": 3.971501218517267e-05,
"loss": 0.2202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20542305707931519,
"step": 685,
"valid_targets_mean": 4701.5,
"valid_targets_min": 359
},
{
"epoch": 1.0486322188449848,
"grad_norm": 0.5355621304269382,
"learning_rate": 3.9702121365011194e-05,
"loss": 0.2427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24637873470783234,
"step": 690,
"valid_targets_mean": 4662.4,
"valid_targets_min": 797
},
{
"epoch": 1.0562310030395137,
"grad_norm": 0.46031160112965963,
"learning_rate": 3.968894759911304e-05,
"loss": 0.2221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22839926183223724,
"step": 695,
"valid_targets_mean": 5164.2,
"valid_targets_min": 904
},
{
"epoch": 1.0638297872340425,
"grad_norm": 0.4910433091107382,
"learning_rate": 3.9675491076669043e-05,
"loss": 0.2247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21850205957889557,
"step": 700,
"valid_targets_mean": 4950.7,
"valid_targets_min": 478
},
{
"epoch": 1.0714285714285714,
"grad_norm": 0.5876241654950701,
"learning_rate": 3.966175199093077e-05,
"loss": 0.2152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23394906520843506,
"step": 705,
"valid_targets_mean": 3169.8,
"valid_targets_min": 809
},
{
"epoch": 1.0790273556231003,
"grad_norm": 0.46432326611030017,
"learning_rate": 3.9647730539207715e-05,
"loss": 0.2216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2200213074684143,
"step": 710,
"valid_targets_mean": 5574.2,
"valid_targets_min": 2786
},
{
"epoch": 1.0866261398176291,
"grad_norm": 0.4275229879620877,
"learning_rate": 3.963342692286449e-05,
"loss": 0.2161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20706182718276978,
"step": 715,
"valid_targets_mean": 5002.6,
"valid_targets_min": 1028
},
{
"epoch": 1.094224924012158,
"grad_norm": 0.5268786606408785,
"learning_rate": 3.9618841347317925e-05,
"loss": 0.2099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20836099982261658,
"step": 720,
"valid_targets_mean": 3824.6,
"valid_targets_min": 834
},
{
"epoch": 1.1018237082066868,
"grad_norm": 0.44352266391750467,
"learning_rate": 3.9603974022034117e-05,
"loss": 0.2158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1991317719221115,
"step": 725,
"valid_targets_mean": 5762.8,
"valid_targets_min": 2565
},
{
"epoch": 1.1094224924012157,
"grad_norm": 0.5059377730602702,
"learning_rate": 3.9588825160525406e-05,
"loss": 0.2101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2332250475883484,
"step": 730,
"valid_targets_mean": 4394.6,
"valid_targets_min": 778
},
{
"epoch": 1.1170212765957448,
"grad_norm": 0.5277265421398942,
"learning_rate": 3.9573394980347354e-05,
"loss": 0.2138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23748330771923065,
"step": 735,
"valid_targets_mean": 4523.4,
"valid_targets_min": 588
},
{
"epoch": 1.1246200607902737,
"grad_norm": 0.46757311577973365,
"learning_rate": 3.9557683703095564e-05,
"loss": 0.2074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20653977990150452,
"step": 740,
"valid_targets_mean": 5119.2,
"valid_targets_min": 446
},
{
"epoch": 1.1322188449848025,
"grad_norm": 0.4423041648030623,
"learning_rate": 3.954169155440255e-05,
"loss": 0.2234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2072131335735321,
"step": 745,
"valid_targets_mean": 4472.0,
"valid_targets_min": 271
},
{
"epoch": 1.1398176291793314,
"grad_norm": 0.4428410311750491,
"learning_rate": 3.952541876393444e-05,
"loss": 0.2206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23159939050674438,
"step": 750,
"valid_targets_mean": 4634.8,
"valid_targets_min": 810
},
{
"epoch": 1.1474164133738602,
"grad_norm": 0.5243183428010766,
"learning_rate": 3.9508865565387745e-05,
"loss": 0.2137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22126150131225586,
"step": 755,
"valid_targets_mean": 4285.5,
"valid_targets_min": 702
},
{
"epoch": 1.155015197568389,
"grad_norm": 0.45761304225615707,
"learning_rate": 3.949203219648594e-05,
"loss": 0.217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20640668272972107,
"step": 760,
"valid_targets_mean": 4922.4,
"valid_targets_min": 229
},
{
"epoch": 1.162613981762918,
"grad_norm": 0.4830790302776904,
"learning_rate": 3.94749188989761e-05,
"loss": 0.2241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2300214022397995,
"step": 765,
"valid_targets_mean": 4988.9,
"valid_targets_min": 2275
},
{
"epoch": 1.1702127659574468,
"grad_norm": 0.6344964312381591,
"learning_rate": 3.945752591862538e-05,
"loss": 0.2075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22842663526535034,
"step": 770,
"valid_targets_mean": 3627.2,
"valid_targets_min": 662
},
{
"epoch": 1.1778115501519757,
"grad_norm": 0.48098689360030655,
"learning_rate": 3.943985350521753e-05,
"loss": 0.2306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2292681783437729,
"step": 775,
"valid_targets_mean": 4028.1,
"valid_targets_min": 732
},
{
"epoch": 1.1854103343465046,
"grad_norm": 0.5336086809835088,
"learning_rate": 3.942190191254928e-05,
"loss": 0.2216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22446206212043762,
"step": 780,
"valid_targets_mean": 4275.8,
"valid_targets_min": 741
},
{
"epoch": 1.1930091185410334,
"grad_norm": 0.613832091134627,
"learning_rate": 3.9403671398426705e-05,
"loss": 0.2138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2014659196138382,
"step": 785,
"valid_targets_mean": 5527.8,
"valid_targets_min": 2519
},
{
"epoch": 1.2006079027355623,
"grad_norm": 0.7772463802272693,
"learning_rate": 3.938516222466153e-05,
"loss": 0.2149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20852729678153992,
"step": 790,
"valid_targets_mean": 4968.9,
"valid_targets_min": 605
},
{
"epoch": 1.2082066869300911,
"grad_norm": 0.5158401148303159,
"learning_rate": 3.936637465706735e-05,
"loss": 0.213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25038856267929077,
"step": 795,
"valid_targets_mean": 4784.4,
"valid_targets_min": 655
},
{
"epoch": 1.21580547112462,
"grad_norm": 1.031320737042501,
"learning_rate": 3.934730896545583e-05,
"loss": 0.2212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21661558747291565,
"step": 800,
"valid_targets_mean": 3556.4,
"valid_targets_min": 653
},
{
"epoch": 1.2234042553191489,
"grad_norm": 0.46779923698778514,
"learning_rate": 3.932796542363283e-05,
"loss": 0.2113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19566161930561066,
"step": 805,
"valid_targets_mean": 4376.0,
"valid_targets_min": 810
},
{
"epoch": 1.2310030395136777,
"grad_norm": 0.4326481517949445,
"learning_rate": 3.930834430939444e-05,
"loss": 0.2145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19606706500053406,
"step": 810,
"valid_targets_mean": 5616.6,
"valid_targets_min": 2732
},
{
"epoch": 1.2386018237082066,
"grad_norm": 0.47029688029877836,
"learning_rate": 3.9288445904523063e-05,
"loss": 0.219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1963462084531784,
"step": 815,
"valid_targets_mean": 4256.6,
"valid_targets_min": 1593
},
{
"epoch": 1.2462006079027357,
"grad_norm": 0.4914352971694942,
"learning_rate": 3.926827049478329e-05,
"loss": 0.2273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2369862049818039,
"step": 820,
"valid_targets_mean": 5430.8,
"valid_targets_min": 465
},
{
"epoch": 1.2537993920972643,
"grad_norm": 0.4983986981283837,
"learning_rate": 3.924781836991783e-05,
"loss": 0.2175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2174890637397766,
"step": 825,
"valid_targets_mean": 4507.7,
"valid_targets_min": 801
},
{
"epoch": 1.2613981762917934,
"grad_norm": 0.4385888971144186,
"learning_rate": 3.922708982364337e-05,
"loss": 0.2118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21676486730575562,
"step": 830,
"valid_targets_mean": 5402.2,
"valid_targets_min": 933
},
{
"epoch": 1.2689969604863223,
"grad_norm": 0.45249778212242275,
"learning_rate": 3.920608515364631e-05,
"loss": 0.2245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20077060163021088,
"step": 835,
"valid_targets_mean": 4443.8,
"valid_targets_min": 491
},
{
"epoch": 1.2765957446808511,
"grad_norm": 0.47777362802657686,
"learning_rate": 3.9184804661578535e-05,
"loss": 0.2268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23784896731376648,
"step": 840,
"valid_targets_mean": 5061.4,
"valid_targets_min": 846
},
{
"epoch": 1.28419452887538,
"grad_norm": 0.4135085697969651,
"learning_rate": 3.9163248653053033e-05,
"loss": 0.2066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20635738968849182,
"step": 845,
"valid_targets_mean": 5489.4,
"valid_targets_min": 1148
},
{
"epoch": 1.2917933130699089,
"grad_norm": 0.4117297091921728,
"learning_rate": 3.9141417437639566e-05,
"loss": 0.2018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18252739310264587,
"step": 850,
"valid_targets_mean": 4780.3,
"valid_targets_min": 799
},
{
"epoch": 1.2993920972644377,
"grad_norm": 0.48551756342329966,
"learning_rate": 3.911931132886016e-05,
"loss": 0.2228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24173299968242645,
"step": 855,
"valid_targets_mean": 5113.2,
"valid_targets_min": 756
},
{
"epoch": 1.3069908814589666,
"grad_norm": 0.4727140541170104,
"learning_rate": 3.9096930644184674e-05,
"loss": 0.1978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1915874183177948,
"step": 860,
"valid_targets_mean": 4394.3,
"valid_targets_min": 685
},
{
"epoch": 1.3145896656534954,
"grad_norm": 0.48025400940036744,
"learning_rate": 3.907427570502616e-05,
"loss": 0.2019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2418954074382782,
"step": 865,
"valid_targets_mean": 3894.8,
"valid_targets_min": 502
},
{
"epoch": 1.3221884498480243,
"grad_norm": 0.4849042187708983,
"learning_rate": 3.90513468367363e-05,
"loss": 0.2157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2329632043838501,
"step": 870,
"valid_targets_mean": 4571.7,
"valid_targets_min": 1992
},
{
"epoch": 1.3297872340425532,
"grad_norm": 0.5027508815921192,
"learning_rate": 3.9028144368600746e-05,
"loss": 0.2072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19249165058135986,
"step": 875,
"valid_targets_mean": 4092.1,
"valid_targets_min": 490
},
{
"epoch": 1.337386018237082,
"grad_norm": 0.43340094826535847,
"learning_rate": 3.900466863383434e-05,
"loss": 0.2074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16721683740615845,
"step": 880,
"valid_targets_mean": 4360.1,
"valid_targets_min": 678
},
{
"epoch": 1.344984802431611,
"grad_norm": 0.42492899268845147,
"learning_rate": 3.898091996957638e-05,
"loss": 0.2218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18311715126037598,
"step": 885,
"valid_targets_mean": 5269.4,
"valid_targets_min": 2234
},
{
"epoch": 1.3525835866261398,
"grad_norm": 0.45185682893053764,
"learning_rate": 3.895689871688571e-05,
"loss": 0.2277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2394876629114151,
"step": 890,
"valid_targets_mean": 5222.2,
"valid_targets_min": 779
},
{
"epoch": 1.3601823708206686,
"grad_norm": 0.4595708686629068,
"learning_rate": 3.893260522073591e-05,
"loss": 0.2037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19897980988025665,
"step": 895,
"valid_targets_mean": 4327.2,
"valid_targets_min": 1913
},
{
"epoch": 1.3677811550151975,
"grad_norm": 0.5538183693714539,
"learning_rate": 3.8908039830010296e-05,
"loss": 0.2085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21077513694763184,
"step": 900,
"valid_targets_mean": 4477.2,
"valid_targets_min": 1914
},
{
"epoch": 1.3753799392097266,
"grad_norm": 0.4826233268835563,
"learning_rate": 3.888320289749687e-05,
"loss": 0.2167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20590105652809143,
"step": 905,
"valid_targets_mean": 4855.0,
"valid_targets_min": 987
},
{
"epoch": 1.3829787234042552,
"grad_norm": 0.45816874548401804,
"learning_rate": 3.885809477988334e-05,
"loss": 0.2051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18594498932361603,
"step": 910,
"valid_targets_mean": 4613.8,
"valid_targets_min": 486
},
{
"epoch": 1.3905775075987843,
"grad_norm": 0.46458650367475696,
"learning_rate": 3.883271583775194e-05,
"loss": 0.2166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20757240056991577,
"step": 915,
"valid_targets_mean": 5135.2,
"valid_targets_min": 567
},
{
"epoch": 1.3981762917933132,
"grad_norm": 0.49573212835944025,
"learning_rate": 3.880706643557425e-05,
"loss": 0.2267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20922252535820007,
"step": 920,
"valid_targets_mean": 4993.9,
"valid_targets_min": 1608
},
{
"epoch": 1.405775075987842,
"grad_norm": 0.5065076653284654,
"learning_rate": 3.8781146941705975e-05,
"loss": 0.219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22266633808612823,
"step": 925,
"valid_targets_mean": 3984.9,
"valid_targets_min": 663
},
{
"epoch": 1.4133738601823709,
"grad_norm": 0.46389395621934165,
"learning_rate": 3.8754957728381676e-05,
"loss": 0.2122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1952955424785614,
"step": 930,
"valid_targets_mean": 4305.5,
"valid_targets_min": 659
},
{
"epoch": 1.4209726443768997,
"grad_norm": 0.4244364300260148,
"learning_rate": 3.87284991717094e-05,
"loss": 0.2062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19909913837909698,
"step": 935,
"valid_targets_mean": 5106.8,
"valid_targets_min": 692
},
{
"epoch": 1.4285714285714286,
"grad_norm": 0.48753574099908936,
"learning_rate": 3.870177165166526e-05,
"loss": 0.2278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22329512238502502,
"step": 940,
"valid_targets_mean": 4227.9,
"valid_targets_min": 960
},
{
"epoch": 1.4361702127659575,
"grad_norm": 0.46921808961532296,
"learning_rate": 3.8674775552088034e-05,
"loss": 0.21,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1966555416584015,
"step": 945,
"valid_targets_mean": 4668.8,
"valid_targets_min": 1045
},
{
"epoch": 1.4437689969604863,
"grad_norm": 0.5011462054285303,
"learning_rate": 3.864751126067359e-05,
"loss": 0.2288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3067967891693115,
"step": 950,
"valid_targets_mean": 5225.8,
"valid_targets_min": 982
},
{
"epoch": 1.4513677811550152,
"grad_norm": 0.45640279658712546,
"learning_rate": 3.861997916896937e-05,
"loss": 0.2035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20878750085830688,
"step": 955,
"valid_targets_mean": 4429.0,
"valid_targets_min": 401
},
{
"epoch": 1.458966565349544,
"grad_norm": 0.4318101933694944,
"learning_rate": 3.859217967236872e-05,
"loss": 0.2142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21009142696857452,
"step": 960,
"valid_targets_mean": 5187.9,
"valid_targets_min": 1245
},
{
"epoch": 1.466565349544073,
"grad_norm": 0.4639537052196582,
"learning_rate": 3.856411317010525e-05,
"loss": 0.2253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20182490348815918,
"step": 965,
"valid_targets_mean": 4228.9,
"valid_targets_min": 1395
},
{
"epoch": 1.4741641337386018,
"grad_norm": 0.5830750830049942,
"learning_rate": 3.853578006524711e-05,
"loss": 0.2198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25057747960090637,
"step": 970,
"valid_targets_mean": 3692.9,
"valid_targets_min": 853
},
{
"epoch": 1.4817629179331306,
"grad_norm": 0.6135846306078634,
"learning_rate": 3.8507180764691134e-05,
"loss": 0.231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26475679874420166,
"step": 975,
"valid_targets_mean": 5166.6,
"valid_targets_min": 2214
},
{
"epoch": 1.4893617021276595,
"grad_norm": 0.42930269291397805,
"learning_rate": 3.847831567915706e-05,
"loss": 0.23,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22688277065753937,
"step": 980,
"valid_targets_mean": 5970.2,
"valid_targets_min": 1687
},
{
"epoch": 1.4969604863221884,
"grad_norm": 0.44889401709296317,
"learning_rate": 3.844918522318164e-05,
"loss": 0.2144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2054261565208435,
"step": 985,
"valid_targets_mean": 4887.9,
"valid_targets_min": 1082
},
{
"epoch": 1.5045592705167175,
"grad_norm": 0.4849219730059719,
"learning_rate": 3.84197898151126e-05,
"loss": 0.22,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2193393111228943,
"step": 990,
"valid_targets_mean": 5518.3,
"valid_targets_min": 348
},
{
"epoch": 1.512158054711246,
"grad_norm": 0.47364060795273005,
"learning_rate": 3.839012987710275e-05,
"loss": 0.208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2376159131526947,
"step": 995,
"valid_targets_mean": 4844.3,
"valid_targets_min": 873
},
{
"epoch": 1.5197568389057752,
"grad_norm": 0.477005009585305,
"learning_rate": 3.836020583510382e-05,
"loss": 0.2223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23394693434238434,
"step": 1000,
"valid_targets_mean": 4632.9,
"valid_targets_min": 763
},
{
"epoch": 1.5273556231003038,
"grad_norm": 0.43901547735782315,
"learning_rate": 3.833001811886041e-05,
"loss": 0.2131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2290436327457428,
"step": 1005,
"valid_targets_mean": 4733.1,
"valid_targets_min": 729
},
{
"epoch": 1.534954407294833,
"grad_norm": 0.4128584010075957,
"learning_rate": 3.8299567161903787e-05,
"loss": 0.2134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18785551190376282,
"step": 1010,
"valid_targets_mean": 5352.2,
"valid_targets_min": 2335
},
{
"epoch": 1.5425531914893615,
"grad_norm": 0.5109402768329384,
"learning_rate": 3.826885340154566e-05,
"loss": 0.2272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25076034665107727,
"step": 1015,
"valid_targets_mean": 4775.5,
"valid_targets_min": 891
},
{
"epoch": 1.5501519756838906,
"grad_norm": 0.4615963241009783,
"learning_rate": 3.8237877278871916e-05,
"loss": 0.2257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22021520137786865,
"step": 1020,
"valid_targets_mean": 4804.6,
"valid_targets_min": 1759
},
{
"epoch": 1.5577507598784195,
"grad_norm": 0.41168421067320043,
"learning_rate": 3.820663923873626e-05,
"loss": 0.2219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22017160058021545,
"step": 1025,
"valid_targets_mean": 5034.6,
"valid_targets_min": 689
},
{
"epoch": 1.5653495440729484,
"grad_norm": 0.5570301288304671,
"learning_rate": 3.817513972975385e-05,
"loss": 0.2154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21190384030342102,
"step": 1030,
"valid_targets_mean": 3886.7,
"valid_targets_min": 816
},
{
"epoch": 1.5729483282674772,
"grad_norm": 0.48710822220429656,
"learning_rate": 3.814337920429485e-05,
"loss": 0.2128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21960590779781342,
"step": 1035,
"valid_targets_mean": 4042.9,
"valid_targets_min": 546
},
{
"epoch": 1.580547112462006,
"grad_norm": 0.4956003916710543,
"learning_rate": 3.811135811847792e-05,
"loss": 0.2138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2413313090801239,
"step": 1040,
"valid_targets_mean": 4299.2,
"valid_targets_min": 605
},
{
"epoch": 1.588145896656535,
"grad_norm": 0.5142660653107718,
"learning_rate": 3.807907693216368e-05,
"loss": 0.2109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23288393020629883,
"step": 1045,
"valid_targets_mean": 4768.5,
"valid_targets_min": 811
},
{
"epoch": 1.5957446808510638,
"grad_norm": 0.5129928776520155,
"learning_rate": 3.804653610894811e-05,
"loss": 0.2157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20630177855491638,
"step": 1050,
"valid_targets_mean": 3965.7,
"valid_targets_min": 1768
},
{
"epoch": 1.6033434650455927,
"grad_norm": 0.4428766734377924,
"learning_rate": 3.801373611615585e-05,
"loss": 0.218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2139415144920349,
"step": 1055,
"valid_targets_mean": 4501.2,
"valid_targets_min": 528
},
{
"epoch": 1.6109422492401215,
"grad_norm": 0.3976871596351703,
"learning_rate": 3.798067742483355e-05,
"loss": 0.2055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1983199268579483,
"step": 1060,
"valid_targets_mean": 4932.3,
"valid_targets_min": 593
},
{
"epoch": 1.6185410334346506,
"grad_norm": 0.43538181451443764,
"learning_rate": 3.794736050974308e-05,
"loss": 0.2291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21794393658638,
"step": 1065,
"valid_targets_mean": 5077.6,
"valid_targets_min": 828
},
{
"epoch": 1.6261398176291793,
"grad_norm": 0.41261656921486206,
"learning_rate": 3.7913785849354693e-05,
"loss": 0.2125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18821759521961212,
"step": 1070,
"valid_targets_mean": 4659.0,
"valid_targets_min": 776
},
{
"epoch": 1.6337386018237083,
"grad_norm": 0.4607656496157841,
"learning_rate": 3.787995392584017e-05,
"loss": 0.2155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23070788383483887,
"step": 1075,
"valid_targets_mean": 5037.2,
"valid_targets_min": 767
},
{
"epoch": 1.641337386018237,
"grad_norm": 0.521744416704874,
"learning_rate": 3.784586522506589e-05,
"loss": 0.2356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23326215147972107,
"step": 1080,
"valid_targets_mean": 4300.6,
"valid_targets_min": 752
},
{
"epoch": 1.648936170212766,
"grad_norm": 0.5411151907665869,
"learning_rate": 3.781152023658588e-05,
"loss": 0.2076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19801482558250427,
"step": 1085,
"valid_targets_mean": 4037.4,
"valid_targets_min": 565
},
{
"epoch": 1.6565349544072947,
"grad_norm": 0.4881180236795167,
"learning_rate": 3.7776919453634735e-05,
"loss": 0.2217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20285995304584503,
"step": 1090,
"valid_targets_mean": 4716.8,
"valid_targets_min": 1812
},
{
"epoch": 1.6641337386018238,
"grad_norm": 0.3892565204932596,
"learning_rate": 3.774206337312058e-05,
"loss": 0.2146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19384154677391052,
"step": 1095,
"valid_targets_mean": 5548.1,
"valid_targets_min": 1723
},
{
"epoch": 1.6717325227963524,
"grad_norm": 0.6079201585046432,
"learning_rate": 3.7706952495617895e-05,
"loss": 0.2228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2272331863641739,
"step": 1100,
"valid_targets_mean": 4440.2,
"valid_targets_min": 754
},
{
"epoch": 1.6793313069908815,
"grad_norm": 0.4392880697961998,
"learning_rate": 3.767158732536037e-05,
"loss": 0.2057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20622758567333221,
"step": 1105,
"valid_targets_mean": 5115.8,
"valid_targets_min": 2178
},
{
"epoch": 1.6869300911854104,
"grad_norm": 0.4760913157214835,
"learning_rate": 3.7635968370233625e-05,
"loss": 0.1947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22895006835460663,
"step": 1110,
"valid_targets_mean": 4197.4,
"valid_targets_min": 664
},
{
"epoch": 1.6945288753799392,
"grad_norm": 0.42921725245111436,
"learning_rate": 3.760009614176792e-05,
"loss": 0.2092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20630860328674316,
"step": 1115,
"valid_targets_mean": 5539.1,
"valid_targets_min": 1629
},
{
"epoch": 1.702127659574468,
"grad_norm": 0.47421657315391796,
"learning_rate": 3.7563971155130834e-05,
"loss": 0.2088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19295352697372437,
"step": 1120,
"valid_targets_mean": 4742.3,
"valid_targets_min": 900
},
{
"epoch": 1.709726443768997,
"grad_norm": 0.44277966038489874,
"learning_rate": 3.752759392911986e-05,
"loss": 0.2121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21693378686904907,
"step": 1125,
"valid_targets_mean": 5488.9,
"valid_targets_min": 2673
},
{
"epoch": 1.7173252279635258,
"grad_norm": 0.35764926472016434,
"learning_rate": 3.7490964986154936e-05,
"loss": 0.2056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1632017195224762,
"step": 1130,
"valid_targets_mean": 5798.2,
"valid_targets_min": 2382
},
{
"epoch": 1.7249240121580547,
"grad_norm": 0.46310293456133733,
"learning_rate": 3.745408485227094e-05,
"loss": 0.2166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2125653326511383,
"step": 1135,
"valid_targets_mean": 4493.4,
"valid_targets_min": 703
},
{
"epoch": 1.7325227963525835,
"grad_norm": 0.48402636671915206,
"learning_rate": 3.7416954057110165e-05,
"loss": 0.2155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2212226539850235,
"step": 1140,
"valid_targets_mean": 4891.2,
"valid_targets_min": 422
},
{
"epoch": 1.7401215805471124,
"grad_norm": 0.48544415851378125,
"learning_rate": 3.7379573133914686e-05,
"loss": 0.2204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24577516317367554,
"step": 1145,
"valid_targets_mean": 4704.4,
"valid_targets_min": 683
},
{
"epoch": 1.7477203647416415,
"grad_norm": 0.4686217061157862,
"learning_rate": 3.7341942619518736e-05,
"loss": 0.2134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20010778307914734,
"step": 1150,
"valid_targets_mean": 4060.2,
"valid_targets_min": 740
},
{
"epoch": 1.7553191489361701,
"grad_norm": 0.456474362675113,
"learning_rate": 3.730406305434093e-05,
"loss": 0.2183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21529576182365417,
"step": 1155,
"valid_targets_mean": 4461.8,
"valid_targets_min": 407
},
{
"epoch": 1.7629179331306992,
"grad_norm": 0.39386216864446827,
"learning_rate": 3.726593498237659e-05,
"loss": 0.2173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20742088556289673,
"step": 1160,
"valid_targets_mean": 5696.4,
"valid_targets_min": 832
},
{
"epoch": 1.7705167173252279,
"grad_norm": 0.4954398039746765,
"learning_rate": 3.7227558951189866e-05,
"loss": 0.221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2127082198858261,
"step": 1165,
"valid_targets_mean": 4003.1,
"valid_targets_min": 1097
},
{
"epoch": 1.778115501519757,
"grad_norm": 0.47012021916770536,
"learning_rate": 3.7188935511905895e-05,
"loss": 0.2208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2261389195919037,
"step": 1170,
"valid_targets_mean": 5014.4,
"valid_targets_min": 1036
},
{
"epoch": 1.7857142857142856,
"grad_norm": 0.4746767287862107,
"learning_rate": 3.715006521920289e-05,
"loss": 0.2202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19433888792991638,
"step": 1175,
"valid_targets_mean": 4523.8,
"valid_targets_min": 625
},
{
"epoch": 1.7933130699088147,
"grad_norm": 0.4791758218613005,
"learning_rate": 3.711094863130417e-05,
"loss": 0.2161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22052708268165588,
"step": 1180,
"valid_targets_mean": 5126.8,
"valid_targets_min": 1164
},
{
"epoch": 1.8009118541033433,
"grad_norm": 0.43857817303439106,
"learning_rate": 3.707158630997015e-05,
"loss": 0.2186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21629557013511658,
"step": 1185,
"valid_targets_mean": 5371.6,
"valid_targets_min": 728
},
{
"epoch": 1.8085106382978724,
"grad_norm": 0.5348041335538533,
"learning_rate": 3.703197882049026e-05,
"loss": 0.21,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2324264943599701,
"step": 1190,
"valid_targets_mean": 3775.2,
"valid_targets_min": 637
},
{
"epoch": 1.8161094224924013,
"grad_norm": 0.3889586019552747,
"learning_rate": 3.699212673167484e-05,
"loss": 0.2116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2274361550807953,
"step": 1195,
"valid_targets_mean": 6306.4,
"valid_targets_min": 622
},
{
"epoch": 1.8237082066869301,
"grad_norm": 0.46857624747519244,
"learning_rate": 3.695203061584695e-05,
"loss": 0.2068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23175036907196045,
"step": 1200,
"valid_targets_mean": 4628.2,
"valid_targets_min": 429
},
{
"epoch": 1.831306990881459,
"grad_norm": 0.4885718145421046,
"learning_rate": 3.69116910488342e-05,
"loss": 0.2214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22779184579849243,
"step": 1205,
"valid_targets_mean": 4191.6,
"valid_targets_min": 156
},
{
"epoch": 1.8389057750759878,
"grad_norm": 0.4639904198544056,
"learning_rate": 3.687110860996041e-05,
"loss": 0.2239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2027101218700409,
"step": 1210,
"valid_targets_mean": 4831.6,
"valid_targets_min": 699
},
{
"epoch": 1.8465045592705167,
"grad_norm": 0.46833719588845396,
"learning_rate": 3.6830283882037335e-05,
"loss": 0.2165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20325730741024017,
"step": 1215,
"valid_targets_mean": 5097.8,
"valid_targets_min": 465
},
{
"epoch": 1.8541033434650456,
"grad_norm": 0.41463391792421084,
"learning_rate": 3.678921745135631e-05,
"loss": 0.2038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20085079967975616,
"step": 1220,
"valid_targets_mean": 5023.6,
"valid_targets_min": 633
},
{
"epoch": 1.8617021276595744,
"grad_norm": 0.44749514129370893,
"learning_rate": 3.674790990767979e-05,
"loss": 0.2289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20688676834106445,
"step": 1225,
"valid_targets_mean": 4845.9,
"valid_targets_min": 667
},
{
"epoch": 1.8693009118541033,
"grad_norm": 0.4502221753599573,
"learning_rate": 3.670636184423288e-05,
"loss": 0.2103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19071269035339355,
"step": 1230,
"valid_targets_mean": 4245.0,
"valid_targets_min": 500
},
{
"epoch": 1.8768996960486324,
"grad_norm": 0.5334681412726286,
"learning_rate": 3.666457385769487e-05,
"loss": 0.2042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2248763144016266,
"step": 1235,
"valid_targets_mean": 4481.5,
"valid_targets_min": 770
},
{
"epoch": 1.884498480243161,
"grad_norm": 0.4644916347166466,
"learning_rate": 3.66225465481906e-05,
"loss": 0.2091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2305462807416916,
"step": 1240,
"valid_targets_mean": 4303.9,
"valid_targets_min": 630
},
{
"epoch": 1.89209726443769,
"grad_norm": 0.4267832479199372,
"learning_rate": 3.658028051928189e-05,
"loss": 0.2092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18598158657550812,
"step": 1245,
"valid_targets_mean": 4759.4,
"valid_targets_min": 965
},
{
"epoch": 1.8996960486322187,
"grad_norm": 0.46975601834979414,
"learning_rate": 3.6537776377958836e-05,
"loss": 0.2302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2438843995332718,
"step": 1250,
"valid_targets_mean": 4358.6,
"valid_targets_min": 545
},
{
"epoch": 1.9072948328267478,
"grad_norm": 0.41467959071923455,
"learning_rate": 3.649503473463112e-05,
"loss": 0.1974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18656185269355774,
"step": 1255,
"valid_targets_mean": 4789.7,
"valid_targets_min": 622
},
{
"epoch": 1.9148936170212765,
"grad_norm": 0.48720410950048604,
"learning_rate": 3.645205620311923e-05,
"loss": 0.1892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2179066389799118,
"step": 1260,
"valid_targets_mean": 4316.3,
"valid_targets_min": 718
},
{
"epoch": 1.9224924012158056,
"grad_norm": 0.47737074347118913,
"learning_rate": 3.6408841400645644e-05,
"loss": 0.2311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20159170031547546,
"step": 1265,
"valid_targets_mean": 4676.4,
"valid_targets_min": 920
},
{
"epoch": 1.9300911854103342,
"grad_norm": 0.38561599683027503,
"learning_rate": 3.636539094782598e-05,
"loss": 0.2151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18330830335617065,
"step": 1270,
"valid_targets_mean": 4813.8,
"valid_targets_min": 811
},
{
"epoch": 1.9376899696048633,
"grad_norm": 0.4850605122437156,
"learning_rate": 3.632170546866007e-05,
"loss": 0.2168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22532254457473755,
"step": 1275,
"valid_targets_mean": 3973.6,
"valid_targets_min": 335
},
{
"epoch": 1.9452887537993921,
"grad_norm": 0.43992666790664475,
"learning_rate": 3.6277785590523e-05,
"loss": 0.2201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24039697647094727,
"step": 1280,
"valid_targets_mean": 5707.9,
"valid_targets_min": 511
},
{
"epoch": 1.952887537993921,
"grad_norm": 3.9664174496666083,
"learning_rate": 3.623363194415609e-05,
"loss": 0.214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21847763657569885,
"step": 1285,
"valid_targets_mean": 4531.5,
"valid_targets_min": 991
},
{
"epoch": 1.9604863221884499,
"grad_norm": 0.4595577415716105,
"learning_rate": 3.618924516365788e-05,
"loss": 0.2042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20071235299110413,
"step": 1290,
"valid_targets_mean": 4902.6,
"valid_targets_min": 777
},
{
"epoch": 1.9680851063829787,
"grad_norm": 0.44567806699122325,
"learning_rate": 3.614462588647495e-05,
"loss": 0.2243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24957430362701416,
"step": 1295,
"valid_targets_mean": 4669.9,
"valid_targets_min": 1479
},
{
"epoch": 1.9756838905775076,
"grad_norm": 0.42210130028239157,
"learning_rate": 3.609977475339284e-05,
"loss": 0.2064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2057563215494156,
"step": 1300,
"valid_targets_mean": 5229.6,
"valid_targets_min": 969
},
{
"epoch": 1.9832826747720365,
"grad_norm": 0.48785866462041777,
"learning_rate": 3.6054692408526806e-05,
"loss": 0.1967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2031518667936325,
"step": 1305,
"valid_targets_mean": 3585.4,
"valid_targets_min": 843
},
{
"epoch": 1.9908814589665653,
"grad_norm": 0.4191280920943274,
"learning_rate": 3.6009379499312563e-05,
"loss": 0.2142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21392418444156647,
"step": 1310,
"valid_targets_mean": 5448.1,
"valid_targets_min": 2162
},
{
"epoch": 1.9984802431610942,
"grad_norm": 0.571865229628622,
"learning_rate": 3.5963836676497034e-05,
"loss": 0.2043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21553698182106018,
"step": 1315,
"valid_targets_mean": 3434.1,
"valid_targets_min": 460
},
{
"epoch": 2.0060790273556233,
"grad_norm": 0.4580819817800281,
"learning_rate": 3.5918064594128946e-05,
"loss": 0.1941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18602877855300903,
"step": 1320,
"valid_targets_mean": 4337.8,
"valid_targets_min": 527
},
{
"epoch": 2.013677811550152,
"grad_norm": 0.4308848554547568,
"learning_rate": 3.5872063909549465e-05,
"loss": 0.2003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1809544563293457,
"step": 1325,
"valid_targets_mean": 4842.1,
"valid_targets_min": 305
},
{
"epoch": 2.021276595744681,
"grad_norm": 0.4304570423447681,
"learning_rate": 3.5825835283382754e-05,
"loss": 0.1893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17694029211997986,
"step": 1330,
"valid_targets_mean": 5139.7,
"valid_targets_min": 1709
},
{
"epoch": 2.0288753799392096,
"grad_norm": 0.4201481077802898,
"learning_rate": 3.5779379379526516e-05,
"loss": 0.1944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17606091499328613,
"step": 1335,
"valid_targets_mean": 5894.2,
"valid_targets_min": 348
},
{
"epoch": 2.0364741641337387,
"grad_norm": 0.43796821938518954,
"learning_rate": 3.57326968651424e-05,
"loss": 0.1873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19579800963401794,
"step": 1340,
"valid_targets_mean": 4780.1,
"valid_targets_min": 1077
},
{
"epoch": 2.0440729483282674,
"grad_norm": 0.431578307043594,
"learning_rate": 3.5685788410646455e-05,
"loss": 0.1859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17831829190254211,
"step": 1345,
"valid_targets_mean": 4907.6,
"valid_targets_min": 590
},
{
"epoch": 2.0516717325227964,
"grad_norm": 0.4188648321222995,
"learning_rate": 3.5638654689699493e-05,
"loss": 0.1895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15893448889255524,
"step": 1350,
"valid_targets_mean": 5083.1,
"valid_targets_min": 1164
},
{
"epoch": 2.059270516717325,
"grad_norm": 0.4452501919855169,
"learning_rate": 3.559129637919744e-05,
"loss": 0.194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19416233897209167,
"step": 1355,
"valid_targets_mean": 4871.6,
"valid_targets_min": 1124
},
{
"epoch": 2.066869300911854,
"grad_norm": 0.5486933381235863,
"learning_rate": 3.5543714159261576e-05,
"loss": 0.1991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21765755116939545,
"step": 1360,
"valid_targets_mean": 4549.6,
"valid_targets_min": 756
},
{
"epoch": 2.074468085106383,
"grad_norm": 0.46291383560602983,
"learning_rate": 3.5495908713228774e-05,
"loss": 0.1955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22245173156261444,
"step": 1365,
"valid_targets_mean": 4870.3,
"valid_targets_min": 829
},
{
"epoch": 2.082066869300912,
"grad_norm": 0.43346588262932606,
"learning_rate": 3.544788072764173e-05,
"loss": 0.1822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16855968534946442,
"step": 1370,
"valid_targets_mean": 5086.5,
"valid_targets_min": 1568
},
{
"epoch": 2.0896656534954405,
"grad_norm": 0.46753186284834775,
"learning_rate": 3.5399630892239036e-05,
"loss": 0.1951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17375516891479492,
"step": 1375,
"valid_targets_mean": 4855.5,
"valid_targets_min": 1441
},
{
"epoch": 2.0972644376899696,
"grad_norm": 0.5417497219166529,
"learning_rate": 3.535115989994533e-05,
"loss": 0.2062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22097179293632507,
"step": 1380,
"valid_targets_mean": 4113.6,
"valid_targets_min": 608
},
{
"epoch": 2.1048632218844983,
"grad_norm": 0.5031450181476247,
"learning_rate": 3.530246844686133e-05,
"loss": 0.1948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20294921100139618,
"step": 1385,
"valid_targets_mean": 4546.1,
"valid_targets_min": 610
},
{
"epoch": 2.1124620060790273,
"grad_norm": 0.4352408641314383,
"learning_rate": 3.5253557232253805e-05,
"loss": 0.2062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18328158557415009,
"step": 1390,
"valid_targets_mean": 4523.4,
"valid_targets_min": 317
},
{
"epoch": 2.1200607902735564,
"grad_norm": 0.4965079663934899,
"learning_rate": 3.520442695854558e-05,
"loss": 0.1903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19759127497673035,
"step": 1395,
"valid_targets_mean": 4122.6,
"valid_targets_min": 651
},
{
"epoch": 2.127659574468085,
"grad_norm": 0.4372048480171316,
"learning_rate": 3.515507833130543e-05,
"loss": 0.2099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.260989785194397,
"step": 1400,
"valid_targets_mean": 5767.1,
"valid_targets_min": 647
},
{
"epoch": 2.135258358662614,
"grad_norm": 0.4432824108788825,
"learning_rate": 3.510551205923793e-05,
"loss": 0.2024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1798432469367981,
"step": 1405,
"valid_targets_mean": 4649.9,
"valid_targets_min": 887
},
{
"epoch": 2.142857142857143,
"grad_norm": 0.47056895174749847,
"learning_rate": 3.50557288541733e-05,
"loss": 0.2022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28239643573760986,
"step": 1410,
"valid_targets_mean": 5144.9,
"valid_targets_min": 668
},
{
"epoch": 2.150455927051672,
"grad_norm": 0.48033852287738354,
"learning_rate": 3.5005729431057176e-05,
"loss": 0.1882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18898963928222656,
"step": 1415,
"valid_targets_mean": 4188.7,
"valid_targets_min": 642
},
{
"epoch": 2.1580547112462005,
"grad_norm": 0.44907430023415723,
"learning_rate": 3.4955514507940335e-05,
"loss": 0.1932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21947622299194336,
"step": 1420,
"valid_targets_mean": 4689.1,
"valid_targets_min": 811
},
{
"epoch": 2.1656534954407296,
"grad_norm": 0.48987352731998796,
"learning_rate": 3.490508480596839e-05,
"loss": 0.2001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23712974786758423,
"step": 1425,
"valid_targets_mean": 4526.9,
"valid_targets_min": 1906
},
{
"epoch": 2.1732522796352582,
"grad_norm": 0.4635255839622089,
"learning_rate": 3.485444104937144e-05,
"loss": 0.188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19113010168075562,
"step": 1430,
"valid_targets_mean": 5611.0,
"valid_targets_min": 506
},
{
"epoch": 2.1808510638297873,
"grad_norm": 0.5259676202088338,
"learning_rate": 3.4803583965453635e-05,
"loss": 0.1946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1842001974582672,
"step": 1435,
"valid_targets_mean": 5102.6,
"valid_targets_min": 2495
},
{
"epoch": 2.188449848024316,
"grad_norm": 0.44606267698952673,
"learning_rate": 3.475251428458281e-05,
"loss": 0.1778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16230902075767517,
"step": 1440,
"valid_targets_mean": 4659.9,
"valid_targets_min": 559
},
{
"epoch": 2.196048632218845,
"grad_norm": 0.4688428145128331,
"learning_rate": 3.4701232740179876e-05,
"loss": 0.19,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20408767461776733,
"step": 1445,
"valid_targets_mean": 4121.8,
"valid_targets_min": 589
},
{
"epoch": 2.2036474164133737,
"grad_norm": 0.5991278401653526,
"learning_rate": 3.464974006870841e-05,
"loss": 0.1828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1730174869298935,
"step": 1450,
"valid_targets_mean": 4380.2,
"valid_targets_min": 872
},
{
"epoch": 2.211246200607903,
"grad_norm": 0.5317059372292597,
"learning_rate": 3.4598037009664e-05,
"loss": 0.188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21209636330604553,
"step": 1455,
"valid_targets_mean": 4217.3,
"valid_targets_min": 576
},
{
"epoch": 2.2188449848024314,
"grad_norm": 0.430168348759962,
"learning_rate": 3.454612430556365e-05,
"loss": 0.1926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1825931817293167,
"step": 1460,
"valid_targets_mean": 5261.9,
"valid_targets_min": 605
},
{
"epoch": 2.2264437689969605,
"grad_norm": 0.3749747542503873,
"learning_rate": 3.44940027019351e-05,
"loss": 0.1878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17250074446201324,
"step": 1465,
"valid_targets_mean": 5484.4,
"valid_targets_min": 702
},
{
"epoch": 2.2340425531914896,
"grad_norm": 0.4590123136778495,
"learning_rate": 3.444167294730617e-05,
"loss": 0.205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21813246607780457,
"step": 1470,
"valid_targets_mean": 5121.4,
"valid_targets_min": 306
},
{
"epoch": 2.2416413373860182,
"grad_norm": 0.49931169623759,
"learning_rate": 3.4389135793193935e-05,
"loss": 0.196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.218278706073761,
"step": 1475,
"valid_targets_mean": 3389.2,
"valid_targets_min": 545
},
{
"epoch": 2.2492401215805473,
"grad_norm": 0.44543315364919134,
"learning_rate": 3.4336391994094e-05,
"loss": 0.1931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18760555982589722,
"step": 1480,
"valid_targets_mean": 4307.0,
"valid_targets_min": 666
},
{
"epoch": 2.256838905775076,
"grad_norm": 0.4886663621134491,
"learning_rate": 3.4283442307469625e-05,
"loss": 0.1915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2062349021434784,
"step": 1485,
"valid_targets_mean": 4356.3,
"valid_targets_min": 766
},
{
"epoch": 2.264437689969605,
"grad_norm": 0.4376731027831436,
"learning_rate": 3.423028749374086e-05,
"loss": 0.1772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1697554588317871,
"step": 1490,
"valid_targets_mean": 4621.5,
"valid_targets_min": 626
},
{
"epoch": 2.2720364741641337,
"grad_norm": 0.44145953072536115,
"learning_rate": 3.417692831627361e-05,
"loss": 0.1953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17671933770179749,
"step": 1495,
"valid_targets_mean": 4243.6,
"valid_targets_min": 490
},
{
"epoch": 2.2796352583586628,
"grad_norm": 0.46231753746429277,
"learning_rate": 3.412336554136871e-05,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.217167928814888,
"step": 1500,
"valid_targets_mean": 4889.9,
"valid_targets_min": 940
},
{
"epoch": 2.2872340425531914,
"grad_norm": 0.41849411158618643,
"learning_rate": 3.406959993825088e-05,
"loss": 0.1879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1857946813106537,
"step": 1505,
"valid_targets_mean": 4538.6,
"valid_targets_min": 1136
},
{
"epoch": 2.2948328267477205,
"grad_norm": 0.42440454933579597,
"learning_rate": 3.4015632279057675e-05,
"loss": 0.1913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19058769941329956,
"step": 1510,
"valid_targets_mean": 5174.3,
"valid_targets_min": 2350
},
{
"epoch": 2.302431610942249,
"grad_norm": 0.4531043322688376,
"learning_rate": 3.396146333882846e-05,
"loss": 0.2017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.207040473818779,
"step": 1515,
"valid_targets_mean": 5085.9,
"valid_targets_min": 1122
},
{
"epoch": 2.310030395136778,
"grad_norm": 0.43663796857915893,
"learning_rate": 3.3907093895493186e-05,
"loss": 0.2011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19464045763015747,
"step": 1520,
"valid_targets_mean": 4950.9,
"valid_targets_min": 709
},
{
"epoch": 2.317629179331307,
"grad_norm": 0.42579767171142163,
"learning_rate": 3.385252472986129e-05,
"loss": 0.1882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17376163601875305,
"step": 1525,
"valid_targets_mean": 5796.6,
"valid_targets_min": 829
},
{
"epoch": 2.325227963525836,
"grad_norm": 0.4254323477143335,
"learning_rate": 3.379775662561045e-05,
"loss": 0.2029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20658773183822632,
"step": 1530,
"valid_targets_mean": 4603.7,
"valid_targets_min": 937
},
{
"epoch": 2.3328267477203646,
"grad_norm": 0.40841513731217177,
"learning_rate": 3.374279036927535e-05,
"loss": 0.1922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18336258828639984,
"step": 1535,
"valid_targets_mean": 4597.2,
"valid_targets_min": 376
},
{
"epoch": 2.3404255319148937,
"grad_norm": 0.40660499202393396,
"learning_rate": 3.368762675023635e-05,
"loss": 0.1931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17899194359779358,
"step": 1540,
"valid_targets_mean": 5368.1,
"valid_targets_min": 748
},
{
"epoch": 2.3480243161094223,
"grad_norm": 0.4869497094603196,
"learning_rate": 3.363226656070819e-05,
"loss": 0.1872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20963457226753235,
"step": 1545,
"valid_targets_mean": 4233.9,
"valid_targets_min": 799
},
{
"epoch": 2.3556231003039514,
"grad_norm": 0.42891641992075347,
"learning_rate": 3.3576710595728586e-05,
"loss": 0.2024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18602633476257324,
"step": 1550,
"valid_targets_mean": 4363.8,
"valid_targets_min": 156
},
{
"epoch": 2.36322188449848,
"grad_norm": 0.4784395146562949,
"learning_rate": 3.352095965314682e-05,
"loss": 0.1974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20554772019386292,
"step": 1555,
"valid_targets_mean": 4412.3,
"valid_targets_min": 732
},
{
"epoch": 2.370820668693009,
"grad_norm": 0.3940116430034305,
"learning_rate": 3.3465014533612295e-05,
"loss": 0.1797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16700813174247742,
"step": 1560,
"valid_targets_mean": 4859.4,
"valid_targets_min": 2115
},
{
"epoch": 2.378419452887538,
"grad_norm": 0.4053824724130465,
"learning_rate": 3.340887604056301e-05,
"loss": 0.1959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19125846028327942,
"step": 1565,
"valid_targets_mean": 5586.5,
"valid_targets_min": 855
},
{
"epoch": 2.386018237082067,
"grad_norm": 0.467001631524023,
"learning_rate": 3.335254498021404e-05,
"loss": 0.1987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21299326419830322,
"step": 1570,
"valid_targets_mean": 4965.8,
"valid_targets_min": 333
},
{
"epoch": 2.393617021276596,
"grad_norm": 0.46807262963090795,
"learning_rate": 3.329602216154594e-05,
"loss": 0.2011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21306315064430237,
"step": 1575,
"valid_targets_mean": 4142.6,
"valid_targets_min": 618
},
{
"epoch": 2.4012158054711246,
"grad_norm": 0.4351369955863477,
"learning_rate": 3.323930839629318e-05,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.192465141415596,
"step": 1580,
"valid_targets_mean": 4713.5,
"valid_targets_min": 805
},
{
"epoch": 2.4088145896656536,
"grad_norm": 0.4664276306785285,
"learning_rate": 3.318240449893242e-05,
"loss": 0.1994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20806226134300232,
"step": 1585,
"valid_targets_mean": 4086.8,
"valid_targets_min": 616
},
{
"epoch": 2.4164133738601823,
"grad_norm": 0.4691257656452498,
"learning_rate": 3.3125311286670836e-05,
"loss": 0.1982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23262707889080048,
"step": 1590,
"valid_targets_mean": 4931.9,
"valid_targets_min": 633
},
{
"epoch": 2.4240121580547114,
"grad_norm": 0.42906847559664973,
"learning_rate": 3.3068029579434404e-05,
"loss": 0.196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19915705919265747,
"step": 1595,
"valid_targets_mean": 4431.0,
"valid_targets_min": 397
},
{
"epoch": 2.43161094224924,
"grad_norm": 0.4018736513467274,
"learning_rate": 3.3010560199856105e-05,
"loss": 0.1935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16372954845428467,
"step": 1600,
"valid_targets_mean": 5064.1,
"valid_targets_min": 1229
},
{
"epoch": 2.439209726443769,
"grad_norm": 0.4520461458479404,
"learning_rate": 3.2952903973264115e-05,
"loss": 0.2062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19510574638843536,
"step": 1605,
"valid_targets_mean": 4399.9,
"valid_targets_min": 646
},
{
"epoch": 2.4468085106382977,
"grad_norm": 0.3918033831100767,
"learning_rate": 3.289506172766997e-05,
"loss": 0.1992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1935116946697235,
"step": 1610,
"valid_targets_mean": 5341.8,
"valid_targets_min": 801
},
{
"epoch": 2.454407294832827,
"grad_norm": 0.43294616241650447,
"learning_rate": 3.283703429375663e-05,
"loss": 0.1906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16868659853935242,
"step": 1615,
"valid_targets_mean": 4395.4,
"valid_targets_min": 518
},
{
"epoch": 2.4620060790273555,
"grad_norm": 0.5245421221092823,
"learning_rate": 3.2778822504866594e-05,
"loss": 0.1863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2138800024986267,
"step": 1620,
"valid_targets_mean": 3523.9,
"valid_targets_min": 736
},
{
"epoch": 2.4696048632218845,
"grad_norm": 0.44947552448463496,
"learning_rate": 3.272042719698992e-05,
"loss": 0.1986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2089487910270691,
"step": 1625,
"valid_targets_mean": 4868.6,
"valid_targets_min": 708
},
{
"epoch": 2.477203647416413,
"grad_norm": 0.5745948604608038,
"learning_rate": 3.2661849208752205e-05,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15748457610607147,
"step": 1630,
"valid_targets_mean": 5253.4,
"valid_targets_min": 1100
},
{
"epoch": 2.4848024316109423,
"grad_norm": 0.466310291931274,
"learning_rate": 3.2603089381402574e-05,
"loss": 0.2008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18000131845474243,
"step": 1635,
"valid_targets_mean": 4540.9,
"valid_targets_min": 594
},
{
"epoch": 2.4924012158054714,
"grad_norm": 0.4887847049484213,
"learning_rate": 3.254414855880155e-05,
"loss": 0.1979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19799655675888062,
"step": 1640,
"valid_targets_mean": 3895.6,
"valid_targets_min": 632
},
{
"epoch": 2.5,
"grad_norm": 0.44432072579472404,
"learning_rate": 3.2485027587408965e-05,
"loss": 0.1925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18566831946372986,
"step": 1645,
"valid_targets_mean": 4716.8,
"valid_targets_min": 785
},
{
"epoch": 2.5075987841945286,
"grad_norm": 0.7254579276839739,
"learning_rate": 3.2425727316271814e-05,
"loss": 0.2156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2835049033164978,
"step": 1650,
"valid_targets_mean": 4848.5,
"valid_targets_min": 1102
},
{
"epoch": 2.5151975683890577,
"grad_norm": 0.45281348742054633,
"learning_rate": 3.2366248597012037e-05,
"loss": 0.1921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21764954924583435,
"step": 1655,
"valid_targets_mean": 4480.8,
"valid_targets_min": 808
},
{
"epoch": 2.522796352583587,
"grad_norm": 0.45329008128640347,
"learning_rate": 3.230659228381432e-05,
"loss": 0.1872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19859766960144043,
"step": 1660,
"valid_targets_mean": 4694.1,
"valid_targets_min": 710
},
{
"epoch": 2.5303951367781155,
"grad_norm": 0.3991066726887112,
"learning_rate": 3.2246759233413765e-05,
"loss": 0.2077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18775928020477295,
"step": 1665,
"valid_targets_mean": 5537.6,
"valid_targets_min": 2270
},
{
"epoch": 2.5379939209726445,
"grad_norm": 0.45660075830572106,
"learning_rate": 3.218675030508367e-05,
"loss": 0.1992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21159949898719788,
"step": 1670,
"valid_targets_mean": 4234.2,
"valid_targets_min": 465
},
{
"epoch": 2.545592705167173,
"grad_norm": 0.47845524476355505,
"learning_rate": 3.212656636062314e-05,
"loss": 0.2034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18367314338684082,
"step": 1675,
"valid_targets_mean": 3884.0,
"valid_targets_min": 609
},
{
"epoch": 2.5531914893617023,
"grad_norm": 0.47337775511493685,
"learning_rate": 3.2066208264344695e-05,
"loss": 0.1954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19395776093006134,
"step": 1680,
"valid_targets_mean": 4240.3,
"valid_targets_min": 1731
},
{
"epoch": 2.560790273556231,
"grad_norm": 0.49086260546972615,
"learning_rate": 3.200567688306192e-05,
"loss": 0.2118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2288236916065216,
"step": 1685,
"valid_targets_mean": 3920.8,
"valid_targets_min": 658
},
{
"epoch": 2.56838905775076,
"grad_norm": 0.48820274570312466,
"learning_rate": 3.194497308607694e-05,
"loss": 0.2084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2082967460155487,
"step": 1690,
"valid_targets_mean": 4256.8,
"valid_targets_min": 440
},
{
"epoch": 2.5759878419452886,
"grad_norm": 0.43205681075466934,
"learning_rate": 3.1884097745167986e-05,
"loss": 0.1852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1597200632095337,
"step": 1695,
"valid_targets_mean": 4130.8,
"valid_targets_min": 878
},
{
"epoch": 2.5835866261398177,
"grad_norm": 0.5054254906668799,
"learning_rate": 3.182305173457688e-05,
"loss": 0.2034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2262079417705536,
"step": 1700,
"valid_targets_mean": 4460.6,
"valid_targets_min": 401
},
{
"epoch": 2.5911854103343464,
"grad_norm": 0.504689704310772,
"learning_rate": 3.1761835930996424e-05,
"loss": 0.1949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1995968520641327,
"step": 1705,
"valid_targets_mean": 3648.3,
"valid_targets_min": 558
},
{
"epoch": 2.5987841945288754,
"grad_norm": 0.4392316385094666,
"learning_rate": 3.1700451213557896e-05,
"loss": 0.2026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20353609323501587,
"step": 1710,
"valid_targets_mean": 4641.1,
"valid_targets_min": 845
},
{
"epoch": 2.6063829787234045,
"grad_norm": 0.44339996982872454,
"learning_rate": 3.1638898463818336e-05,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15977585315704346,
"step": 1715,
"valid_targets_mean": 4352.1,
"valid_targets_min": 827
},
{
"epoch": 2.613981762917933,
"grad_norm": 0.5398477413573792,
"learning_rate": 3.157717856574794e-05,
"loss": 0.1842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18378981947898865,
"step": 1720,
"valid_targets_mean": 4131.6,
"valid_targets_min": 331
},
{
"epoch": 2.621580547112462,
"grad_norm": 0.39672349034501203,
"learning_rate": 3.151529240571737e-05,
"loss": 0.2048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19032993912696838,
"step": 1725,
"valid_targets_mean": 5932.7,
"valid_targets_min": 2148
},
{
"epoch": 2.629179331306991,
"grad_norm": 0.4826721393487148,
"learning_rate": 3.1453240872484974e-05,
"loss": 0.2209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21052716672420502,
"step": 1730,
"valid_targets_mean": 4064.6,
"valid_targets_min": 713
},
{
"epoch": 2.63677811550152,
"grad_norm": 0.40797959815259904,
"learning_rate": 3.139102485718407e-05,
"loss": 0.1932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18385851383209229,
"step": 1735,
"valid_targets_mean": 5094.5,
"valid_targets_min": 774
},
{
"epoch": 2.6443768996960486,
"grad_norm": 0.49388764627269777,
"learning_rate": 3.1328645253310136e-05,
"loss": 0.1837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20751240849494934,
"step": 1740,
"valid_targets_mean": 4489.2,
"valid_targets_min": 668
},
{
"epoch": 2.6519756838905773,
"grad_norm": 0.41221441649011,
"learning_rate": 3.126610295670798e-05,
"loss": 0.1966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18350102007389069,
"step": 1745,
"valid_targets_mean": 5068.5,
"valid_targets_min": 1047
},
{
"epoch": 2.6595744680851063,
"grad_norm": 0.43487564674132706,
"learning_rate": 3.120339886555885e-05,
"loss": 0.2039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1929788887500763,
"step": 1750,
"valid_targets_mean": 4648.7,
"valid_targets_min": 1712
},
{
"epoch": 2.6671732522796354,
"grad_norm": 0.3931845374369816,
"learning_rate": 3.114053388036757e-05,
"loss": 0.1831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17840635776519775,
"step": 1755,
"valid_targets_mean": 5762.4,
"valid_targets_min": 537
},
{
"epoch": 2.674772036474164,
"grad_norm": 0.46325220533318656,
"learning_rate": 3.1077508903949594e-05,
"loss": 0.1857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15973162651062012,
"step": 1760,
"valid_targets_mean": 4577.9,
"valid_targets_min": 1190
},
{
"epoch": 2.682370820668693,
"grad_norm": 0.448314100365069,
"learning_rate": 3.1014324841418025e-05,
"loss": 0.1863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21308580040931702,
"step": 1765,
"valid_targets_mean": 4523.5,
"valid_targets_min": 689
},
{
"epoch": 2.689969604863222,
"grad_norm": 0.4126949676808008,
"learning_rate": 3.095098260017065e-05,
"loss": 0.1889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17054617404937744,
"step": 1770,
"valid_targets_mean": 4661.3,
"valid_targets_min": 940
},
{
"epoch": 2.697568389057751,
"grad_norm": 0.520594987471646,
"learning_rate": 3.088748308987687e-05,
"loss": 0.1926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18412724137306213,
"step": 1775,
"valid_targets_mean": 4541.3,
"valid_targets_min": 425
},
{
"epoch": 2.7051671732522795,
"grad_norm": 0.4292929031518839,
"learning_rate": 3.082382722246467e-05,
"loss": 0.2083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18564680218696594,
"step": 1780,
"valid_targets_mean": 4726.2,
"valid_targets_min": 849
},
{
"epoch": 2.7127659574468086,
"grad_norm": 0.4143100769110258,
"learning_rate": 3.07600159121075e-05,
"loss": 0.1997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19952227175235748,
"step": 1785,
"valid_targets_mean": 6396.9,
"valid_targets_min": 2406
},
{
"epoch": 2.7203647416413372,
"grad_norm": 0.5138412636257836,
"learning_rate": 3.069605007521115e-05,
"loss": 0.198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21767953038215637,
"step": 1790,
"valid_targets_mean": 4080.7,
"valid_targets_min": 855
},
{
"epoch": 2.7279635258358663,
"grad_norm": 0.9274624474305112,
"learning_rate": 3.063193063040061e-05,
"loss": 0.1951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2023240178823471,
"step": 1795,
"valid_targets_mean": 4271.2,
"valid_targets_min": 299
},
{
"epoch": 2.735562310030395,
"grad_norm": 0.4505218736377883,
"learning_rate": 3.0567658498506835e-05,
"loss": 0.2006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19997933506965637,
"step": 1800,
"valid_targets_mean": 6215.2,
"valid_targets_min": 834
},
{
"epoch": 2.743161094224924,
"grad_norm": 0.45112279832870705,
"learning_rate": 3.050323460255359e-05,
"loss": 0.1985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20109710097312927,
"step": 1805,
"valid_targets_mean": 4547.4,
"valid_targets_min": 594
},
{
"epoch": 2.750759878419453,
"grad_norm": 0.45439465696192066,
"learning_rate": 3.0438659867744104e-05,
"loss": 0.2029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22971929609775543,
"step": 1810,
"valid_targets_mean": 4679.8,
"valid_targets_min": 630
},
{
"epoch": 2.7583586626139818,
"grad_norm": 0.4239951858010868,
"learning_rate": 3.0373935221447846e-05,
"loss": 0.1861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18463487923145294,
"step": 1815,
"valid_targets_mean": 4548.8,
"valid_targets_min": 832
},
{
"epoch": 2.7659574468085104,
"grad_norm": 0.46571130038179387,
"learning_rate": 3.030906159318721e-05,
"loss": 0.2062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2257537692785263,
"step": 1820,
"valid_targets_mean": 4535.1,
"valid_targets_min": 822
},
{
"epoch": 2.7735562310030395,
"grad_norm": 0.5251100785646777,
"learning_rate": 3.0244039914624127e-05,
"loss": 0.1944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16839849948883057,
"step": 1825,
"valid_targets_mean": 4547.6,
"valid_targets_min": 551
},
{
"epoch": 2.7811550151975686,
"grad_norm": 0.46551771612143145,
"learning_rate": 3.017887111954671e-05,
"loss": 0.2063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21392841637134552,
"step": 1830,
"valid_targets_mean": 4989.8,
"valid_targets_min": 1092
},
{
"epoch": 2.788753799392097,
"grad_norm": 0.45282545824018966,
"learning_rate": 3.0113556143855836e-05,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17507150769233704,
"step": 1835,
"valid_targets_mean": 3937.5,
"valid_targets_min": 433
},
{
"epoch": 2.7963525835866263,
"grad_norm": 0.8573211013484289,
"learning_rate": 3.004809592555172e-05,
"loss": 0.1924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1929873377084732,
"step": 1840,
"valid_targets_mean": 4398.6,
"valid_targets_min": 447
},
{
"epoch": 2.803951367781155,
"grad_norm": 0.4511946895966249,
"learning_rate": 2.9982491404720408e-05,
"loss": 0.2171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25569894909858704,
"step": 1845,
"valid_targets_mean": 5263.1,
"valid_targets_min": 704
},
{
"epoch": 2.811550151975684,
"grad_norm": 0.4075365034632511,
"learning_rate": 2.9916743523520336e-05,
"loss": 0.1807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18254083395004272,
"step": 1850,
"valid_targets_mean": 5106.1,
"valid_targets_min": 1353
},
{
"epoch": 2.8191489361702127,
"grad_norm": 0.39703735203471957,
"learning_rate": 2.9850853226168738e-05,
"loss": 0.1819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1689942181110382,
"step": 1855,
"valid_targets_mean": 5267.1,
"valid_targets_min": 1235
},
{
"epoch": 2.8267477203647418,
"grad_norm": 0.4300034911707786,
"learning_rate": 2.9784821458928116e-05,
"loss": 0.1834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19870391488075256,
"step": 1860,
"valid_targets_mean": 4619.8,
"valid_targets_min": 672
},
{
"epoch": 2.8343465045592704,
"grad_norm": 0.4731017750575238,
"learning_rate": 2.9718649170092653e-05,
"loss": 0.2051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2331341654062271,
"step": 1865,
"valid_targets_mean": 4517.1,
"valid_targets_min": 673
},
{
"epoch": 2.8419452887537995,
"grad_norm": 0.47588128492307696,
"learning_rate": 2.9652337309974582e-05,
"loss": 0.1766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17996634542942047,
"step": 1870,
"valid_targets_mean": 3985.2,
"valid_targets_min": 962
},
{
"epoch": 2.849544072948328,
"grad_norm": 0.5647869677542844,
"learning_rate": 2.958588683089056e-05,
"loss": 0.194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21768032014369965,
"step": 1875,
"valid_targets_mean": 3708.1,
"valid_targets_min": 342
},
{
"epoch": 2.857142857142857,
"grad_norm": 0.4169198649338515,
"learning_rate": 2.9519298687147945e-05,
"loss": 0.1901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17996545135974884,
"step": 1880,
"valid_targets_mean": 4830.1,
"valid_targets_min": 834
},
{
"epoch": 2.8647416413373863,
"grad_norm": 0.46342593085414296,
"learning_rate": 2.9452573835031154e-05,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17930959165096283,
"step": 1885,
"valid_targets_mean": 5006.9,
"valid_targets_min": 1043
},
{
"epoch": 2.872340425531915,
"grad_norm": 0.5952920705102613,
"learning_rate": 2.9385713232787877e-05,
"loss": 0.1878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17503748834133148,
"step": 1890,
"valid_targets_mean": 4345.5,
"valid_targets_min": 702
},
{
"epoch": 2.8799392097264436,
"grad_norm": 1.5179001765998326,
"learning_rate": 2.9318717840615352e-05,
"loss": 0.1895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17403315007686615,
"step": 1895,
"valid_targets_mean": 5409.5,
"valid_targets_min": 2159
},
{
"epoch": 2.8875379939209727,
"grad_norm": 0.45039073631427357,
"learning_rate": 2.9251588620646543e-05,
"loss": 0.2208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19473648071289062,
"step": 1900,
"valid_targets_mean": 4456.6,
"valid_targets_min": 561
},
{
"epoch": 2.8951367781155017,
"grad_norm": 0.5386037897816643,
"learning_rate": 2.9184326536936356e-05,
"loss": 0.1999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20459288358688354,
"step": 1905,
"valid_targets_mean": 5313.1,
"valid_targets_min": 1889
},
{
"epoch": 2.9027355623100304,
"grad_norm": 0.5171036731287691,
"learning_rate": 2.9116932555447764e-05,
"loss": 0.1924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19427910447120667,
"step": 1910,
"valid_targets_mean": 4551.8,
"valid_targets_min": 640
},
{
"epoch": 2.910334346504559,
"grad_norm": 0.3956323253175454,
"learning_rate": 2.904940764403795e-05,
"loss": 0.1921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16807705163955688,
"step": 1915,
"valid_targets_mean": 5148.9,
"valid_targets_min": 1114
},
{
"epoch": 2.917933130699088,
"grad_norm": 0.4609179179948364,
"learning_rate": 2.898175277244441e-05,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18651928007602692,
"step": 1920,
"valid_targets_mean": 4270.8,
"valid_targets_min": 829
},
{
"epoch": 2.925531914893617,
"grad_norm": 0.3746013132633794,
"learning_rate": 2.891396891227103e-05,
"loss": 0.1966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18432965874671936,
"step": 1925,
"valid_targets_mean": 5464.6,
"valid_targets_min": 869
},
{
"epoch": 2.933130699088146,
"grad_norm": 0.44757073319717156,
"learning_rate": 2.88460570369741e-05,
"loss": 0.1966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2037007212638855,
"step": 1930,
"valid_targets_mean": 5044.7,
"valid_targets_min": 650
},
{
"epoch": 2.940729483282675,
"grad_norm": 0.5165497089688482,
"learning_rate": 2.877801812184838e-05,
"loss": 0.1865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19577309489250183,
"step": 1935,
"valid_targets_mean": 3723.6,
"valid_targets_min": 263
},
{
"epoch": 2.9483282674772036,
"grad_norm": 0.5248044839976569,
"learning_rate": 2.8709853144013063e-05,
"loss": 0.2038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17888793349266052,
"step": 1940,
"valid_targets_mean": 5473.5,
"valid_targets_min": 2971
},
{
"epoch": 2.9559270516717326,
"grad_norm": 0.46290978562548923,
"learning_rate": 2.8641563082397755e-05,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19724613428115845,
"step": 1945,
"valid_targets_mean": 4504.6,
"valid_targets_min": 683
},
{
"epoch": 2.9635258358662613,
"grad_norm": 0.47247130378721536,
"learning_rate": 2.857314891772841e-05,
"loss": 0.2019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1742001324892044,
"step": 1950,
"valid_targets_mean": 4378.8,
"valid_targets_min": 900
},
{
"epoch": 2.9711246200607904,
"grad_norm": 0.38540265276997787,
"learning_rate": 2.850461163251325e-05,
"loss": 0.1819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1545667052268982,
"step": 1955,
"valid_targets_mean": 4485.9,
"valid_targets_min": 825
},
{
"epoch": 2.978723404255319,
"grad_norm": 0.4375842807396514,
"learning_rate": 2.8435952211028652e-05,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20349517464637756,
"step": 1960,
"valid_targets_mean": 4611.9,
"valid_targets_min": 1259
},
{
"epoch": 2.986322188449848,
"grad_norm": 0.393339700104493,
"learning_rate": 2.8367171639305014e-05,
"loss": 0.1937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1762651801109314,
"step": 1965,
"valid_targets_mean": 4854.0,
"valid_targets_min": 1188
},
{
"epoch": 2.9939209726443767,
"grad_norm": 0.4408583709677064,
"learning_rate": 2.8298270905112598e-05,
"loss": 0.2093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17071180045604706,
"step": 1970,
"valid_targets_mean": 4334.9,
"valid_targets_min": 1033
},
{
"epoch": 3.001519756838906,
"grad_norm": 0.4509769720521314,
"learning_rate": 2.8229250997947338e-05,
"loss": 0.1899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19761110842227936,
"step": 1975,
"valid_targets_mean": 5020.1,
"valid_targets_min": 464
},
{
"epoch": 3.0091185410334345,
"grad_norm": 0.44397107618825393,
"learning_rate": 2.8160112909016627e-05,
"loss": 0.1964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15861201286315918,
"step": 1980,
"valid_targets_mean": 4464.9,
"valid_targets_min": 434
},
{
"epoch": 3.0167173252279635,
"grad_norm": 0.4590917607720272,
"learning_rate": 2.8090857631225105e-05,
"loss": 0.1901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17721785604953766,
"step": 1985,
"valid_targets_mean": 4993.2,
"valid_targets_min": 443
},
{
"epoch": 3.024316109422492,
"grad_norm": 1.6476449501443067,
"learning_rate": 2.8021486159160365e-05,
"loss": 0.1809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21059048175811768,
"step": 1990,
"valid_targets_mean": 3777.8,
"valid_targets_min": 567
},
{
"epoch": 3.0319148936170213,
"grad_norm": 0.3955766292317692,
"learning_rate": 2.7951999489078697e-05,
"loss": 0.1775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15698814392089844,
"step": 1995,
"valid_targets_mean": 5706.5,
"valid_targets_min": 1789
},
{
"epoch": 3.0395136778115504,
"grad_norm": 0.6060112559647506,
"learning_rate": 2.7882398618890763e-05,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17217731475830078,
"step": 2000,
"valid_targets_mean": 4799.2,
"valid_targets_min": 675
},
{
"epoch": 3.047112462006079,
"grad_norm": 0.48214170254530214,
"learning_rate": 2.781268454814728e-05,
"loss": 0.1743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18182724714279175,
"step": 2005,
"valid_targets_mean": 4482.8,
"valid_targets_min": 268
},
{
"epoch": 3.054711246200608,
"grad_norm": 0.4254186774774426,
"learning_rate": 2.7742858278024657e-05,
"loss": 0.1831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17712415754795074,
"step": 2010,
"valid_targets_mean": 5016.2,
"valid_targets_min": 933
},
{
"epoch": 3.0623100303951367,
"grad_norm": 0.4561837122624953,
"learning_rate": 2.7672920811310615e-05,
"loss": 0.1813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1763693392276764,
"step": 2015,
"valid_targets_mean": 5105.2,
"valid_targets_min": 1198
},
{
"epoch": 3.069908814589666,
"grad_norm": 0.6538535804895353,
"learning_rate": 2.7602873152389795e-05,
"loss": 0.1796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15733420848846436,
"step": 2020,
"valid_targets_mean": 4136.8,
"valid_targets_min": 1002
},
{
"epoch": 3.0775075987841944,
"grad_norm": 0.4383597724717559,
"learning_rate": 2.7532716307229325e-05,
"loss": 0.1855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18817880749702454,
"step": 2025,
"valid_targets_mean": 4361.4,
"valid_targets_min": 566
},
{
"epoch": 3.0851063829787235,
"grad_norm": 0.4468187218329756,
"learning_rate": 2.7462451283364372e-05,
"loss": 0.1707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18754516541957855,
"step": 2030,
"valid_targets_mean": 5809.6,
"valid_targets_min": 2367
},
{
"epoch": 3.092705167173252,
"grad_norm": 0.4923380379793573,
"learning_rate": 2.739207908988369e-05,
"loss": 0.1697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1901119500398636,
"step": 2035,
"valid_targets_mean": 4648.6,
"valid_targets_min": 651
},
{
"epoch": 3.1003039513677813,
"grad_norm": 0.43950335258891504,
"learning_rate": 2.7321600737415103e-05,
"loss": 0.1882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1579056680202484,
"step": 2040,
"valid_targets_mean": 4848.3,
"valid_targets_min": 513
},
{
"epoch": 3.10790273556231,
"grad_norm": 0.43941575889354745,
"learning_rate": 2.7251017238111014e-05,
"loss": 0.1818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17752686142921448,
"step": 2045,
"valid_targets_mean": 4887.9,
"valid_targets_min": 552
},
{
"epoch": 3.115501519756839,
"grad_norm": 0.43006557381731564,
"learning_rate": 2.718032960563384e-05,
"loss": 0.1937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1756466031074524,
"step": 2050,
"valid_targets_mean": 5296.2,
"valid_targets_min": 1395
},
{
"epoch": 3.1231003039513676,
"grad_norm": 0.3962603202091622,
"learning_rate": 2.710953885514149e-05,
"loss": 0.1642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13223829865455627,
"step": 2055,
"valid_targets_mean": 4657.5,
"valid_targets_min": 1941
},
{
"epoch": 3.1306990881458967,
"grad_norm": 0.47787066171111203,
"learning_rate": 2.7038646003272778e-05,
"loss": 0.178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1752995252609253,
"step": 2060,
"valid_targets_mean": 4332.5,
"valid_targets_min": 523
},
{
"epoch": 3.1382978723404253,
"grad_norm": 0.49333053682614264,
"learning_rate": 2.6967652068132787e-05,
"loss": 0.1647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1864144653081894,
"step": 2065,
"valid_targets_mean": 3611.1,
"valid_targets_min": 567
},
{
"epoch": 3.1458966565349544,
"grad_norm": 0.4781276995658994,
"learning_rate": 2.6896558069278294e-05,
"loss": 0.1792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14743542671203613,
"step": 2070,
"valid_targets_mean": 4010.8,
"valid_targets_min": 543
},
{
"epoch": 3.1534954407294835,
"grad_norm": 0.4481532756441824,
"learning_rate": 2.6825365027703104e-05,
"loss": 0.1789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1980597823858261,
"step": 2075,
"valid_targets_mean": 5291.1,
"valid_targets_min": 446
},
{
"epoch": 3.161094224924012,
"grad_norm": 0.44883490224285716,
"learning_rate": 2.6754073965823394e-05,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19897349178791046,
"step": 2080,
"valid_targets_mean": 5601.1,
"valid_targets_min": 460
},
{
"epoch": 3.1686930091185412,
"grad_norm": 0.47818122842888633,
"learning_rate": 2.668268590746303e-05,
"loss": 0.17,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16886334121227264,
"step": 2085,
"valid_targets_mean": 3956.9,
"valid_targets_min": 672
},
{
"epoch": 3.17629179331307,
"grad_norm": 0.44699975246028895,
"learning_rate": 2.6611201877838858e-05,
"loss": 0.173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1886739879846573,
"step": 2090,
"valid_targets_mean": 5496.0,
"valid_targets_min": 1891
},
{
"epoch": 3.183890577507599,
"grad_norm": 0.46241733640368204,
"learning_rate": 2.6539622903545992e-05,
"loss": 0.1736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16013459861278534,
"step": 2095,
"valid_targets_mean": 5061.5,
"valid_targets_min": 842
},
{
"epoch": 3.1914893617021276,
"grad_norm": 0.419537783672445,
"learning_rate": 2.6467950012543055e-05,
"loss": 0.1806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15453095734119415,
"step": 2100,
"valid_targets_mean": 5147.8,
"valid_targets_min": 1776
},
{
"epoch": 3.1990881458966567,
"grad_norm": 0.4430059744559326,
"learning_rate": 2.639618423413742e-05,
"loss": 0.1786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15962053835391998,
"step": 2105,
"valid_targets_mean": 4258.2,
"valid_targets_min": 719
},
{
"epoch": 3.2066869300911853,
"grad_norm": 0.4601551349059534,
"learning_rate": 2.6324326598970447e-05,
"loss": 0.1801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19752000272274017,
"step": 2110,
"valid_targets_mean": 5594.7,
"valid_targets_min": 2157
},
{
"epoch": 3.2142857142857144,
"grad_norm": 0.4432941671854632,
"learning_rate": 2.6252378139002666e-05,
"loss": 0.177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16792172193527222,
"step": 2115,
"valid_targets_mean": 4681.6,
"valid_targets_min": 831
},
{
"epoch": 3.221884498480243,
"grad_norm": 1.0521842556961734,
"learning_rate": 2.618033988749895e-05,
"loss": 0.1804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18343770503997803,
"step": 2120,
"valid_targets_mean": 4442.8,
"valid_targets_min": 593
},
{
"epoch": 3.229483282674772,
"grad_norm": 0.4703582807896684,
"learning_rate": 2.6108212879013694e-05,
"loss": 0.1775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.182417631149292,
"step": 2125,
"valid_targets_mean": 5050.2,
"valid_targets_min": 882
},
{
"epoch": 3.237082066869301,
"grad_norm": 0.5066204484636513,
"learning_rate": 2.6035998149375928e-05,
"loss": 0.1856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23296314477920532,
"step": 2130,
"valid_targets_mean": 4509.6,
"valid_targets_min": 585
},
{
"epoch": 3.24468085106383,
"grad_norm": 0.47427217437454394,
"learning_rate": 2.5963696735674487e-05,
"loss": 0.1738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1860450804233551,
"step": 2135,
"valid_targets_mean": 4647.2,
"valid_targets_min": 697
},
{
"epoch": 3.2522796352583585,
"grad_norm": 0.4250698588091916,
"learning_rate": 2.5891309676243084e-05,
"loss": 0.185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16689786314964294,
"step": 2140,
"valid_targets_mean": 4561.6,
"valid_targets_min": 756
},
{
"epoch": 3.2598784194528876,
"grad_norm": 0.47029762963920585,
"learning_rate": 2.5818838010645393e-05,
"loss": 0.1641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15192772448062897,
"step": 2145,
"valid_targets_mean": 4186.0,
"valid_targets_min": 434
},
{
"epoch": 3.2674772036474162,
"grad_norm": 0.4554599632142264,
"learning_rate": 2.5746282779660145e-05,
"loss": 0.1752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17261144518852234,
"step": 2150,
"valid_targets_mean": 4568.7,
"valid_targets_min": 1854
},
{
"epoch": 3.2750759878419453,
"grad_norm": 0.4502827257632833,
"learning_rate": 2.5673645025266174e-05,
"loss": 0.178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1779678761959076,
"step": 2155,
"valid_targets_mean": 4289.7,
"valid_targets_min": 781
},
{
"epoch": 3.282674772036474,
"grad_norm": 0.4787827101748988,
"learning_rate": 2.5600925790627423e-05,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1940232217311859,
"step": 2160,
"valid_targets_mean": 4486.1,
"valid_targets_min": 171
},
{
"epoch": 3.290273556231003,
"grad_norm": 0.45438086048067683,
"learning_rate": 2.5528126120078018e-05,
"loss": 0.1949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19441285729408264,
"step": 2165,
"valid_targets_mean": 5050.3,
"valid_targets_min": 1728
},
{
"epoch": 3.297872340425532,
"grad_norm": 0.40566641587346486,
"learning_rate": 2.545524705910722e-05,
"loss": 0.1775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17091290652751923,
"step": 2170,
"valid_targets_mean": 5804.4,
"valid_targets_min": 1156
},
{
"epoch": 3.3054711246200608,
"grad_norm": 0.42598008462425585,
"learning_rate": 2.5382289654344433e-05,
"loss": 0.1803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16645470261573792,
"step": 2175,
"valid_targets_mean": 4971.6,
"valid_targets_min": 673
},
{
"epoch": 3.31306990881459,
"grad_norm": 0.440353868517696,
"learning_rate": 2.530925495354418e-05,
"loss": 0.1739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17304345965385437,
"step": 2180,
"valid_targets_mean": 4552.6,
"valid_targets_min": 1465
},
{
"epoch": 3.3206686930091185,
"grad_norm": 0.45749279193739023,
"learning_rate": 2.523614400557103e-05,
"loss": 0.167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16047537326812744,
"step": 2185,
"valid_targets_mean": 4131.4,
"valid_targets_min": 641
},
{
"epoch": 3.3282674772036476,
"grad_norm": 0.42763280388882297,
"learning_rate": 2.516295786038457e-05,
"loss": 0.179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19560299813747406,
"step": 2190,
"valid_targets_mean": 5307.1,
"valid_targets_min": 686
},
{
"epoch": 3.335866261398176,
"grad_norm": 0.45229487644284055,
"learning_rate": 2.5089697569024293e-05,
"loss": 0.1744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17956998944282532,
"step": 2195,
"valid_targets_mean": 4415.1,
"valid_targets_min": 479
},
{
"epoch": 3.3434650455927053,
"grad_norm": 0.49947402828635423,
"learning_rate": 2.501636418359453e-05,
"loss": 0.1826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19726476073265076,
"step": 2200,
"valid_targets_mean": 4160.0,
"valid_targets_min": 702
},
{
"epoch": 3.351063829787234,
"grad_norm": 0.5624015949940533,
"learning_rate": 2.4942958757249322e-05,
"loss": 0.1751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17548981308937073,
"step": 2205,
"valid_targets_mean": 4641.6,
"valid_targets_min": 741
},
{
"epoch": 3.358662613981763,
"grad_norm": 0.47188014259395983,
"learning_rate": 2.4869482344177297e-05,
"loss": 0.1912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.191510871052742,
"step": 2210,
"valid_targets_mean": 5098.9,
"valid_targets_min": 732
},
{
"epoch": 3.3662613981762917,
"grad_norm": 0.4044372525372168,
"learning_rate": 2.479593599958655e-05,
"loss": 0.1633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1595427691936493,
"step": 2215,
"valid_targets_mean": 4987.1,
"valid_targets_min": 2150
},
{
"epoch": 3.3738601823708207,
"grad_norm": 0.4610514723176418,
"learning_rate": 2.472232077968947e-05,
"loss": 0.1863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18796592950820923,
"step": 2220,
"valid_targets_mean": 4755.8,
"valid_targets_min": 804
},
{
"epoch": 3.3814589665653494,
"grad_norm": 0.4762033973991841,
"learning_rate": 2.4648637741687572e-05,
"loss": 0.1773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17647765576839447,
"step": 2225,
"valid_targets_mean": 4052.8,
"valid_targets_min": 1097
},
{
"epoch": 3.3890577507598785,
"grad_norm": 0.5674700704733731,
"learning_rate": 2.4574887943756322e-05,
"loss": 0.1841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21014189720153809,
"step": 2230,
"valid_targets_mean": 5642.9,
"valid_targets_min": 887
},
{
"epoch": 3.396656534954407,
"grad_norm": 0.45407587371796526,
"learning_rate": 2.450107244502994e-05,
"loss": 0.1911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18419310450553894,
"step": 2235,
"valid_targets_mean": 4964.2,
"valid_targets_min": 631
},
{
"epoch": 3.404255319148936,
"grad_norm": 0.6036076286770431,
"learning_rate": 2.442719230558619e-05,
"loss": 0.1935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19704486429691315,
"step": 2240,
"valid_targets_mean": 3990.9,
"valid_targets_min": 879
},
{
"epoch": 3.4118541033434653,
"grad_norm": 0.5044426709371705,
"learning_rate": 2.435324858643114e-05,
"loss": 0.1888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17976920306682587,
"step": 2245,
"valid_targets_mean": 4607.1,
"valid_targets_min": 276
},
{
"epoch": 3.419452887537994,
"grad_norm": 0.47427419752248345,
"learning_rate": 2.4279242349483945e-05,
"loss": 0.1869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18903280794620514,
"step": 2250,
"valid_targets_mean": 4716.1,
"valid_targets_min": 1806
},
{
"epoch": 3.4270516717325226,
"grad_norm": 0.5315098096977057,
"learning_rate": 2.42051746575616e-05,
"loss": 0.1807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22392138838768005,
"step": 2255,
"valid_targets_mean": 3496.4,
"valid_targets_min": 263
},
{
"epoch": 3.4346504559270516,
"grad_norm": 0.39060444130604355,
"learning_rate": 2.413104657436365e-05,
"loss": 0.1621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14147084951400757,
"step": 2260,
"valid_targets_mean": 4482.1,
"valid_targets_min": 527
},
{
"epoch": 3.4422492401215807,
"grad_norm": 0.44338388859066824,
"learning_rate": 2.4056859164456933e-05,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20094552636146545,
"step": 2265,
"valid_targets_mean": 5268.6,
"valid_targets_min": 601
},
{
"epoch": 3.4498480243161094,
"grad_norm": 0.4361432780966179,
"learning_rate": 2.3982613493260298e-05,
"loss": 0.1887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1768036186695099,
"step": 2270,
"valid_targets_mean": 5291.0,
"valid_targets_min": 506
},
{
"epoch": 3.4574468085106385,
"grad_norm": 0.5069263015357972,
"learning_rate": 2.390831062702929e-05,
"loss": 0.1829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19090662896633148,
"step": 2275,
"valid_targets_mean": 4792.0,
"valid_targets_min": 361
},
{
"epoch": 3.465045592705167,
"grad_norm": 0.40616123029264917,
"learning_rate": 2.383395163284083e-05,
"loss": 0.1709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15730628371238708,
"step": 2280,
"valid_targets_mean": 5398.0,
"valid_targets_min": 1965
},
{
"epoch": 3.472644376899696,
"grad_norm": 0.4339438381996928,
"learning_rate": 2.3759537578577926e-05,
"loss": 0.1815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16227596998214722,
"step": 2285,
"valid_targets_mean": 5389.4,
"valid_targets_min": 682
},
{
"epoch": 3.480243161094225,
"grad_norm": 0.44867888022495267,
"learning_rate": 2.3685069532914292e-05,
"loss": 0.1797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1895052194595337,
"step": 2290,
"valid_targets_mean": 5373.5,
"valid_targets_min": 1378
},
{
"epoch": 3.487841945288754,
"grad_norm": 0.45859302831224075,
"learning_rate": 2.3610548565299044e-05,
"loss": 0.1759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.161161869764328,
"step": 2295,
"valid_targets_mean": 4974.8,
"valid_targets_min": 963
},
{
"epoch": 3.4954407294832825,
"grad_norm": 0.47990973790811997,
"learning_rate": 2.35359757459413e-05,
"loss": 0.1861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1807297170162201,
"step": 2300,
"valid_targets_mean": 3966.6,
"valid_targets_min": 594
},
{
"epoch": 3.5030395136778116,
"grad_norm": 0.4458814501241054,
"learning_rate": 2.3461352145794835e-05,
"loss": 0.1871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1584734320640564,
"step": 2305,
"valid_targets_mean": 4710.0,
"valid_targets_min": 1068
},
{
"epoch": 3.5106382978723403,
"grad_norm": 0.5204277337187776,
"learning_rate": 2.338667883654271e-05,
"loss": 0.1726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19432294368743896,
"step": 2310,
"valid_targets_mean": 3841.7,
"valid_targets_min": 403
},
{
"epoch": 3.5182370820668694,
"grad_norm": 0.5002703947790278,
"learning_rate": 2.3311956890581845e-05,
"loss": 0.1985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1830371916294098,
"step": 2315,
"valid_targets_mean": 4266.8,
"valid_targets_min": 588
},
{
"epoch": 3.5258358662613984,
"grad_norm": 0.45671055489988216,
"learning_rate": 2.3237187381007654e-05,
"loss": 0.1758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17926675081253052,
"step": 2320,
"valid_targets_mean": 4515.0,
"valid_targets_min": 654
},
{
"epoch": 3.533434650455927,
"grad_norm": 0.44706162372061575,
"learning_rate": 2.3162371381598627e-05,
"loss": 0.1722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17958760261535645,
"step": 2325,
"valid_targets_mean": 4538.9,
"valid_targets_min": 646
},
{
"epoch": 3.5410334346504557,
"grad_norm": 0.48526337740475023,
"learning_rate": 2.308750996680089e-05,
"loss": 0.1857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1857941448688507,
"step": 2330,
"valid_targets_mean": 4541.9,
"valid_targets_min": 718
},
{
"epoch": 3.548632218844985,
"grad_norm": 0.6863209953782875,
"learning_rate": 2.3012604211712787e-05,
"loss": 0.1801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15989352762699127,
"step": 2335,
"valid_targets_mean": 4711.3,
"valid_targets_min": 905
},
{
"epoch": 3.556231003039514,
"grad_norm": 0.43601817882878313,
"learning_rate": 2.2937655192069453e-05,
"loss": 0.1727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15695396065711975,
"step": 2340,
"valid_targets_mean": 4525.1,
"valid_targets_min": 554
},
{
"epoch": 3.5638297872340425,
"grad_norm": 0.4384690019868411,
"learning_rate": 2.286266398422734e-05,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17277196049690247,
"step": 2345,
"valid_targets_mean": 5536.7,
"valid_targets_min": 966
},
{
"epoch": 3.571428571428571,
"grad_norm": 0.50720927906344,
"learning_rate": 2.278763166514879e-05,
"loss": 0.1735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1746547669172287,
"step": 2350,
"valid_targets_mean": 4262.4,
"valid_targets_min": 688
},
{
"epoch": 3.5790273556231003,
"grad_norm": 0.5082859794711881,
"learning_rate": 2.2712559312386525e-05,
"loss": 0.1545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16094228625297546,
"step": 2355,
"valid_targets_mean": 4750.5,
"valid_targets_min": 354
},
{
"epoch": 3.5866261398176293,
"grad_norm": 0.5324693739038185,
"learning_rate": 2.2637448004068227e-05,
"loss": 0.186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1898549497127533,
"step": 2360,
"valid_targets_mean": 4889.1,
"valid_targets_min": 868
},
{
"epoch": 3.594224924012158,
"grad_norm": 0.40332096235924436,
"learning_rate": 2.2562298818881005e-05,
"loss": 0.1729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1677415668964386,
"step": 2365,
"valid_targets_mean": 4815.6,
"valid_targets_min": 449
},
{
"epoch": 3.601823708206687,
"grad_norm": 0.4975962462446565,
"learning_rate": 2.2487112836055932e-05,
"loss": 0.1714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1909307986497879,
"step": 2370,
"valid_targets_mean": 4240.7,
"valid_targets_min": 873
},
{
"epoch": 3.6094224924012157,
"grad_norm": 0.4333440171846238,
"learning_rate": 2.241189113535253e-05,
"loss": 0.1729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17210185527801514,
"step": 2375,
"valid_targets_mean": 4546.3,
"valid_targets_min": 814
},
{
"epoch": 3.617021276595745,
"grad_norm": 0.4286229722867218,
"learning_rate": 2.2336634797043294e-05,
"loss": 0.1767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17077794671058655,
"step": 2380,
"valid_targets_mean": 4828.9,
"valid_targets_min": 2075
},
{
"epoch": 3.6246200607902734,
"grad_norm": 0.5351152453484341,
"learning_rate": 2.226134490189813e-05,
"loss": 0.1864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20225580036640167,
"step": 2385,
"valid_targets_mean": 4493.8,
"valid_targets_min": 816
},
{
"epoch": 3.6322188449848025,
"grad_norm": 0.4595793337143316,
"learning_rate": 2.2186022531168877e-05,
"loss": 0.1806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18067389726638794,
"step": 2390,
"valid_targets_mean": 4226.4,
"valid_targets_min": 876
},
{
"epoch": 3.639817629179331,
"grad_norm": 0.4376288036773449,
"learning_rate": 2.2110668766573756e-05,
"loss": 0.1839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17458736896514893,
"step": 2395,
"valid_targets_mean": 4607.4,
"valid_targets_min": 378
},
{
"epoch": 3.6474164133738602,
"grad_norm": 0.4235273238288212,
"learning_rate": 2.2035284690281835e-05,
"loss": 0.1662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16206535696983337,
"step": 2400,
"valid_targets_mean": 4671.6,
"valid_targets_min": 427
},
{
"epoch": 3.655015197568389,
"grad_norm": 0.4645835996278293,
"learning_rate": 2.1959871384897508e-05,
"loss": 0.168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1612105816602707,
"step": 2405,
"valid_targets_mean": 4012.2,
"valid_targets_min": 736
},
{
"epoch": 3.662613981762918,
"grad_norm": 0.4339263612443116,
"learning_rate": 2.188442993344492e-05,
"loss": 0.1828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18110080063343048,
"step": 2410,
"valid_targets_mean": 5371.9,
"valid_targets_min": 1880
},
{
"epoch": 3.670212765957447,
"grad_norm": 0.5156390412963044,
"learning_rate": 2.1808961419352433e-05,
"loss": 0.1856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19328826665878296,
"step": 2415,
"valid_targets_mean": 5049.5,
"valid_targets_min": 1733
},
{
"epoch": 3.6778115501519757,
"grad_norm": 0.4257958182746545,
"learning_rate": 2.173346692643706e-05,
"loss": 0.165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15053753554821014,
"step": 2420,
"valid_targets_mean": 4545.5,
"valid_targets_min": 845
},
{
"epoch": 3.6854103343465043,
"grad_norm": 0.41421446171755727,
"learning_rate": 2.1657947538888907e-05,
"loss": 0.1751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15670928359031677,
"step": 2425,
"valid_targets_mean": 4735.4,
"valid_targets_min": 2303
},
{
"epoch": 3.6930091185410334,
"grad_norm": 0.46488209722389967,
"learning_rate": 2.158240434125557e-05,
"loss": 0.1809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17502865195274353,
"step": 2430,
"valid_targets_mean": 4069.9,
"valid_targets_min": 843
},
{
"epoch": 3.7006079027355625,
"grad_norm": 0.44273639823588856,
"learning_rate": 2.150683841842662e-05,
"loss": 0.1701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17152325809001923,
"step": 2435,
"valid_targets_mean": 4846.6,
"valid_targets_min": 1167
},
{
"epoch": 3.708206686930091,
"grad_norm": 0.41156415643010313,
"learning_rate": 2.1431250855617978e-05,
"loss": 0.1742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15151536464691162,
"step": 2440,
"valid_targets_mean": 4472.1,
"valid_targets_min": 280
},
{
"epoch": 3.71580547112462,
"grad_norm": 0.45636761630984557,
"learning_rate": 2.1355642738356327e-05,
"loss": 0.1666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16730879247188568,
"step": 2445,
"valid_targets_mean": 3877.2,
"valid_targets_min": 406
},
{
"epoch": 3.723404255319149,
"grad_norm": 0.41821546008836596,
"learning_rate": 2.128001515246355e-05,
"loss": 0.1752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1652117371559143,
"step": 2450,
"valid_targets_mean": 5117.6,
"valid_targets_min": 1054
},
{
"epoch": 3.731003039513678,
"grad_norm": 0.5195131380448494,
"learning_rate": 2.1204369184041115e-05,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21220675110816956,
"step": 2455,
"valid_targets_mean": 3935.9,
"valid_targets_min": 608
},
{
"epoch": 3.7386018237082066,
"grad_norm": 0.4759365332843418,
"learning_rate": 2.1128705919454488e-05,
"loss": 0.1819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21190626919269562,
"step": 2460,
"valid_targets_mean": 5204.1,
"valid_targets_min": 776
},
{
"epoch": 3.7462006079027357,
"grad_norm": 0.44340296838544296,
"learning_rate": 2.1053026445317534e-05,
"loss": 0.1841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16357441246509552,
"step": 2465,
"valid_targets_mean": 5137.4,
"valid_targets_min": 531
},
{
"epoch": 3.7537993920972643,
"grad_norm": 0.602232408360396,
"learning_rate": 2.09773318484769e-05,
"loss": 0.1669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14004534482955933,
"step": 2470,
"valid_targets_mean": 4292.4,
"valid_targets_min": 861
},
{
"epoch": 3.7613981762917934,
"grad_norm": 0.4860093104756001,
"learning_rate": 2.0901623215996406e-05,
"loss": 0.1819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17179439961910248,
"step": 2475,
"valid_targets_mean": 4222.4,
"valid_targets_min": 2111
},
{
"epoch": 3.768996960486322,
"grad_norm": 0.5345377630387919,
"learning_rate": 2.082590163514146e-05,
"loss": 0.188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19142243266105652,
"step": 2480,
"valid_targets_mean": 3549.6,
"valid_targets_min": 650
},
{
"epoch": 3.776595744680851,
"grad_norm": 0.5131611773395347,
"learning_rate": 2.07501681933634e-05,
"loss": 0.1842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23167961835861206,
"step": 2485,
"valid_targets_mean": 4783.1,
"valid_targets_min": 422
},
{
"epoch": 3.78419452887538,
"grad_norm": 0.43772278574910306,
"learning_rate": 2.0674423978283924e-05,
"loss": 0.1702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.159462109208107,
"step": 2490,
"valid_targets_mean": 4151.8,
"valid_targets_min": 1045
},
{
"epoch": 3.791793313069909,
"grad_norm": 0.48634040579611115,
"learning_rate": 2.059867007767943e-05,
"loss": 0.1729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1738453060388565,
"step": 2495,
"valid_targets_mean": 4146.1,
"valid_targets_min": 314
},
{
"epoch": 3.7993920972644375,
"grad_norm": 0.45093092640477583,
"learning_rate": 2.0522907579465413e-05,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1663065254688263,
"step": 2500,
"valid_targets_mean": 3941.2,
"valid_targets_min": 1010
},
{
"epoch": 3.8069908814589666,
"grad_norm": 0.50654438664862,
"learning_rate": 2.0447137571680856e-05,
"loss": 0.1978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20836275815963745,
"step": 2505,
"valid_targets_mean": 4301.9,
"valid_targets_min": 870
},
{
"epoch": 3.8145896656534957,
"grad_norm": 0.47213930537918863,
"learning_rate": 2.037136114247257e-05,
"loss": 0.1906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19136860966682434,
"step": 2510,
"valid_targets_mean": 4427.4,
"valid_targets_min": 571
},
{
"epoch": 3.8221884498480243,
"grad_norm": 0.6652881182583804,
"learning_rate": 2.0295579380079596e-05,
"loss": 0.1825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16894681751728058,
"step": 2515,
"valid_targets_mean": 4250.4,
"valid_targets_min": 473
},
{
"epoch": 3.829787234042553,
"grad_norm": 0.4220064998153064,
"learning_rate": 2.0219793372817557e-05,
"loss": 0.1764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1527949720621109,
"step": 2520,
"valid_targets_mean": 4826.4,
"valid_targets_min": 827
},
{
"epoch": 3.837386018237082,
"grad_norm": 0.43668863176276407,
"learning_rate": 2.0144004209063042e-05,
"loss": 0.176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1740725338459015,
"step": 2525,
"valid_targets_mean": 4150.2,
"valid_targets_min": 772
},
{
"epoch": 3.844984802431611,
"grad_norm": 0.3823174418425911,
"learning_rate": 2.0068212977237983e-05,
"loss": 0.1655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14751499891281128,
"step": 2530,
"valid_targets_mean": 5399.6,
"valid_targets_min": 2779
},
{
"epoch": 3.8525835866261398,
"grad_norm": 0.4587095534889756,
"learning_rate": 1.999242076579398e-05,
"loss": 0.1775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19451266527175903,
"step": 2535,
"valid_targets_mean": 4256.1,
"valid_targets_min": 743
},
{
"epoch": 3.860182370820669,
"grad_norm": 0.45169233975095224,
"learning_rate": 1.9916628663196743e-05,
"loss": 0.1892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17704080045223236,
"step": 2540,
"valid_targets_mean": 4775.8,
"valid_targets_min": 2350
},
{
"epoch": 3.8677811550151975,
"grad_norm": 1.675127625058686,
"learning_rate": 1.9840837757910383e-05,
"loss": 0.1858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1759578138589859,
"step": 2545,
"valid_targets_mean": 4113.9,
"valid_targets_min": 720
},
{
"epoch": 3.8753799392097266,
"grad_norm": 0.43203621299681155,
"learning_rate": 1.976504913838184e-05,
"loss": 0.1811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1715025007724762,
"step": 2550,
"valid_targets_mean": 5221.4,
"valid_targets_min": 1839
},
{
"epoch": 3.882978723404255,
"grad_norm": 0.4384904057940854,
"learning_rate": 1.968926389302521e-05,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16733646392822266,
"step": 2555,
"valid_targets_mean": 4565.3,
"valid_targets_min": 609
},
{
"epoch": 3.8905775075987843,
"grad_norm": 0.4481617113710614,
"learning_rate": 1.9613483110206154e-05,
"loss": 0.1701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17321643233299255,
"step": 2560,
"valid_targets_mean": 4512.8,
"valid_targets_min": 895
},
{
"epoch": 3.898176291793313,
"grad_norm": 0.45819511671682567,
"learning_rate": 1.9537707878226216e-05,
"loss": 0.1737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17141106724739075,
"step": 2565,
"valid_targets_mean": 4315.5,
"valid_targets_min": 440
},
{
"epoch": 3.905775075987842,
"grad_norm": 0.4764235545857351,
"learning_rate": 1.9461939285307247e-05,
"loss": 0.1797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1686917096376419,
"step": 2570,
"valid_targets_mean": 3827.4,
"valid_targets_min": 622
},
{
"epoch": 3.9133738601823707,
"grad_norm": 0.4437209902659711,
"learning_rate": 1.9386178419575745e-05,
"loss": 0.1714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16246762871742249,
"step": 2575,
"valid_targets_mean": 4545.2,
"valid_targets_min": 746
},
{
"epoch": 3.9209726443768997,
"grad_norm": 0.3844261379651969,
"learning_rate": 1.931042636904724e-05,
"loss": 0.1759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17688338458538055,
"step": 2580,
"valid_targets_mean": 5911.6,
"valid_targets_min": 3130
},
{
"epoch": 3.928571428571429,
"grad_norm": 0.4052859116056726,
"learning_rate": 1.923468422161066e-05,
"loss": 0.1789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16950541734695435,
"step": 2585,
"valid_targets_mean": 5731.0,
"valid_targets_min": 509
},
{
"epoch": 3.9361702127659575,
"grad_norm": 0.4236870787112286,
"learning_rate": 1.9158953065012715e-05,
"loss": 0.1718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15792736411094666,
"step": 2590,
"valid_targets_mean": 5720.6,
"valid_targets_min": 2293
},
{
"epoch": 3.943768996960486,
"grad_norm": 0.46365326810020263,
"learning_rate": 1.9083233986842275e-05,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17180944979190826,
"step": 2595,
"valid_targets_mean": 5083.0,
"valid_targets_min": 711
},
{
"epoch": 3.951367781155015,
"grad_norm": 0.44863750873052993,
"learning_rate": 1.900752807451475e-05,
"loss": 0.1793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16900160908699036,
"step": 2600,
"valid_targets_mean": 4392.1,
"valid_targets_min": 810
},
{
"epoch": 3.9589665653495443,
"grad_norm": 0.462622398920299,
"learning_rate": 1.8931836415256468e-05,
"loss": 0.1788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16800816357135773,
"step": 2605,
"valid_targets_mean": 4713.2,
"valid_targets_min": 740
},
{
"epoch": 3.966565349544073,
"grad_norm": 0.46050975543187894,
"learning_rate": 1.885616009608907e-05,
"loss": 0.1654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14823880791664124,
"step": 2610,
"valid_targets_mean": 4082.6,
"valid_targets_min": 401
},
{
"epoch": 3.9741641337386016,
"grad_norm": 0.46421973514436904,
"learning_rate": 1.8780500203813902e-05,
"loss": 0.1726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18864090740680695,
"step": 2615,
"valid_targets_mean": 4411.6,
"valid_targets_min": 655
},
{
"epoch": 3.9817629179331306,
"grad_norm": 0.4291031448782404,
"learning_rate": 1.870485782499638e-05,
"loss": 0.1723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17856952548027039,
"step": 2620,
"valid_targets_mean": 4765.4,
"valid_targets_min": 348
},
{
"epoch": 3.9893617021276597,
"grad_norm": 0.44985063891512206,
"learning_rate": 1.8629234045950434e-05,
"loss": 0.1904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16248270869255066,
"step": 2625,
"valid_targets_mean": 4526.0,
"valid_targets_min": 1027
},
{
"epoch": 3.9969604863221884,
"grad_norm": 0.4752973434947488,
"learning_rate": 1.8553629952722853e-05,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17370517551898956,
"step": 2630,
"valid_targets_mean": 4128.8,
"valid_targets_min": 843
},
{
"epoch": 4.004559270516717,
"grad_norm": 0.4277885641586408,
"learning_rate": 1.8478046631077734e-05,
"loss": 0.167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1758805513381958,
"step": 2635,
"valid_targets_mean": 4960.5,
"valid_targets_min": 647
},
{
"epoch": 4.0121580547112465,
"grad_norm": 0.4340489860844752,
"learning_rate": 1.8402485166480854e-05,
"loss": 0.1694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1884659081697464,
"step": 2640,
"valid_targets_mean": 5273.1,
"valid_targets_min": 787
},
{
"epoch": 4.019756838905775,
"grad_norm": 0.4325490917240746,
"learning_rate": 1.8326946644084112e-05,
"loss": 0.1573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1543048769235611,
"step": 2645,
"valid_targets_mean": 4604.4,
"valid_targets_min": 547
},
{
"epoch": 4.027355623100304,
"grad_norm": 0.5514612078158647,
"learning_rate": 1.8251432148709912e-05,
"loss": 0.1535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1609114408493042,
"step": 2650,
"valid_targets_mean": 3597.3,
"valid_targets_min": 695
},
{
"epoch": 4.0349544072948325,
"grad_norm": 0.43126338580266377,
"learning_rate": 1.817594276483563e-05,
"loss": 0.1579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18365256488323212,
"step": 2655,
"valid_targets_mean": 5326.8,
"valid_targets_min": 666
},
{
"epoch": 4.042553191489362,
"grad_norm": 0.4737332570423805,
"learning_rate": 1.8100479576577973e-05,
"loss": 0.1625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17224054038524628,
"step": 2660,
"valid_targets_mean": 4818.4,
"valid_targets_min": 918
},
{
"epoch": 4.050151975683891,
"grad_norm": 0.4438849641405412,
"learning_rate": 1.8025043667677484e-05,
"loss": 0.166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1628122627735138,
"step": 2665,
"valid_targets_mean": 4852.9,
"valid_targets_min": 1421
},
{
"epoch": 4.057750759878419,
"grad_norm": 0.5200587086302579,
"learning_rate": 1.794963612148291e-05,
"loss": 0.1565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1755530685186386,
"step": 2670,
"valid_targets_mean": 3932.9,
"valid_targets_min": 844
},
{
"epoch": 4.065349544072948,
"grad_norm": 0.5142004311196928,
"learning_rate": 1.7874258020935708e-05,
"loss": 0.1792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16136983036994934,
"step": 2675,
"valid_targets_mean": 3818.9,
"valid_targets_min": 758
},
{
"epoch": 4.072948328267477,
"grad_norm": 0.47669155432301397,
"learning_rate": 1.7798910448554433e-05,
"loss": 0.1749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17607629299163818,
"step": 2680,
"valid_targets_mean": 4376.6,
"valid_targets_min": 1368
},
{
"epoch": 4.080547112462006,
"grad_norm": 0.4655137661586852,
"learning_rate": 1.7723594486419245e-05,
"loss": 0.163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15961049497127533,
"step": 2685,
"valid_targets_mean": 4512.1,
"valid_targets_min": 1601
},
{
"epoch": 4.088145896656535,
"grad_norm": 0.7525257215139017,
"learning_rate": 1.764831121615631e-05,
"loss": 0.1675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21296311914920807,
"step": 2690,
"valid_targets_mean": 4298.8,
"valid_targets_min": 756
},
{
"epoch": 4.095744680851064,
"grad_norm": 0.4433451433036404,
"learning_rate": 1.7573061718922347e-05,
"loss": 0.1641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16739048063755035,
"step": 2695,
"valid_targets_mean": 5009.2,
"valid_targets_min": 853
},
{
"epoch": 4.103343465045593,
"grad_norm": 0.4830355618281073,
"learning_rate": 1.7497847075389004e-05,
"loss": 0.1621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16623979806900024,
"step": 2700,
"valid_targets_mean": 4105.4,
"valid_targets_min": 714
},
{
"epoch": 4.1109422492401215,
"grad_norm": 0.4179613714457159,
"learning_rate": 1.7422668365727428e-05,
"loss": 0.1572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16168740391731262,
"step": 2705,
"valid_targets_mean": 5317.4,
"valid_targets_min": 1811
},
{
"epoch": 4.11854103343465,
"grad_norm": 0.5056361715181314,
"learning_rate": 1.734752666959268e-05,
"loss": 0.1659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16789555549621582,
"step": 2710,
"valid_targets_mean": 4172.6,
"valid_targets_min": 666
},
{
"epoch": 4.12613981762918,
"grad_norm": 0.48722281404971973,
"learning_rate": 1.7272423066108306e-05,
"loss": 0.171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17382162809371948,
"step": 2715,
"valid_targets_mean": 4376.5,
"valid_targets_min": 263
},
{
"epoch": 4.133738601823708,
"grad_norm": 0.4790825604864442,
"learning_rate": 1.7197358633850744e-05,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16230902075767517,
"step": 2720,
"valid_targets_mean": 4323.8,
"valid_targets_min": 370
},
{
"epoch": 4.141337386018237,
"grad_norm": 0.41425680904063444,
"learning_rate": 1.7122334450833933e-05,
"loss": 0.1532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18430155515670776,
"step": 2725,
"valid_targets_mean": 6086.1,
"valid_targets_min": 567
},
{
"epoch": 4.148936170212766,
"grad_norm": 0.4752171364109056,
"learning_rate": 1.7047351594493755e-05,
"loss": 0.1739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1950949728488922,
"step": 2730,
"valid_targets_mean": 5050.2,
"valid_targets_min": 804
},
{
"epoch": 4.156534954407295,
"grad_norm": 0.4757519244575605,
"learning_rate": 1.6972411141672614e-05,
"loss": 0.1621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1867167055606842,
"step": 2735,
"valid_targets_mean": 4470.1,
"valid_targets_min": 828
},
{
"epoch": 4.164133738601824,
"grad_norm": 0.4513608069410081,
"learning_rate": 1.6897514168603924e-05,
"loss": 0.1696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1613789200782776,
"step": 2740,
"valid_targets_mean": 4477.4,
"valid_targets_min": 742
},
{
"epoch": 4.171732522796352,
"grad_norm": 0.5141640145999388,
"learning_rate": 1.6822661750896707e-05,
"loss": 0.1524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19608411192893982,
"step": 2745,
"valid_targets_mean": 4257.2,
"valid_targets_min": 892
},
{
"epoch": 4.179331306990881,
"grad_norm": 0.4724318719284284,
"learning_rate": 1.67478549635201e-05,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1456223726272583,
"step": 2750,
"valid_targets_mean": 4336.9,
"valid_targets_min": 541
},
{
"epoch": 4.186930091185411,
"grad_norm": 0.4970941462233452,
"learning_rate": 1.6673094880787933e-05,
"loss": 0.1661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1658686399459839,
"step": 2755,
"valid_targets_mean": 4121.6,
"valid_targets_min": 601
},
{
"epoch": 4.194528875379939,
"grad_norm": 0.5000186608612818,
"learning_rate": 1.6598382576343312e-05,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16827929019927979,
"step": 2760,
"valid_targets_mean": 5388.8,
"valid_targets_min": 1463
},
{
"epoch": 4.202127659574468,
"grad_norm": 0.4684433964610707,
"learning_rate": 1.6523719123143186e-05,
"loss": 0.1547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15693283081054688,
"step": 2765,
"valid_targets_mean": 4821.7,
"valid_targets_min": 746
},
{
"epoch": 4.2097264437689965,
"grad_norm": 0.45967354792383214,
"learning_rate": 1.6449105593442936e-05,
"loss": 0.1779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19241458177566528,
"step": 2770,
"valid_targets_mean": 4597.6,
"valid_targets_min": 855
},
{
"epoch": 4.217325227963526,
"grad_norm": 0.4733160030781719,
"learning_rate": 1.6374543058780998e-05,
"loss": 0.1576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16462013125419617,
"step": 2775,
"valid_targets_mean": 4405.4,
"valid_targets_min": 850
},
{
"epoch": 4.224924012158055,
"grad_norm": 0.4815352707164652,
"learning_rate": 1.6300032589963436e-05,
"loss": 0.1669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15910238027572632,
"step": 2780,
"valid_targets_mean": 4541.5,
"valid_targets_min": 909
},
{
"epoch": 4.232522796352583,
"grad_norm": 0.47250106872988024,
"learning_rate": 1.6225575257048622e-05,
"loss": 0.1587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1517636775970459,
"step": 2785,
"valid_targets_mean": 4741.7,
"valid_targets_min": 1120
},
{
"epoch": 4.240121580547113,
"grad_norm": 1.1194758985013034,
"learning_rate": 1.6151172129331786e-05,
"loss": 0.1722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16665083169937134,
"step": 2790,
"valid_targets_mean": 4795.9,
"valid_targets_min": 567
},
{
"epoch": 4.2477203647416415,
"grad_norm": 0.5081276624925015,
"learning_rate": 1.6076824275329758e-05,
"loss": 0.1719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16445952653884888,
"step": 2795,
"valid_targets_mean": 4864.7,
"valid_targets_min": 1608
},
{
"epoch": 4.25531914893617,
"grad_norm": 0.48328270331504203,
"learning_rate": 1.6002532762765524e-05,
"loss": 0.164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17975090444087982,
"step": 2800,
"valid_targets_mean": 4240.7,
"valid_targets_min": 616
},
{
"epoch": 4.262917933130699,
"grad_norm": 0.46912231409179,
"learning_rate": 1.5928298658552988e-05,
"loss": 0.169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1919006109237671,
"step": 2805,
"valid_targets_mean": 5055.8,
"valid_targets_min": 588
},
{
"epoch": 4.270516717325228,
"grad_norm": 0.6210976552983519,
"learning_rate": 1.5854123028781557e-05,
"loss": 0.1585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1582549810409546,
"step": 2810,
"valid_targets_mean": 3868.8,
"valid_targets_min": 365
},
{
"epoch": 4.278115501519757,
"grad_norm": 0.4072288493810071,
"learning_rate": 1.5780006938700917e-05,
"loss": 0.1584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16181963682174683,
"step": 2815,
"valid_targets_mean": 5906.6,
"valid_targets_min": 1016
},
{
"epoch": 4.285714285714286,
"grad_norm": 0.45582906884120683,
"learning_rate": 1.5705951452705654e-05,
"loss": 0.1661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14693260192871094,
"step": 2820,
"valid_targets_mean": 4234.7,
"valid_targets_min": 811
},
{
"epoch": 4.293313069908814,
"grad_norm": 0.5429695412336001,
"learning_rate": 1.5631957634320048e-05,
"loss": 0.1697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1935248076915741,
"step": 2825,
"valid_targets_mean": 4832.9,
"valid_targets_min": 774
},
{
"epoch": 4.300911854103344,
"grad_norm": 0.46340922363130344,
"learning_rate": 1.555802654618272e-05,
"loss": 0.1622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17274600267410278,
"step": 2830,
"valid_targets_mean": 5227.2,
"valid_targets_min": 933
},
{
"epoch": 4.308510638297872,
"grad_norm": 0.8213856644150885,
"learning_rate": 1.5484159250031445e-05,
"loss": 0.1661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17811016738414764,
"step": 2835,
"valid_targets_mean": 3817.1,
"valid_targets_min": 692
},
{
"epoch": 4.316109422492401,
"grad_norm": 0.4391910613617335,
"learning_rate": 1.541035680668785e-05,
"loss": 0.1592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17826610803604126,
"step": 2840,
"valid_targets_mean": 5220.5,
"valid_targets_min": 571
},
{
"epoch": 4.32370820668693,
"grad_norm": 0.5400136046572052,
"learning_rate": 1.5336620276042193e-05,
"loss": 0.1738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17823699116706848,
"step": 2845,
"valid_targets_mean": 4212.0,
"valid_targets_min": 156
},
{
"epoch": 4.331306990881459,
"grad_norm": 0.4689908498540122,
"learning_rate": 1.526295071703817e-05,
"loss": 0.1559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14596086740493774,
"step": 2850,
"valid_targets_mean": 4071.1,
"valid_targets_min": 842
},
{
"epoch": 4.338905775075988,
"grad_norm": 0.43293471403933603,
"learning_rate": 1.5189349187657665e-05,
"loss": 0.1746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1921626329421997,
"step": 2855,
"valid_targets_mean": 5745.9,
"valid_targets_min": 899
},
{
"epoch": 4.3465045592705165,
"grad_norm": 0.4470655930449328,
"learning_rate": 1.5115816744905596e-05,
"loss": 0.1616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.135872483253479,
"step": 2860,
"valid_targets_mean": 4759.4,
"valid_targets_min": 872
},
{
"epoch": 4.354103343465045,
"grad_norm": 0.5712823358033652,
"learning_rate": 1.504235444479469e-05,
"loss": 0.1648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20416559278964996,
"step": 2865,
"valid_targets_mean": 4337.3,
"valid_targets_min": 361
},
{
"epoch": 4.361702127659575,
"grad_norm": 0.4182532739028534,
"learning_rate": 1.4968963342330369e-05,
"loss": 0.1715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17232292890548706,
"step": 2870,
"valid_targets_mean": 5397.1,
"valid_targets_min": 1864
},
{
"epoch": 4.369300911854103,
"grad_norm": 0.4274336280548651,
"learning_rate": 1.4895644491495547e-05,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17278841137886047,
"step": 2875,
"valid_targets_mean": 5085.6,
"valid_targets_min": 758
},
{
"epoch": 4.376899696048632,
"grad_norm": 0.4542314839910377,
"learning_rate": 1.4822398945235545e-05,
"loss": 0.1539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15121108293533325,
"step": 2880,
"valid_targets_mean": 4447.8,
"valid_targets_min": 422
},
{
"epoch": 4.3844984802431615,
"grad_norm": 0.4154772615137915,
"learning_rate": 1.4749227755442927e-05,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1821514070034027,
"step": 2885,
"valid_targets_mean": 5593.2,
"valid_targets_min": 2877
},
{
"epoch": 4.39209726443769,
"grad_norm": 0.4559773456464244,
"learning_rate": 1.4676131972942416e-05,
"loss": 0.1633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16653896868228912,
"step": 2890,
"valid_targets_mean": 4738.8,
"valid_targets_min": 920
},
{
"epoch": 4.399696048632219,
"grad_norm": 0.41739506385968844,
"learning_rate": 1.4603112647475795e-05,
"loss": 0.1681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15362367033958435,
"step": 2895,
"valid_targets_mean": 5320.4,
"valid_targets_min": 552
},
{
"epoch": 4.407294832826747,
"grad_norm": 0.3845071167642644,
"learning_rate": 1.4530170827686831e-05,
"loss": 0.1633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13495799899101257,
"step": 2900,
"valid_targets_mean": 5222.8,
"valid_targets_min": 583
},
{
"epoch": 4.414893617021277,
"grad_norm": 0.44390729359629055,
"learning_rate": 1.4457307561106226e-05,
"loss": 0.1618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15813395380973816,
"step": 2905,
"valid_targets_mean": 4969.7,
"valid_targets_min": 776
},
{
"epoch": 4.422492401215806,
"grad_norm": 0.5018673994147254,
"learning_rate": 1.438452389413656e-05,
"loss": 0.174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15857061743736267,
"step": 2910,
"valid_targets_mean": 3932.9,
"valid_targets_min": 633
},
{
"epoch": 4.430091185410334,
"grad_norm": 0.4806146977648294,
"learning_rate": 1.4311820872037264e-05,
"loss": 0.1684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1731853187084198,
"step": 2915,
"valid_targets_mean": 4577.8,
"valid_targets_min": 328
},
{
"epoch": 4.437689969604863,
"grad_norm": 0.4617241179372537,
"learning_rate": 1.423919953890963e-05,
"loss": 0.1666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18794915080070496,
"step": 2920,
"valid_targets_mean": 5022.4,
"valid_targets_min": 629
},
{
"epoch": 4.445288753799392,
"grad_norm": 0.48939540976668194,
"learning_rate": 1.4166660937681771e-05,
"loss": 0.1658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17850425839424133,
"step": 2925,
"valid_targets_mean": 4809.8,
"valid_targets_min": 409
},
{
"epoch": 4.452887537993921,
"grad_norm": 0.4842928277510236,
"learning_rate": 1.4094206110093712e-05,
"loss": 0.1736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1715683937072754,
"step": 2930,
"valid_targets_mean": 4601.0,
"valid_targets_min": 1634
},
{
"epoch": 4.46048632218845,
"grad_norm": 0.4074913023031158,
"learning_rate": 1.4021836096682343e-05,
"loss": 0.1575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1516132950782776,
"step": 2935,
"valid_targets_mean": 5510.4,
"valid_targets_min": 778
},
{
"epoch": 4.468085106382979,
"grad_norm": 0.42946649016106,
"learning_rate": 1.394955193676657e-05,
"loss": 0.1594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16095909476280212,
"step": 2940,
"valid_targets_mean": 5310.4,
"valid_targets_min": 1020
},
{
"epoch": 4.475683890577508,
"grad_norm": 0.4385638298379317,
"learning_rate": 1.3877354668432297e-05,
"loss": 0.1606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15726953744888306,
"step": 2945,
"valid_targets_mean": 4561.4,
"valid_targets_min": 590
},
{
"epoch": 4.4832826747720365,
"grad_norm": 0.5193379752723524,
"learning_rate": 1.38052453285176e-05,
"loss": 0.1845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16541394591331482,
"step": 2950,
"valid_targets_mean": 3761.6,
"valid_targets_min": 561
},
{
"epoch": 4.490881458966565,
"grad_norm": 0.4490166063535176,
"learning_rate": 1.3733224952597764e-05,
"loss": 0.1583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1475997269153595,
"step": 2955,
"valid_targets_mean": 4226.3,
"valid_targets_min": 666
},
{
"epoch": 4.498480243161095,
"grad_norm": 0.5152090350550662,
"learning_rate": 1.3661294574970485e-05,
"loss": 0.1717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18321773409843445,
"step": 2960,
"valid_targets_mean": 4961.2,
"valid_targets_min": 602
},
{
"epoch": 4.506079027355623,
"grad_norm": 0.43396945945061266,
"learning_rate": 1.3589455228640938e-05,
"loss": 0.1754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17606866359710693,
"step": 2965,
"valid_targets_mean": 5181.6,
"valid_targets_min": 1460
},
{
"epoch": 4.513677811550152,
"grad_norm": 0.4690277765034569,
"learning_rate": 1.3517707945307013e-05,
"loss": 0.1655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18834683299064636,
"step": 2970,
"valid_targets_mean": 4646.1,
"valid_targets_min": 953
},
{
"epoch": 4.5212765957446805,
"grad_norm": 0.5066167184858231,
"learning_rate": 1.3446053755344439e-05,
"loss": 0.172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15756574273109436,
"step": 2975,
"valid_targets_mean": 4516.5,
"valid_targets_min": 844
},
{
"epoch": 4.52887537993921,
"grad_norm": 0.5134300889609936,
"learning_rate": 1.3374493687792045e-05,
"loss": 0.1675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19803106784820557,
"step": 2980,
"valid_targets_mean": 4092.7,
"valid_targets_min": 719
},
{
"epoch": 4.536474164133739,
"grad_norm": 0.4463665768466012,
"learning_rate": 1.3303028770336914e-05,
"loss": 0.1685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1606081873178482,
"step": 2985,
"valid_targets_mean": 4620.2,
"valid_targets_min": 714
},
{
"epoch": 4.544072948328267,
"grad_norm": 0.4159202471735973,
"learning_rate": 1.3231660029299703e-05,
"loss": 0.1536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16770178079605103,
"step": 2990,
"valid_targets_mean": 5974.0,
"valid_targets_min": 1221
},
{
"epoch": 4.551671732522796,
"grad_norm": 0.4174566017417907,
"learning_rate": 1.316038848961982e-05,
"loss": 0.1715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16645801067352295,
"step": 2995,
"valid_targets_mean": 5945.2,
"valid_targets_min": 1900
},
{
"epoch": 4.5592705167173255,
"grad_norm": 0.41700946512428255,
"learning_rate": 1.3089215174840783e-05,
"loss": 0.1569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15380007028579712,
"step": 3000,
"valid_targets_mean": 5489.1,
"valid_targets_min": 894
},
{
"epoch": 4.566869300911854,
"grad_norm": 0.5304865164006446,
"learning_rate": 1.3018141107095455e-05,
"loss": 0.1625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16447263956069946,
"step": 3005,
"valid_targets_mean": 3494.4,
"valid_targets_min": 491
},
{
"epoch": 4.574468085106383,
"grad_norm": 0.48520946915581575,
"learning_rate": 1.2947167307091424e-05,
"loss": 0.1534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15445218980312347,
"step": 3010,
"valid_targets_mean": 4516.8,
"valid_targets_min": 664
},
{
"epoch": 4.5820668693009114,
"grad_norm": 0.47660891700948743,
"learning_rate": 1.287629479409628e-05,
"loss": 0.154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15592724084854126,
"step": 3015,
"valid_targets_mean": 4057.2,
"valid_targets_min": 905
},
{
"epoch": 4.589665653495441,
"grad_norm": 0.41867433836985307,
"learning_rate": 1.2805524585923048e-05,
"loss": 0.1577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1499272882938385,
"step": 3020,
"valid_targets_mean": 4869.1,
"valid_targets_min": 501
},
{
"epoch": 4.59726443768997,
"grad_norm": 0.40048802671676303,
"learning_rate": 1.2734857698915502e-05,
"loss": 0.1615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13745658099651337,
"step": 3025,
"valid_targets_mean": 5079.4,
"valid_targets_min": 1254
},
{
"epoch": 4.604863221884498,
"grad_norm": 0.4149531859078102,
"learning_rate": 1.266429514793363e-05,
"loss": 0.1555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15537427365779877,
"step": 3030,
"valid_targets_mean": 5211.1,
"valid_targets_min": 861
},
{
"epoch": 4.612462006079028,
"grad_norm": 0.6490039513363777,
"learning_rate": 1.2593837946339008e-05,
"loss": 0.1618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18460866808891296,
"step": 3035,
"valid_targets_mean": 4625.2,
"valid_targets_min": 918
},
{
"epoch": 4.620060790273556,
"grad_norm": 0.4992835453594247,
"learning_rate": 1.252348710598029e-05,
"loss": 0.1736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.167076975107193,
"step": 3040,
"valid_targets_mean": 4100.6,
"valid_targets_min": 432
},
{
"epoch": 4.627659574468085,
"grad_norm": 0.4615786144106656,
"learning_rate": 1.245324363717864e-05,
"loss": 0.169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16426023840904236,
"step": 3045,
"valid_targets_mean": 4565.8,
"valid_targets_min": 828
},
{
"epoch": 4.635258358662614,
"grad_norm": 0.41965629757500533,
"learning_rate": 1.2383108548713254e-05,
"loss": 0.1669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1467415690422058,
"step": 3050,
"valid_targets_mean": 5088.9,
"valid_targets_min": 1159
},
{
"epoch": 4.642857142857143,
"grad_norm": 0.4441828730212559,
"learning_rate": 1.2313082847806852e-05,
"loss": 0.1776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1823854148387909,
"step": 3055,
"valid_targets_mean": 4715.0,
"valid_targets_min": 741
},
{
"epoch": 4.650455927051672,
"grad_norm": 0.459237281832204,
"learning_rate": 1.2243167540111216e-05,
"loss": 0.1831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14467957615852356,
"step": 3060,
"valid_targets_mean": 3859.3,
"valid_targets_min": 673
},
{
"epoch": 4.6580547112462005,
"grad_norm": 0.4946697227727552,
"learning_rate": 1.2173363629692756e-05,
"loss": 0.1732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19268517196178436,
"step": 3065,
"valid_targets_mean": 3953.9,
"valid_targets_min": 931
},
{
"epoch": 4.665653495440729,
"grad_norm": 0.43385480300907053,
"learning_rate": 1.2103672119018086e-05,
"loss": 0.1481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15391963720321655,
"step": 3070,
"valid_targets_mean": 4950.1,
"valid_targets_min": 1644
},
{
"epoch": 4.673252279635259,
"grad_norm": 0.47954284812840575,
"learning_rate": 1.2034094008939624e-05,
"loss": 0.1781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19548840820789337,
"step": 3075,
"valid_targets_mean": 5021.8,
"valid_targets_min": 774
},
{
"epoch": 4.680851063829787,
"grad_norm": 0.4636621474235311,
"learning_rate": 1.1964630298681221e-05,
"loss": 0.1679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14948098361492157,
"step": 3080,
"valid_targets_mean": 3846.4,
"valid_targets_min": 940
},
{
"epoch": 4.688449848024316,
"grad_norm": 1.0079316283200346,
"learning_rate": 1.1895281985823815e-05,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1952032595872879,
"step": 3085,
"valid_targets_mean": 3557.1,
"valid_targets_min": 570
},
{
"epoch": 4.696048632218845,
"grad_norm": 0.4689910480215768,
"learning_rate": 1.1826050066291097e-05,
"loss": 0.1685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16652071475982666,
"step": 3090,
"valid_targets_mean": 4480.4,
"valid_targets_min": 728
},
{
"epoch": 4.703647416413374,
"grad_norm": 0.451296162182404,
"learning_rate": 1.1756935534335212e-05,
"loss": 0.1625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13410750031471252,
"step": 3095,
"valid_targets_mean": 4405.3,
"valid_targets_min": 1325
},
{
"epoch": 4.711246200607903,
"grad_norm": 0.42448672661829445,
"learning_rate": 1.1687939382522493e-05,
"loss": 0.1619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1605660319328308,
"step": 3100,
"valid_targets_mean": 4885.4,
"valid_targets_min": 1135
},
{
"epoch": 4.718844984802431,
"grad_norm": 0.4707749031713044,
"learning_rate": 1.1619062601719171e-05,
"loss": 0.1609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1604931652545929,
"step": 3105,
"valid_targets_mean": 4170.2,
"valid_targets_min": 857
},
{
"epoch": 4.72644376899696,
"grad_norm": 0.4670653605297488,
"learning_rate": 1.15503061810772e-05,
"loss": 0.1665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16604188084602356,
"step": 3110,
"valid_targets_mean": 5626.7,
"valid_targets_min": 414
},
{
"epoch": 4.73404255319149,
"grad_norm": 0.4609235488117921,
"learning_rate": 1.1481671108019984e-05,
"loss": 0.1752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23836404085159302,
"step": 3115,
"valid_targets_mean": 5899.8,
"valid_targets_min": 543
},
{
"epoch": 4.741641337386018,
"grad_norm": 0.46042215360634425,
"learning_rate": 1.1413158368228249e-05,
"loss": 0.1571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.163685142993927,
"step": 3120,
"valid_targets_mean": 4402.4,
"valid_targets_min": 512
},
{
"epoch": 4.749240121580547,
"grad_norm": 0.5338506865095787,
"learning_rate": 1.1344768945625884e-05,
"loss": 0.1723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1888251006603241,
"step": 3125,
"valid_targets_mean": 4155.4,
"valid_targets_min": 537
},
{
"epoch": 4.756838905775076,
"grad_norm": 0.40137648604950027,
"learning_rate": 1.127650382236578e-05,
"loss": 0.1618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14810852706432343,
"step": 3130,
"valid_targets_mean": 5314.3,
"valid_targets_min": 354
},
{
"epoch": 4.764437689969605,
"grad_norm": 0.5240009462617735,
"learning_rate": 1.1208363978815746e-05,
"loss": 0.1679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18549123406410217,
"step": 3135,
"valid_targets_mean": 4340.2,
"valid_targets_min": 593
},
{
"epoch": 4.772036474164134,
"grad_norm": 0.43622202592017323,
"learning_rate": 1.1140350393544422e-05,
"loss": 0.1593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15057966113090515,
"step": 3140,
"valid_targets_mean": 4826.1,
"valid_targets_min": 794
},
{
"epoch": 4.779635258358662,
"grad_norm": 0.46748847050986225,
"learning_rate": 1.1072464043307259e-05,
"loss": 0.1647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20890364050865173,
"step": 3145,
"valid_targets_mean": 4810.9,
"valid_targets_min": 434
},
{
"epoch": 4.787234042553192,
"grad_norm": 0.4709284580160048,
"learning_rate": 1.1004705903032406e-05,
"loss": 0.1661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17572824656963348,
"step": 3150,
"valid_targets_mean": 4275.6,
"valid_targets_min": 787
},
{
"epoch": 4.7948328267477205,
"grad_norm": 0.4947193520586711,
"learning_rate": 1.0937076945806837e-05,
"loss": 0.1567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1653721183538437,
"step": 3155,
"valid_targets_mean": 3996.0,
"valid_targets_min": 608
},
{
"epoch": 4.802431610942249,
"grad_norm": 0.95424384071522,
"learning_rate": 1.0869578142862228e-05,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15056976675987244,
"step": 3160,
"valid_targets_mean": 5264.1,
"valid_targets_min": 911
},
{
"epoch": 4.810030395136778,
"grad_norm": 0.436658942790459,
"learning_rate": 1.0802210463561166e-05,
"loss": 0.1709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15242451429367065,
"step": 3165,
"valid_targets_mean": 4430.6,
"valid_targets_min": 1307
},
{
"epoch": 4.817629179331307,
"grad_norm": 0.4940935042193495,
"learning_rate": 1.0734974875383066e-05,
"loss": 0.1646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15941178798675537,
"step": 3170,
"valid_targets_mean": 3658.3,
"valid_targets_min": 640
},
{
"epoch": 4.825227963525836,
"grad_norm": 0.5857976461421992,
"learning_rate": 1.0667872343910432e-05,
"loss": 0.1681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16998814046382904,
"step": 3175,
"valid_targets_mean": 4214.1,
"valid_targets_min": 619
},
{
"epoch": 4.832826747720365,
"grad_norm": 0.447470023536544,
"learning_rate": 1.0600903832814856e-05,
"loss": 0.1525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16528019309043884,
"step": 3180,
"valid_targets_mean": 4406.2,
"valid_targets_min": 774
},
{
"epoch": 4.840425531914894,
"grad_norm": 0.45582176893752013,
"learning_rate": 1.0534070303843294e-05,
"loss": 0.1619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16366976499557495,
"step": 3185,
"valid_targets_mean": 4874.4,
"valid_targets_min": 531
},
{
"epoch": 4.848024316109423,
"grad_norm": 0.491211928315914,
"learning_rate": 1.0467372716804141e-05,
"loss": 0.18,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18734398484230042,
"step": 3190,
"valid_targets_mean": 4573.7,
"valid_targets_min": 655
},
{
"epoch": 4.855623100303951,
"grad_norm": 0.5889214979063572,
"learning_rate": 1.0400812029553569e-05,
"loss": 0.1707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18033604323863983,
"step": 3195,
"valid_targets_mean": 3925.6,
"valid_targets_min": 545
},
{
"epoch": 4.86322188449848,
"grad_norm": 0.4334778399672226,
"learning_rate": 1.0334389197981638e-05,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14970465004444122,
"step": 3200,
"valid_targets_mean": 4557.2,
"valid_targets_min": 736
},
{
"epoch": 4.870820668693009,
"grad_norm": 0.5178203832731765,
"learning_rate": 1.0268105175998713e-05,
"loss": 0.1667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16531500220298767,
"step": 3205,
"valid_targets_mean": 3934.7,
"valid_targets_min": 616
},
{
"epoch": 4.878419452887538,
"grad_norm": 0.4677336984690735,
"learning_rate": 1.0201960915521614e-05,
"loss": 0.1832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15597450733184814,
"step": 3210,
"valid_targets_mean": 4830.2,
"valid_targets_min": 631
},
{
"epoch": 4.886018237082067,
"grad_norm": 0.4582200792232965,
"learning_rate": 1.0135957366460087e-05,
"loss": 0.1608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14683008193969727,
"step": 3215,
"valid_targets_mean": 4210.8,
"valid_targets_min": 1151
},
{
"epoch": 4.8936170212765955,
"grad_norm": 2.6017818537468114,
"learning_rate": 1.0070095476703036e-05,
"loss": 0.1694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17961879074573517,
"step": 3220,
"valid_targets_mean": 4255.6,
"valid_targets_min": 544
},
{
"epoch": 4.901215805471125,
"grad_norm": 0.48429935318886524,
"learning_rate": 1.0004376192105032e-05,
"loss": 0.1751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1917518824338913,
"step": 3225,
"valid_targets_mean": 4164.9,
"valid_targets_min": 683
},
{
"epoch": 4.908814589665654,
"grad_norm": 0.408755975822661,
"learning_rate": 9.938800456472603e-06,
"loss": 0.1578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15598323941230774,
"step": 3230,
"valid_targets_mean": 5235.6,
"valid_targets_min": 673
},
{
"epoch": 4.916413373860182,
"grad_norm": 0.5687286004991109,
"learning_rate": 9.87336921155081e-06,
"loss": 0.1596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1737002432346344,
"step": 3235,
"valid_targets_mean": 4874.2,
"valid_targets_min": 648
},
{
"epoch": 4.924012158054711,
"grad_norm": 0.4449749826597429,
"learning_rate": 9.80808339700959e-06,
"loss": 0.1652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18869557976722717,
"step": 3240,
"valid_targets_mean": 5077.7,
"valid_targets_min": 778
},
{
"epoch": 4.9316109422492405,
"grad_norm": 0.43592967879817196,
"learning_rate": 9.74294395043039e-06,
"loss": 0.1634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16350185871124268,
"step": 3245,
"valid_targets_mean": 4365.2,
"valid_targets_min": 579
},
{
"epoch": 4.939209726443769,
"grad_norm": 0.44671726836927617,
"learning_rate": 9.677951807292584e-06,
"loss": 0.1554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1710178405046463,
"step": 3250,
"valid_targets_mean": 4973.2,
"valid_targets_min": 456
},
{
"epoch": 4.946808510638298,
"grad_norm": 0.4273982901555888,
"learning_rate": 9.61310790096015e-06,
"loss": 0.1588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13666585087776184,
"step": 3255,
"valid_targets_mean": 4339.3,
"valid_targets_min": 970
},
{
"epoch": 4.954407294832826,
"grad_norm": 0.4111092281316594,
"learning_rate": 9.548413162668155e-06,
"loss": 0.1578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13993242383003235,
"step": 3260,
"valid_targets_mean": 5151.4,
"valid_targets_min": 1606
},
{
"epoch": 4.962006079027356,
"grad_norm": 0.4678973949276577,
"learning_rate": 9.483868521509492e-06,
"loss": 0.1565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17497044801712036,
"step": 3265,
"valid_targets_mean": 4569.8,
"valid_targets_min": 507
},
{
"epoch": 4.9696048632218845,
"grad_norm": 0.48923608505182986,
"learning_rate": 9.419474904421422e-06,
"loss": 0.161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17405647039413452,
"step": 3270,
"valid_targets_mean": 4378.5,
"valid_targets_min": 646
},
{
"epoch": 4.977203647416413,
"grad_norm": 0.42080134203036884,
"learning_rate": 9.355233236172381e-06,
"loss": 0.1507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14896854758262634,
"step": 3275,
"valid_targets_mean": 4978.7,
"valid_targets_min": 1936
},
{
"epoch": 4.984802431610943,
"grad_norm": 0.45247817713087146,
"learning_rate": 9.2911444393486e-06,
"loss": 0.1697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14354351162910461,
"step": 3280,
"valid_targets_mean": 5089.9,
"valid_targets_min": 754
},
{
"epoch": 4.992401215805471,
"grad_norm": 0.4892191547497894,
"learning_rate": 9.227209434340914e-06,
"loss": 0.1628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1533418595790863,
"step": 3285,
"valid_targets_mean": 4154.1,
"valid_targets_min": 434
},
{
"epoch": 5.0,
"grad_norm": 0.4367103289579237,
"learning_rate": 9.163429139331516e-06,
"loss": 0.1656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1589938849210739,
"step": 3290,
"valid_targets_mean": 4928.7,
"valid_targets_min": 567
},
{
"epoch": 5.007598784194529,
"grad_norm": 0.5506166462705645,
"learning_rate": 9.099804470280791e-06,
"loss": 0.1619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1861366331577301,
"step": 3295,
"valid_targets_mean": 3553.4,
"valid_targets_min": 519
},
{
"epoch": 5.015197568389058,
"grad_norm": 0.44365514163643444,
"learning_rate": 9.036336340914138e-06,
"loss": 0.1662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18212465941905975,
"step": 3300,
"valid_targets_mean": 4840.4,
"valid_targets_min": 465
},
{
"epoch": 5.022796352583587,
"grad_norm": 0.5002686598117616,
"learning_rate": 8.973025662708875e-06,
"loss": 0.1501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16633297502994537,
"step": 3305,
"valid_targets_mean": 5309.5,
"valid_targets_min": 834
},
{
"epoch": 5.0303951367781155,
"grad_norm": 0.5141187748402867,
"learning_rate": 8.909873344881125e-06,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1726076900959015,
"step": 3310,
"valid_targets_mean": 4149.5,
"valid_targets_min": 1217
},
{
"epoch": 5.037993920972644,
"grad_norm": 0.42838999609845296,
"learning_rate": 8.846880294372777e-06,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1435108482837677,
"step": 3315,
"valid_targets_mean": 5703.1,
"valid_targets_min": 781
},
{
"epoch": 5.045592705167174,
"grad_norm": 0.4990807265797361,
"learning_rate": 8.784047415838446e-06,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15767478942871094,
"step": 3320,
"valid_targets_mean": 4732.1,
"valid_targets_min": 998
},
{
"epoch": 5.053191489361702,
"grad_norm": 0.4244905713932716,
"learning_rate": 8.721375611632494e-06,
"loss": 0.1497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15482358634471893,
"step": 3325,
"valid_targets_mean": 5283.4,
"valid_targets_min": 977
},
{
"epoch": 5.060790273556231,
"grad_norm": 0.5268949634896493,
"learning_rate": 8.658865781796059e-06,
"loss": 0.1534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16202573478221893,
"step": 3330,
"valid_targets_mean": 4009.4,
"valid_targets_min": 736
},
{
"epoch": 5.0683890577507595,
"grad_norm": 0.5222959380611226,
"learning_rate": 8.596518824044145e-06,
"loss": 0.1628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1700512319803238,
"step": 3335,
"valid_targets_mean": 4815.2,
"valid_targets_min": 1896
},
{
"epoch": 5.075987841945289,
"grad_norm": 0.48817810574292153,
"learning_rate": 8.53433563375271e-06,
"loss": 0.1583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15692004561424255,
"step": 3340,
"valid_targets_mean": 5081.4,
"valid_targets_min": 604
},
{
"epoch": 5.083586626139818,
"grad_norm": 0.5145519787891805,
"learning_rate": 8.472317103945827e-06,
"loss": 0.1554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15433713793754578,
"step": 3345,
"valid_targets_mean": 4923.5,
"valid_targets_min": 664
},
{
"epoch": 5.091185410334346,
"grad_norm": 0.49860669438741656,
"learning_rate": 8.410464125282842e-06,
"loss": 0.1597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18030579388141632,
"step": 3350,
"valid_targets_mean": 4054.4,
"valid_targets_min": 849
},
{
"epoch": 5.098784194528875,
"grad_norm": 0.4977104637629043,
"learning_rate": 8.348777586045599e-06,
"loss": 0.1591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16232091188430786,
"step": 3355,
"valid_targets_mean": 4112.1,
"valid_targets_min": 342
},
{
"epoch": 5.1063829787234045,
"grad_norm": 0.40792452628529047,
"learning_rate": 8.287258372125666e-06,
"loss": 0.1496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14980870485305786,
"step": 3360,
"valid_targets_mean": 5441.6,
"valid_targets_min": 828
},
{
"epoch": 5.113981762917933,
"grad_norm": 0.48624828153735117,
"learning_rate": 8.22590736701163e-06,
"loss": 0.1599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15524911880493164,
"step": 3365,
"valid_targets_mean": 4029.7,
"valid_targets_min": 527
},
{
"epoch": 5.121580547112462,
"grad_norm": 0.41260477481757823,
"learning_rate": 8.164725451776396e-06,
"loss": 0.139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11952009797096252,
"step": 3370,
"valid_targets_mean": 5127.4,
"valid_targets_min": 1259
},
{
"epoch": 5.129179331306991,
"grad_norm": 0.5121037283737604,
"learning_rate": 8.103713505064542e-06,
"loss": 0.147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13970546424388885,
"step": 3375,
"valid_targets_mean": 5086.4,
"valid_targets_min": 447
},
{
"epoch": 5.13677811550152,
"grad_norm": 0.554785879889902,
"learning_rate": 8.042872403079695e-06,
"loss": 0.1718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17848604917526245,
"step": 3380,
"valid_targets_mean": 4835.1,
"valid_targets_min": 229
},
{
"epoch": 5.144376899696049,
"grad_norm": 0.4543169082658653,
"learning_rate": 7.982203019571951e-06,
"loss": 0.1633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15885761380195618,
"step": 3385,
"valid_targets_mean": 4715.2,
"valid_targets_min": 614
},
{
"epoch": 5.151975683890577,
"grad_norm": 0.49519076224489234,
"learning_rate": 7.921706225825323e-06,
"loss": 0.1553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14728990197181702,
"step": 3390,
"valid_targets_mean": 4132.9,
"valid_targets_min": 705
},
{
"epoch": 5.159574468085107,
"grad_norm": 0.4692483655123735,
"learning_rate": 7.861382890645235e-06,
"loss": 0.1666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1677330732345581,
"step": 3395,
"valid_targets_mean": 4542.6,
"valid_targets_min": 571
},
{
"epoch": 5.167173252279635,
"grad_norm": 0.4981198573213941,
"learning_rate": 7.801233880346044e-06,
"loss": 0.1537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.152068629860878,
"step": 3400,
"valid_targets_mean": 4878.0,
"valid_targets_min": 1568
},
{
"epoch": 5.174772036474164,
"grad_norm": 0.496973792548942,
"learning_rate": 7.741260058738576e-06,
"loss": 0.1678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1845749020576477,
"step": 3405,
"valid_targets_mean": 4564.4,
"valid_targets_min": 333
},
{
"epoch": 5.182370820668693,
"grad_norm": 0.4801400629594902,
"learning_rate": 7.681462287117769e-06,
"loss": 0.1599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15920531749725342,
"step": 3410,
"valid_targets_mean": 4416.2,
"valid_targets_min": 618
},
{
"epoch": 5.189969604863222,
"grad_norm": 0.44717438624237565,
"learning_rate": 7.62184142425026e-06,
"loss": 0.1586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14159642159938812,
"step": 3415,
"valid_targets_mean": 5296.9,
"valid_targets_min": 1679
},
{
"epoch": 5.197568389057751,
"grad_norm": 0.5694531326181947,
"learning_rate": 7.562398326362068e-06,
"loss": 0.1603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1987701654434204,
"step": 3420,
"valid_targets_mean": 4228.2,
"valid_targets_min": 500
},
{
"epoch": 5.2051671732522795,
"grad_norm": 0.4837511107077152,
"learning_rate": 7.503133847126298e-06,
"loss": 0.1446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14547014236450195,
"step": 3425,
"valid_targets_mean": 4541.6,
"valid_targets_min": 537
},
{
"epoch": 5.212765957446808,
"grad_norm": 0.46751291957082003,
"learning_rate": 7.444048837650879e-06,
"loss": 0.1547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1482163369655609,
"step": 3430,
"valid_targets_mean": 4358.3,
"valid_targets_min": 464
},
{
"epoch": 5.220364741641338,
"grad_norm": 0.48046465195883326,
"learning_rate": 7.3851441464663455e-06,
"loss": 0.1505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15912845730781555,
"step": 3435,
"valid_targets_mean": 4258.4,
"valid_targets_min": 1734
},
{
"epoch": 5.227963525835866,
"grad_norm": 0.5201595463216373,
"learning_rate": 7.326420619513645e-06,
"loss": 0.144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14452405273914337,
"step": 3440,
"valid_targets_mean": 4945.8,
"valid_targets_min": 2273
},
{
"epoch": 5.235562310030395,
"grad_norm": 0.4662188330800987,
"learning_rate": 7.267879100131996e-06,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16573692858219147,
"step": 3445,
"valid_targets_mean": 5350.9,
"valid_targets_min": 1272
},
{
"epoch": 5.243161094224924,
"grad_norm": 0.5445679437490333,
"learning_rate": 7.209520429046768e-06,
"loss": 0.1508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14232224225997925,
"step": 3450,
"valid_targets_mean": 3531.5,
"valid_targets_min": 756
},
{
"epoch": 5.250759878419453,
"grad_norm": 0.48341944333718034,
"learning_rate": 7.151345444357418e-06,
"loss": 0.1778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15717411041259766,
"step": 3455,
"valid_targets_mean": 4357.9,
"valid_targets_min": 410
},
{
"epoch": 5.258358662613982,
"grad_norm": 0.46774893892784875,
"learning_rate": 7.0933549815254465e-06,
"loss": 0.1592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16652044653892517,
"step": 3460,
"valid_targets_mean": 5190.8,
"valid_targets_min": 433
},
{
"epoch": 5.26595744680851,
"grad_norm": 0.47602862093431514,
"learning_rate": 7.035549873362406e-06,
"loss": 0.1648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14074617624282837,
"step": 3465,
"valid_targets_mean": 4641.2,
"valid_targets_min": 1537
},
{
"epoch": 5.27355623100304,
"grad_norm": 0.49943887077257887,
"learning_rate": 6.97793095001793e-06,
"loss": 0.1609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15125201642513275,
"step": 3470,
"valid_targets_mean": 4864.9,
"valid_targets_min": 754
},
{
"epoch": 5.281155015197569,
"grad_norm": 0.56912423597624,
"learning_rate": 6.920499038967825e-06,
"loss": 0.1524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1387101113796234,
"step": 3475,
"valid_targets_mean": 4497.3,
"valid_targets_min": 780
},
{
"epoch": 5.288753799392097,
"grad_norm": 0.6031298612179781,
"learning_rate": 6.863254965002178e-06,
"loss": 0.1563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17738491296768188,
"step": 3480,
"valid_targets_mean": 2821.3,
"valid_targets_min": 271
},
{
"epoch": 5.296352583586626,
"grad_norm": 0.42528213654923797,
"learning_rate": 6.80619955021351e-06,
"loss": 0.1575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13962329924106598,
"step": 3485,
"valid_targets_mean": 5226.1,
"valid_targets_min": 1805
},
{
"epoch": 5.303951367781155,
"grad_norm": 0.4641682316415047,
"learning_rate": 6.749333613984979e-06,
"loss": 0.1638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17883500456809998,
"step": 3490,
"valid_targets_mean": 5505.0,
"valid_targets_min": 2227
},
{
"epoch": 5.311550151975684,
"grad_norm": 0.41287597531580333,
"learning_rate": 6.6926579729786025e-06,
"loss": 0.1569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13076046109199524,
"step": 3495,
"valid_targets_mean": 5253.1,
"valid_targets_min": 624
},
{
"epoch": 5.319148936170213,
"grad_norm": 0.47804228992277803,
"learning_rate": 6.636173441123537e-06,
"loss": 0.1507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13578727841377258,
"step": 3500,
"valid_targets_mean": 4141.2,
"valid_targets_min": 974
},
{
"epoch": 5.326747720364741,
"grad_norm": 0.6043580771376642,
"learning_rate": 6.5798808296043835e-06,
"loss": 0.1569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1580887734889984,
"step": 3505,
"valid_targets_mean": 3810.6,
"valid_targets_min": 769
},
{
"epoch": 5.334346504559271,
"grad_norm": 0.5078101575478104,
"learning_rate": 6.52378094684954e-06,
"loss": 0.1674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17107361555099487,
"step": 3510,
"valid_targets_mean": 3934.2,
"valid_targets_min": 280
},
{
"epoch": 5.3419452887537995,
"grad_norm": 0.4141414829732433,
"learning_rate": 6.467874598519597e-06,
"loss": 0.1603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14241334795951843,
"step": 3515,
"valid_targets_mean": 5362.5,
"valid_targets_min": 2329
},
{
"epoch": 5.349544072948328,
"grad_norm": 0.4458140032344141,
"learning_rate": 6.412162587495754e-06,
"loss": 0.1719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13986560702323914,
"step": 3520,
"valid_targets_mean": 4640.0,
"valid_targets_min": 593
},
{
"epoch": 5.357142857142857,
"grad_norm": 0.49980298962190683,
"learning_rate": 6.3566457138683015e-06,
"loss": 0.1519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1622404009103775,
"step": 3525,
"valid_targets_mean": 4144.8,
"valid_targets_min": 523
},
{
"epoch": 5.364741641337386,
"grad_norm": 0.5309190846014655,
"learning_rate": 6.301324774925128e-06,
"loss": 0.1449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1419864147901535,
"step": 3530,
"valid_targets_mean": 4773.5,
"valid_targets_min": 601
},
{
"epoch": 5.372340425531915,
"grad_norm": 0.4394509557877868,
"learning_rate": 6.246200565140266e-06,
"loss": 0.1382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1346133053302765,
"step": 3535,
"valid_targets_mean": 5314.5,
"valid_targets_min": 1831
},
{
"epoch": 5.379939209726444,
"grad_norm": 0.6157551616826415,
"learning_rate": 6.191273876162487e-06,
"loss": 0.1559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16742759943008423,
"step": 3540,
"valid_targets_mean": 4461.9,
"valid_targets_min": 632
},
{
"epoch": 5.387537993920972,
"grad_norm": 0.5207893779334158,
"learning_rate": 6.136545496803925e-06,
"loss": 0.1576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.173904150724411,
"step": 3545,
"valid_targets_mean": 4806.9,
"valid_targets_min": 816
},
{
"epoch": 5.395136778115502,
"grad_norm": 0.41444365615563894,
"learning_rate": 6.082016213028761e-06,
"loss": 0.1605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14027008414268494,
"step": 3550,
"valid_targets_mean": 5664.4,
"valid_targets_min": 840
},
{
"epoch": 5.40273556231003,
"grad_norm": 0.4453222293778615,
"learning_rate": 6.0276868079419235e-06,
"loss": 0.1496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1503615528345108,
"step": 3555,
"valid_targets_mean": 5143.4,
"valid_targets_min": 979
},
{
"epoch": 5.410334346504559,
"grad_norm": 0.4781236892192554,
"learning_rate": 5.973558061777849e-06,
"loss": 0.1529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15819337964057922,
"step": 3560,
"valid_targets_mean": 5053.2,
"valid_targets_min": 664
},
{
"epoch": 5.4179331306990886,
"grad_norm": 0.41198950921824895,
"learning_rate": 5.919630751889274e-06,
"loss": 0.1599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13387863337993622,
"step": 3565,
"valid_targets_mean": 5390.4,
"valid_targets_min": 1116
},
{
"epoch": 5.425531914893617,
"grad_norm": 0.516010838368697,
"learning_rate": 5.865905652736072e-06,
"loss": 0.1584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17436817288398743,
"step": 3570,
"valid_targets_mean": 4064.7,
"valid_targets_min": 894
},
{
"epoch": 5.433130699088146,
"grad_norm": 0.5141562761832758,
"learning_rate": 5.812383535874131e-06,
"loss": 0.1428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13484925031661987,
"step": 3575,
"valid_targets_mean": 3949.4,
"valid_targets_min": 1312
},
{
"epoch": 5.4407294832826745,
"grad_norm": 0.45662210514471807,
"learning_rate": 5.759065169944274e-06,
"loss": 0.1434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1350744068622589,
"step": 3580,
"valid_targets_mean": 4565.4,
"valid_targets_min": 381
},
{
"epoch": 5.448328267477204,
"grad_norm": 0.49698187827992,
"learning_rate": 5.705951320661222e-06,
"loss": 0.1411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14174014329910278,
"step": 3585,
"valid_targets_mean": 4722.2,
"valid_targets_min": 2183
},
{
"epoch": 5.455927051671733,
"grad_norm": 0.45234338868163015,
"learning_rate": 5.653042750802591e-06,
"loss": 0.1678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14616911113262177,
"step": 3590,
"valid_targets_mean": 4943.4,
"valid_targets_min": 1261
},
{
"epoch": 5.463525835866261,
"grad_norm": 0.4806481881918089,
"learning_rate": 5.600340220197946e-06,
"loss": 0.1523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17162683606147766,
"step": 3595,
"valid_targets_mean": 4331.8,
"valid_targets_min": 414
},
{
"epoch": 5.47112462006079,
"grad_norm": 0.46035606110531224,
"learning_rate": 5.547844485717884e-06,
"loss": 0.1479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14485681056976318,
"step": 3600,
"valid_targets_mean": 4167.1,
"valid_targets_min": 1119
},
{
"epoch": 5.4787234042553195,
"grad_norm": 0.4684818904402137,
"learning_rate": 5.4955563012631606e-06,
"loss": 0.1449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14429020881652832,
"step": 3605,
"valid_targets_mean": 5013.6,
"valid_targets_min": 1788
},
{
"epoch": 5.486322188449848,
"grad_norm": 0.6076128140539062,
"learning_rate": 5.443476417753877e-06,
"loss": 0.1681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17048346996307373,
"step": 3610,
"valid_targets_mean": 2878.3,
"valid_targets_min": 491
},
{
"epoch": 5.493920972644377,
"grad_norm": 0.46825002881973943,
"learning_rate": 5.39160558311868e-06,
"loss": 0.1569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17676037549972534,
"step": 3615,
"valid_targets_mean": 4354.2,
"valid_targets_min": 646
},
{
"epoch": 5.501519756838906,
"grad_norm": 0.49007855328228217,
"learning_rate": 5.33994454228403e-06,
"loss": 0.1608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17580349743366241,
"step": 3620,
"valid_targets_mean": 5169.6,
"valid_targets_min": 953
},
{
"epoch": 5.509118541033435,
"grad_norm": 0.44768382223068853,
"learning_rate": 5.2884940371634915e-06,
"loss": 0.1533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14162276685237885,
"step": 3625,
"valid_targets_mean": 5179.9,
"valid_targets_min": 1051
},
{
"epoch": 5.5167173252279635,
"grad_norm": 0.4352121315996926,
"learning_rate": 5.237254806647117e-06,
"loss": 0.1508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1292266994714737,
"step": 3630,
"valid_targets_mean": 4936.1,
"valid_targets_min": 912
},
{
"epoch": 5.524316109422492,
"grad_norm": 0.5433474427694438,
"learning_rate": 5.1862275865907575e-06,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1526874601840973,
"step": 3635,
"valid_targets_mean": 3939.9,
"valid_targets_min": 1082
},
{
"epoch": 5.531914893617021,
"grad_norm": 0.4664875248042157,
"learning_rate": 5.135413109805596e-06,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14586284756660461,
"step": 3640,
"valid_targets_mean": 4819.6,
"valid_targets_min": 1708
},
{
"epoch": 5.53951367781155,
"grad_norm": 0.4479408250207293,
"learning_rate": 5.084812106047525e-06,
"loss": 0.1325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13202941417694092,
"step": 3645,
"valid_targets_mean": 5479.3,
"valid_targets_min": 1475
},
{
"epoch": 5.547112462006079,
"grad_norm": 0.46875681135292097,
"learning_rate": 5.034425302006751e-06,
"loss": 0.1482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15239191055297852,
"step": 3650,
"valid_targets_mean": 4168.7,
"valid_targets_min": 534
},
{
"epoch": 5.554711246200608,
"grad_norm": 0.5099225903083285,
"learning_rate": 4.984253421297285e-06,
"loss": 0.1634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15130409598350525,
"step": 3655,
"valid_targets_mean": 3672.7,
"valid_targets_min": 465
},
{
"epoch": 5.562310030395137,
"grad_norm": 0.44549612335892824,
"learning_rate": 4.934297184446617e-06,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15832307934761047,
"step": 3660,
"valid_targets_mean": 5213.5,
"valid_targets_min": 1002
},
{
"epoch": 5.569908814589666,
"grad_norm": 0.5093597450581251,
"learning_rate": 4.884557308885302e-06,
"loss": 0.1496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16333602368831635,
"step": 3665,
"valid_targets_mean": 4690.4,
"valid_targets_min": 876
},
{
"epoch": 5.577507598784194,
"grad_norm": 0.5062778786472242,
"learning_rate": 4.835034508936736e-06,
"loss": 0.152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15072304010391235,
"step": 3670,
"valid_targets_mean": 4472.8,
"valid_targets_min": 863
},
{
"epoch": 5.585106382978723,
"grad_norm": 0.4887232514300285,
"learning_rate": 4.785729495806804e-06,
"loss": 0.1489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1506553441286087,
"step": 3675,
"valid_targets_mean": 4468.6,
"valid_targets_min": 1870
},
{
"epoch": 5.592705167173253,
"grad_norm": 0.5178118286048965,
"learning_rate": 4.736642977573745e-06,
"loss": 0.1443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14603829383850098,
"step": 3680,
"valid_targets_mean": 3900.1,
"valid_targets_min": 314
},
{
"epoch": 5.600303951367781,
"grad_norm": 0.49021784557999176,
"learning_rate": 4.6877756591779465e-06,
"loss": 0.1579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1614750772714615,
"step": 3685,
"valid_targets_mean": 4549.1,
"valid_targets_min": 1530
},
{
"epoch": 5.60790273556231,
"grad_norm": 0.46685253564728685,
"learning_rate": 4.63912824241183e-06,
"loss": 0.1479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15664935111999512,
"step": 3690,
"valid_targets_mean": 4078.2,
"valid_targets_min": 702
},
{
"epoch": 5.6155015197568385,
"grad_norm": 0.4476391544726595,
"learning_rate": 4.590701425909763e-06,
"loss": 0.1633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1614711433649063,
"step": 3695,
"valid_targets_mean": 5204.6,
"valid_targets_min": 1871
},
{
"epoch": 5.623100303951368,
"grad_norm": 0.46752237532336416,
"learning_rate": 4.5424959051380376e-06,
"loss": 0.1423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14600232243537903,
"step": 3700,
"valid_targets_mean": 4345.4,
"valid_targets_min": 1418
},
{
"epoch": 5.630699088145897,
"grad_norm": 0.498907377725208,
"learning_rate": 4.4945123723848785e-06,
"loss": 0.1668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16958801448345184,
"step": 3705,
"valid_targets_mean": 4744.0,
"valid_targets_min": 655
},
{
"epoch": 5.638297872340425,
"grad_norm": 0.47032248993505454,
"learning_rate": 4.446751516750496e-06,
"loss": 0.1441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15484699606895447,
"step": 3710,
"valid_targets_mean": 4455.9,
"valid_targets_min": 513
},
{
"epoch": 5.645896656534955,
"grad_norm": 0.49291725666506586,
"learning_rate": 4.399214024137199e-06,
"loss": 0.1519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1515854448080063,
"step": 3715,
"valid_targets_mean": 4026.5,
"valid_targets_min": 401
},
{
"epoch": 5.6534954407294835,
"grad_norm": 0.42768293201723206,
"learning_rate": 4.351900577239534e-06,
"loss": 0.1508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1308768093585968,
"step": 3720,
"valid_targets_mean": 5203.2,
"valid_targets_min": 511
},
{
"epoch": 5.661094224924012,
"grad_norm": 0.419913357256391,
"learning_rate": 4.30481185553449e-06,
"loss": 0.143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15996746718883514,
"step": 3725,
"valid_targets_mean": 6209.4,
"valid_targets_min": 3964
},
{
"epoch": 5.668693009118541,
"grad_norm": 0.5024514745126758,
"learning_rate": 4.2579485352717365e-06,
"loss": 0.1429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14928898215293884,
"step": 3730,
"valid_targets_mean": 5061.5,
"valid_targets_min": 854
},
{
"epoch": 5.676291793313069,
"grad_norm": 0.6107697257765264,
"learning_rate": 4.211311289463913e-06,
"loss": 0.1791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.212265282869339,
"step": 3735,
"valid_targets_mean": 2980.9,
"valid_targets_min": 613
},
{
"epoch": 5.683890577507599,
"grad_norm": 0.40762228356266644,
"learning_rate": 4.164900787876958e-06,
"loss": 0.1572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15725256502628326,
"step": 3740,
"valid_targets_mean": 5801.9,
"valid_targets_min": 1647
},
{
"epoch": 5.691489361702128,
"grad_norm": 0.42068151608687643,
"learning_rate": 4.118717697020503e-06,
"loss": 0.1494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15178656578063965,
"step": 3745,
"valid_targets_mean": 5270.4,
"valid_targets_min": 714
},
{
"epoch": 5.699088145896656,
"grad_norm": 0.510742750219421,
"learning_rate": 4.072762680138283e-06,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16748473048210144,
"step": 3750,
"valid_targets_mean": 4111.5,
"valid_targets_min": 690
},
{
"epoch": 5.706686930091186,
"grad_norm": 0.4725979697075687,
"learning_rate": 4.02703639719863e-06,
"loss": 0.1675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16421647369861603,
"step": 3755,
"valid_targets_mean": 5007.1,
"valid_targets_min": 1593
},
{
"epoch": 5.714285714285714,
"grad_norm": 0.4858255836304888,
"learning_rate": 3.981539504884975e-06,
"loss": 0.1585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1452382504940033,
"step": 3760,
"valid_targets_mean": 4335.0,
"valid_targets_min": 268
},
{
"epoch": 5.721884498480243,
"grad_norm": 0.496365033025088,
"learning_rate": 3.936272656586455e-06,
"loss": 0.1639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1607646495103836,
"step": 3765,
"valid_targets_mean": 4691.0,
"valid_targets_min": 801
},
{
"epoch": 5.729483282674772,
"grad_norm": 0.49339220005728074,
"learning_rate": 3.891236502388463e-06,
"loss": 0.1399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12876826524734497,
"step": 3770,
"valid_targets_mean": 3568.1,
"valid_targets_min": 629
},
{
"epoch": 5.737082066869301,
"grad_norm": 0.42864321603538963,
"learning_rate": 3.846431689063395e-06,
"loss": 0.1598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14634914696216583,
"step": 3775,
"valid_targets_mean": 5067.4,
"valid_targets_min": 1740
},
{
"epoch": 5.74468085106383,
"grad_norm": 0.4858809112101771,
"learning_rate": 3.801858860061276e-06,
"loss": 0.1707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15183153748512268,
"step": 3780,
"valid_targets_mean": 4308.7,
"valid_targets_min": 2342
},
{
"epoch": 5.7522796352583585,
"grad_norm": 0.430010773677836,
"learning_rate": 3.757518655500607e-06,
"loss": 0.1413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11490476876497269,
"step": 3785,
"valid_targets_mean": 4636.7,
"valid_targets_min": 1770
},
{
"epoch": 5.759878419452887,
"grad_norm": 0.44137928337029025,
"learning_rate": 3.7134117121590783e-06,
"loss": 0.1477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1602618247270584,
"step": 3790,
"valid_targets_mean": 5387.0,
"valid_targets_min": 1520
},
{
"epoch": 5.767477203647417,
"grad_norm": 0.49716171756169814,
"learning_rate": 3.6695386634645268e-06,
"loss": 0.1568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17046484351158142,
"step": 3795,
"valid_targets_mean": 3979.0,
"valid_targets_min": 637
},
{
"epoch": 5.775075987841945,
"grad_norm": 0.6225472640133536,
"learning_rate": 3.625900139485732e-06,
"loss": 0.1483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16933000087738037,
"step": 3800,
"valid_targets_mean": 3247.3,
"valid_targets_min": 403
},
{
"epoch": 5.782674772036474,
"grad_norm": 0.4826561130766123,
"learning_rate": 3.5824967669234712e-06,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14927777647972107,
"step": 3805,
"valid_targets_mean": 4297.8,
"valid_targets_min": 479
},
{
"epoch": 5.7902735562310035,
"grad_norm": 0.4594251420598871,
"learning_rate": 3.539329169101424e-06,
"loss": 0.1679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15365689992904663,
"step": 3810,
"valid_targets_mean": 5167.4,
"valid_targets_min": 892
},
{
"epoch": 5.797872340425532,
"grad_norm": 0.4557619581698914,
"learning_rate": 3.49639796595731e-06,
"loss": 0.164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1744815707206726,
"step": 3815,
"valid_targets_mean": 5195.3,
"valid_targets_min": 634
},
{
"epoch": 5.805471124620061,
"grad_norm": 0.46537892238846895,
"learning_rate": 3.453703774033901e-06,
"loss": 0.1587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14466017484664917,
"step": 3820,
"valid_targets_mean": 4648.0,
"valid_targets_min": 736
},
{
"epoch": 5.813069908814589,
"grad_norm": 0.5247551115664364,
"learning_rate": 3.4112472064702473e-06,
"loss": 0.1533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16951002180576324,
"step": 3825,
"valid_targets_mean": 4100.8,
"valid_targets_min": 529
},
{
"epoch": 5.820668693009118,
"grad_norm": 0.4408079538837663,
"learning_rate": 3.369028872992792e-06,
"loss": 0.1589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15143227577209473,
"step": 3830,
"valid_targets_mean": 5215.6,
"valid_targets_min": 1009
},
{
"epoch": 5.828267477203648,
"grad_norm": 0.5248938288172915,
"learning_rate": 3.327049379906695e-06,
"loss": 0.1633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17994189262390137,
"step": 3835,
"valid_targets_mean": 4604.6,
"valid_targets_min": 570
},
{
"epoch": 5.835866261398176,
"grad_norm": 0.5052356507109963,
"learning_rate": 3.2853093300870452e-06,
"loss": 0.1457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1394600123167038,
"step": 3840,
"valid_targets_mean": 4017.8,
"valid_targets_min": 736
},
{
"epoch": 5.843465045592705,
"grad_norm": 0.47463044811940924,
"learning_rate": 3.2438093229702905e-06,
"loss": 0.1577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15373006463050842,
"step": 3845,
"valid_targets_mean": 4134.0,
"valid_targets_min": 410
},
{
"epoch": 5.851063829787234,
"grad_norm": 0.513814275937601,
"learning_rate": 3.202549954545533e-06,
"loss": 0.1712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23078633844852448,
"step": 3850,
"valid_targets_mean": 5543.1,
"valid_targets_min": 655
},
{
"epoch": 5.858662613981763,
"grad_norm": 0.48073524570765763,
"learning_rate": 3.161531817346062e-06,
"loss": 0.1579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17668002843856812,
"step": 3855,
"valid_targets_mean": 4446.9,
"valid_targets_min": 449
},
{
"epoch": 5.866261398176292,
"grad_norm": 0.4258287069585612,
"learning_rate": 3.120755500440762e-06,
"loss": 0.1546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14281289279460907,
"step": 3860,
"valid_targets_mean": 5058.1,
"valid_targets_min": 1100
},
{
"epoch": 5.87386018237082,
"grad_norm": 0.4556314380528612,
"learning_rate": 3.0802215894257336e-06,
"loss": 0.1565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15817520022392273,
"step": 3865,
"valid_targets_mean": 4869.2,
"valid_targets_min": 2426
},
{
"epoch": 5.88145896656535,
"grad_norm": 0.632880711013422,
"learning_rate": 3.0399306664158e-06,
"loss": 0.1443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1440334916114807,
"step": 3870,
"valid_targets_mean": 4294.8,
"valid_targets_min": 1072
},
{
"epoch": 5.8890577507598785,
"grad_norm": 0.40158185981708566,
"learning_rate": 2.9998833100362336e-06,
"loss": 0.1524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1560600996017456,
"step": 3875,
"valid_targets_mean": 5631.6,
"valid_targets_min": 1728
},
{
"epoch": 5.896656534954407,
"grad_norm": 0.500623763450671,
"learning_rate": 2.9600800954143572e-06,
"loss": 0.138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1587526947259903,
"step": 3880,
"valid_targets_mean": 4028.8,
"valid_targets_min": 666
},
{
"epoch": 5.904255319148936,
"grad_norm": 0.4944868321896879,
"learning_rate": 2.9205215941713704e-06,
"loss": 0.1535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16634200513362885,
"step": 3885,
"valid_targets_mean": 4611.9,
"valid_targets_min": 732
},
{
"epoch": 5.911854103343465,
"grad_norm": 0.5115742550534301,
"learning_rate": 2.8812083744140616e-06,
"loss": 0.1515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15021023154258728,
"step": 3890,
"valid_targets_mean": 4236.3,
"valid_targets_min": 1104
},
{
"epoch": 5.919452887537994,
"grad_norm": 0.48224861462921226,
"learning_rate": 2.842141000726726e-06,
"loss": 0.1537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1501300185918808,
"step": 3895,
"valid_targets_mean": 4213.5,
"valid_targets_min": 774
},
{
"epoch": 5.927051671732523,
"grad_norm": 0.4030631035629361,
"learning_rate": 2.8033200341629886e-06,
"loss": 0.1519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12463116645812988,
"step": 3900,
"valid_targets_mean": 5398.5,
"valid_targets_min": 1514
},
{
"epoch": 5.934650455927052,
"grad_norm": 0.45096444866968627,
"learning_rate": 2.7647460322377927e-06,
"loss": 0.1766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17850109934806824,
"step": 3905,
"valid_targets_mean": 5562.8,
"valid_targets_min": 569
},
{
"epoch": 5.942249240121581,
"grad_norm": 0.41781952891112895,
"learning_rate": 2.72641954891937e-06,
"loss": 0.1637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.145452082157135,
"step": 3910,
"valid_targets_mean": 5237.6,
"valid_targets_min": 787
},
{
"epoch": 5.949848024316109,
"grad_norm": 0.462920182118315,
"learning_rate": 2.688341134621295e-06,
"loss": 0.1494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1589956283569336,
"step": 3915,
"valid_targets_mean": 5620.2,
"valid_targets_min": 797
},
{
"epoch": 5.957446808510638,
"grad_norm": 0.48846090610407683,
"learning_rate": 2.6505113361945833e-06,
"loss": 0.1552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18880805373191833,
"step": 3920,
"valid_targets_mean": 4641.4,
"valid_targets_min": 879
},
{
"epoch": 5.9650455927051675,
"grad_norm": 0.440227878411004,
"learning_rate": 2.612930696919822e-06,
"loss": 0.1488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13358448445796967,
"step": 3925,
"valid_targets_mean": 4184.0,
"valid_targets_min": 559
},
{
"epoch": 5.972644376899696,
"grad_norm": 0.4575207059455806,
"learning_rate": 2.5755997564993894e-06,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14469373226165771,
"step": 3930,
"valid_targets_mean": 4649.6,
"valid_targets_min": 2261
},
{
"epoch": 5.980243161094225,
"grad_norm": 0.5005233906873359,
"learning_rate": 2.5385190510496858e-06,
"loss": 0.1618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17244486510753632,
"step": 3935,
"valid_targets_mean": 4924.8,
"valid_targets_min": 171
},
{
"epoch": 5.9878419452887535,
"grad_norm": 0.4458252216107338,
"learning_rate": 2.5016891130934463e-06,
"loss": 0.1457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13665539026260376,
"step": 3940,
"valid_targets_mean": 4990.1,
"valid_targets_min": 500
},
{
"epoch": 5.995440729483283,
"grad_norm": 0.4846406288628859,
"learning_rate": 2.465110471552086e-06,
"loss": 0.1664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16603650152683258,
"step": 3945,
"valid_targets_mean": 4758.2,
"valid_targets_min": 599
},
{
"epoch": 6.003039513677812,
"grad_norm": 0.44214905635705837,
"learning_rate": 2.4287836517381113e-06,
"loss": 0.1349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11986207216978073,
"step": 3950,
"valid_targets_mean": 4267.4,
"valid_targets_min": 335
},
{
"epoch": 6.01063829787234,
"grad_norm": 0.4887571085350468,
"learning_rate": 2.392709175347554e-06,
"loss": 0.1505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14001381397247314,
"step": 3955,
"valid_targets_mean": 4841.9,
"valid_targets_min": 797
},
{
"epoch": 6.018237082066869,
"grad_norm": 0.5312808060591666,
"learning_rate": 2.356887560452528e-06,
"loss": 0.1583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17127478122711182,
"step": 3960,
"valid_targets_mean": 3657.6,
"valid_targets_min": 713
},
{
"epoch": 6.025835866261398,
"grad_norm": 0.49420144944896355,
"learning_rate": 2.321319321493718e-06,
"loss": 0.1538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15153075754642487,
"step": 3965,
"valid_targets_mean": 4141.9,
"valid_targets_min": 792
},
{
"epoch": 6.033434650455927,
"grad_norm": 0.43348847119788875,
"learning_rate": 2.2860049692730745e-06,
"loss": 0.1506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15093687176704407,
"step": 3970,
"valid_targets_mean": 5298.1,
"valid_targets_min": 491
},
{
"epoch": 6.041033434650456,
"grad_norm": 0.4852668062537144,
"learning_rate": 2.2509450109463903e-06,
"loss": 0.1462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15192578732967377,
"step": 3975,
"valid_targets_mean": 4195.6,
"valid_targets_min": 646
},
{
"epoch": 6.048632218844984,
"grad_norm": 0.4985600383895827,
"learning_rate": 2.2161399500161005e-06,
"loss": 0.1423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12650343775749207,
"step": 3980,
"valid_targets_mean": 4298.5,
"valid_targets_min": 1887
},
{
"epoch": 6.056231003039514,
"grad_norm": 0.46036482703942144,
"learning_rate": 2.1815902863239826e-06,
"loss": 0.1459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12870556116104126,
"step": 3985,
"valid_targets_mean": 4722.8,
"valid_targets_min": 1027
},
{
"epoch": 6.0638297872340425,
"grad_norm": 0.4724257952962997,
"learning_rate": 2.1472965160440307e-06,
"loss": 0.1548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15059977769851685,
"step": 3990,
"valid_targets_mean": 4350.8,
"valid_targets_min": 1618
},
{
"epoch": 6.071428571428571,
"grad_norm": 0.4736941877158723,
"learning_rate": 2.1132591316752824e-06,
"loss": 0.1446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12970831990242004,
"step": 3995,
"valid_targets_mean": 4671.1,
"valid_targets_min": 1136
},
{
"epoch": 6.079027355623101,
"grad_norm": 0.4790995642913263,
"learning_rate": 2.079478622034803e-06,
"loss": 0.1506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1599026918411255,
"step": 4000,
"valid_targets_mean": 5553.9,
"valid_targets_min": 2157
},
{
"epoch": 6.086626139817629,
"grad_norm": 0.5750210601223926,
"learning_rate": 2.045955472250598e-06,
"loss": 0.1557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1329852193593979,
"step": 4005,
"valid_targets_mean": 4740.1,
"valid_targets_min": 658
},
{
"epoch": 6.094224924012158,
"grad_norm": 0.5356962782262873,
"learning_rate": 2.012690163754716e-06,
"loss": 0.1506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1583370566368103,
"step": 4010,
"valid_targets_mean": 3881.9,
"valid_targets_min": 833
},
{
"epoch": 6.101823708206687,
"grad_norm": 0.5430593717962985,
"learning_rate": 1.9796831742762658e-06,
"loss": 0.1503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17519140243530273,
"step": 4015,
"valid_targets_mean": 4008.7,
"valid_targets_min": 513
},
{
"epoch": 6.109422492401216,
"grad_norm": 0.5395476454999809,
"learning_rate": 1.9469349778346223e-06,
"loss": 0.1416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1673513501882553,
"step": 4020,
"valid_targets_mean": 3863.8,
"valid_targets_min": 862
},
{
"epoch": 6.117021276595745,
"grad_norm": 0.6041814504745721,
"learning_rate": 1.9144460447325564e-06,
"loss": 0.1433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16433076560497284,
"step": 4025,
"valid_targets_mean": 4698.3,
"valid_targets_min": 821
},
{
"epoch": 6.124620060790273,
"grad_norm": 0.6094776194613557,
"learning_rate": 1.8822168415495422e-06,
"loss": 0.1453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13730981945991516,
"step": 4030,
"valid_targets_mean": 4077.6,
"valid_targets_min": 901
},
{
"epoch": 6.132218844984802,
"grad_norm": 0.45063574077263974,
"learning_rate": 1.8502478311349947e-06,
"loss": 0.156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16246050596237183,
"step": 4035,
"valid_targets_mean": 5466.6,
"valid_targets_min": 2424
},
{
"epoch": 6.139817629179332,
"grad_norm": 0.4816199109533305,
"learning_rate": 1.8185394726016791e-06,
"loss": 0.1604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1370609700679779,
"step": 4040,
"valid_targets_mean": 4561.9,
"valid_targets_min": 743
},
{
"epoch": 6.14741641337386,
"grad_norm": 0.6732958197054807,
"learning_rate": 1.7870922213190755e-06,
"loss": 0.1581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16209891438484192,
"step": 4045,
"valid_targets_mean": 3887.8,
"valid_targets_min": 550
},
{
"epoch": 6.155015197568389,
"grad_norm": 0.4601061012528339,
"learning_rate": 1.7559065289068633e-06,
"loss": 0.1574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13671234250068665,
"step": 4050,
"valid_targets_mean": 5133.4,
"valid_targets_min": 479
},
{
"epoch": 6.1626139817629175,
"grad_norm": 0.43746420290219207,
"learning_rate": 1.72498284322842e-06,
"loss": 0.1468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1267484724521637,
"step": 4055,
"valid_targets_mean": 5035.9,
"valid_targets_min": 1853
},
{
"epoch": 6.170212765957447,
"grad_norm": 0.4569139573946025,
"learning_rate": 1.694321608384406e-06,
"loss": 0.1461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14077520370483398,
"step": 4060,
"valid_targets_mean": 5069.5,
"valid_targets_min": 2002
},
{
"epoch": 6.177811550151976,
"grad_norm": 0.43274533973618445,
"learning_rate": 1.663923264706373e-06,
"loss": 0.1329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14554743468761444,
"step": 4065,
"valid_targets_mean": 5077.8,
"valid_targets_min": 519
},
{
"epoch": 6.185410334346504,
"grad_norm": 0.47582107432910764,
"learning_rate": 1.6337882487504452e-06,
"loss": 0.1473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14857840538024902,
"step": 4070,
"valid_targets_mean": 4424.7,
"valid_targets_min": 674
},
{
"epoch": 6.193009118541034,
"grad_norm": 0.5274167558239128,
"learning_rate": 1.603916993291048e-06,
"loss": 0.1502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14230819046497345,
"step": 4075,
"valid_targets_mean": 3961.1,
"valid_targets_min": 654
},
{
"epoch": 6.2006079027355625,
"grad_norm": 0.49913070570635226,
"learning_rate": 1.5743099273146967e-06,
"loss": 0.1504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1440865695476532,
"step": 4080,
"valid_targets_mean": 5009.5,
"valid_targets_min": 444
},
{
"epoch": 6.208206686930091,
"grad_norm": 0.4571022258136094,
"learning_rate": 1.5449674760138344e-06,
"loss": 0.1355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1474510282278061,
"step": 4085,
"valid_targets_mean": 4348.4,
"valid_targets_min": 770
},
{
"epoch": 6.21580547112462,
"grad_norm": 0.4714848047264726,
"learning_rate": 1.5158900607807248e-06,
"loss": 0.1574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16296353936195374,
"step": 4090,
"valid_targets_mean": 4949.5,
"valid_targets_min": 694
},
{
"epoch": 6.223404255319149,
"grad_norm": 0.4322780542533103,
"learning_rate": 1.4870780992013956e-06,
"loss": 0.161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13294166326522827,
"step": 4095,
"valid_targets_mean": 4950.1,
"valid_targets_min": 329
},
{
"epoch": 6.231003039513678,
"grad_norm": 0.5464674366866006,
"learning_rate": 1.4585320050496531e-06,
"loss": 0.1446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15174424648284912,
"step": 4100,
"valid_targets_mean": 4007.2,
"valid_targets_min": 834
},
{
"epoch": 6.238601823708207,
"grad_norm": 0.42685774893365297,
"learning_rate": 1.4302521882811316e-06,
"loss": 0.1441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1383514404296875,
"step": 4105,
"valid_targets_mean": 5403.9,
"valid_targets_min": 918
},
{
"epoch": 6.246200607902735,
"grad_norm": 0.5366963612937214,
"learning_rate": 1.4022390550274034e-06,
"loss": 0.1468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15787436068058014,
"step": 4110,
"valid_targets_mean": 3990.0,
"valid_targets_min": 434
},
{
"epoch": 6.253799392097265,
"grad_norm": 0.46724324680744234,
"learning_rate": 1.3744930075901563e-06,
"loss": 0.1529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14154699444770813,
"step": 4115,
"valid_targets_mean": 4727.9,
"valid_targets_min": 588
},
{
"epoch": 6.261398176291793,
"grad_norm": 0.41711994711720174,
"learning_rate": 1.3470144444354061e-06,
"loss": 0.1499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1419452279806137,
"step": 4120,
"valid_targets_mean": 5510.2,
"valid_targets_min": 713
},
{
"epoch": 6.268996960486322,
"grad_norm": 0.5220642496809625,
"learning_rate": 1.3198037601877789e-06,
"loss": 0.1511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1353391706943512,
"step": 4125,
"valid_targets_mean": 4115.4,
"valid_targets_min": 450
},
{
"epoch": 6.276595744680851,
"grad_norm": 0.4939240759429581,
"learning_rate": 1.2928613456248473e-06,
"loss": 0.1614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15414312481880188,
"step": 4130,
"valid_targets_mean": 5176.1,
"valid_targets_min": 571
},
{
"epoch": 6.28419452887538,
"grad_norm": 0.442808139834025,
"learning_rate": 1.266187587671508e-06,
"loss": 0.1484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15302585065364838,
"step": 4135,
"valid_targets_mean": 5258.6,
"valid_targets_min": 2495
},
{
"epoch": 6.291793313069909,
"grad_norm": 0.4548322696937593,
"learning_rate": 1.2397828693944346e-06,
"loss": 0.1469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14306071400642395,
"step": 4140,
"valid_targets_mean": 4863.1,
"valid_targets_min": 1948
},
{
"epoch": 6.2993920972644375,
"grad_norm": 0.46459072507225524,
"learning_rate": 1.2136475699965766e-06,
"loss": 0.1448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1553143858909607,
"step": 4145,
"valid_targets_mean": 4614.7,
"valid_targets_min": 816
},
{
"epoch": 6.306990881458967,
"grad_norm": 0.4740383536049804,
"learning_rate": 1.1877820648117045e-06,
"loss": 0.1487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13636600971221924,
"step": 4150,
"valid_targets_mean": 4426.7,
"valid_targets_min": 668
},
{
"epoch": 6.314589665653496,
"grad_norm": 0.6354900899788738,
"learning_rate": 1.162186725299026e-06,
"loss": 0.1596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.155159130692482,
"step": 4155,
"valid_targets_mean": 3329.7,
"valid_targets_min": 585
},
{
"epoch": 6.322188449848024,
"grad_norm": 0.4835553520976796,
"learning_rate": 1.1368619190378527e-06,
"loss": 0.1577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17658662796020508,
"step": 4160,
"valid_targets_mean": 4895.8,
"valid_targets_min": 1482
},
{
"epoch": 6.329787234042553,
"grad_norm": 0.4554986467408132,
"learning_rate": 1.1118080097223194e-06,
"loss": 0.1577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15265491604804993,
"step": 4165,
"valid_targets_mean": 5167.2,
"valid_targets_min": 1292
},
{
"epoch": 6.3373860182370825,
"grad_norm": 0.41973694830585506,
"learning_rate": 1.0870253571561595e-06,
"loss": 0.1551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12299495190382004,
"step": 4170,
"valid_targets_mean": 4780.7,
"valid_targets_min": 970
},
{
"epoch": 6.344984802431611,
"grad_norm": 0.5118900681918644,
"learning_rate": 1.0625143172475404e-06,
"loss": 0.1589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15326988697052002,
"step": 4175,
"valid_targets_mean": 4208.6,
"valid_targets_min": 636
},
{
"epoch": 6.35258358662614,
"grad_norm": 0.49642090601129557,
"learning_rate": 1.0382752420039455e-06,
"loss": 0.1536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15455183386802673,
"step": 4180,
"valid_targets_mean": 4102.3,
"valid_targets_min": 997
},
{
"epoch": 6.360182370820668,
"grad_norm": 0.45380918848581747,
"learning_rate": 1.0143084795271329e-06,
"loss": 0.1553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15013962984085083,
"step": 4185,
"valid_targets_mean": 4628.6,
"valid_targets_min": 1572
},
{
"epoch": 6.367781155015198,
"grad_norm": 0.5198176682483998,
"learning_rate": 9.906143740081232e-07,
"loss": 0.1465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15279626846313477,
"step": 4190,
"valid_targets_mean": 3914.1,
"valid_targets_min": 365
},
{
"epoch": 6.375379939209727,
"grad_norm": 0.4840441603322201,
"learning_rate": 9.671932657222593e-07,
"loss": 0.1497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14245177805423737,
"step": 4195,
"valid_targets_mean": 4812.6,
"valid_targets_min": 370
},
{
"epoch": 6.382978723404255,
"grad_norm": 0.49127649884609786,
"learning_rate": 9.440454910243235e-07,
"loss": 0.1599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1520758867263794,
"step": 4200,
"valid_targets_mean": 4315.1,
"valid_targets_min": 517
},
{
"epoch": 6.390577507598784,
"grad_norm": 0.4383379165078549,
"learning_rate": 9.211713823437063e-07,
"loss": 0.135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1275199055671692,
"step": 4205,
"valid_targets_mean": 5704.6,
"valid_targets_min": 581
},
{
"epoch": 6.398176291793313,
"grad_norm": 0.5022657150694129,
"learning_rate": 8.985712681796288e-07,
"loss": 0.1528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17914274334907532,
"step": 4210,
"valid_targets_mean": 4508.4,
"valid_targets_min": 640
},
{
"epoch": 6.405775075987842,
"grad_norm": 0.443057452645931,
"learning_rate": 8.762454730964265e-07,
"loss": 0.1503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15875935554504395,
"step": 4215,
"valid_targets_mean": 5279.9,
"valid_targets_min": 972
},
{
"epoch": 6.413373860182371,
"grad_norm": 0.5449589653106505,
"learning_rate": 8.541943177188882e-07,
"loss": 0.1492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14582566916942596,
"step": 4220,
"valid_targets_mean": 4343.2,
"valid_targets_min": 892
},
{
"epoch": 6.420972644376899,
"grad_norm": 0.4997679647771693,
"learning_rate": 8.324181187276581e-07,
"loss": 0.1643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15510517358779907,
"step": 4225,
"valid_targets_mean": 4085.7,
"valid_targets_min": 912
},
{
"epoch": 6.428571428571429,
"grad_norm": 0.44678133251760943,
"learning_rate": 8.109171888546763e-07,
"loss": 0.1554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15751153230667114,
"step": 4230,
"valid_targets_mean": 5778.9,
"valid_targets_min": 1954
},
{
"epoch": 6.4361702127659575,
"grad_norm": 0.46788177391921826,
"learning_rate": 7.896918368786921e-07,
"loss": 0.16,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15475589036941528,
"step": 4235,
"valid_targets_mean": 5169.8,
"valid_targets_min": 398
},
{
"epoch": 6.443768996960486,
"grad_norm": 0.5529538967645823,
"learning_rate": 7.687423676208361e-07,
"loss": 0.1455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13819439709186554,
"step": 4240,
"valid_targets_mean": 3202.6,
"valid_targets_min": 528
},
{
"epoch": 6.451367781155016,
"grad_norm": 0.5420949591531663,
"learning_rate": 7.480690819402348e-07,
"loss": 0.1493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1723976731300354,
"step": 4245,
"valid_targets_mean": 3846.0,
"valid_targets_min": 630
},
{
"epoch": 6.458966565349544,
"grad_norm": 0.46741861641823984,
"learning_rate": 7.276722767296873e-07,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1849384605884552,
"step": 4250,
"valid_targets_mean": 5119.9,
"valid_targets_min": 883
},
{
"epoch": 6.466565349544073,
"grad_norm": 0.4582713436855528,
"learning_rate": 7.075522449114158e-07,
"loss": 0.1431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15820877254009247,
"step": 4255,
"valid_targets_mean": 5030.8,
"valid_targets_min": 802
},
{
"epoch": 6.474164133738602,
"grad_norm": 0.5211860109572727,
"learning_rate": 6.877092754328419e-07,
"loss": 0.1582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13718628883361816,
"step": 4260,
"valid_targets_mean": 3807.9,
"valid_targets_min": 845
},
{
"epoch": 6.481762917933131,
"grad_norm": 0.45451059770584273,
"learning_rate": 6.681436532624474e-07,
"loss": 0.1487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1656309813261032,
"step": 4265,
"valid_targets_mean": 5183.2,
"valid_targets_min": 1002
},
{
"epoch": 6.48936170212766,
"grad_norm": 0.47843071748812777,
"learning_rate": 6.488556593856809e-07,
"loss": 0.1594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.150562584400177,
"step": 4270,
"valid_targets_mean": 4543.6,
"valid_targets_min": 656
},
{
"epoch": 6.496960486322188,
"grad_norm": 0.5319539824885515,
"learning_rate": 6.298455708009176e-07,
"loss": 0.1497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15512758493423462,
"step": 4275,
"valid_targets_mean": 3799.5,
"valid_targets_min": 395
},
{
"epoch": 6.504559270516717,
"grad_norm": 0.4705596941066166,
"learning_rate": 6.111136605154877e-07,
"loss": 0.1457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16856907308101654,
"step": 4280,
"valid_targets_mean": 4642.4,
"valid_targets_min": 589
},
{
"epoch": 6.5121580547112465,
"grad_norm": 0.46141711207212177,
"learning_rate": 5.926601975417501e-07,
"loss": 0.1504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17225798964500427,
"step": 4285,
"valid_targets_mean": 4939.4,
"valid_targets_min": 706
},
{
"epoch": 6.519756838905775,
"grad_norm": 0.4495104074555779,
"learning_rate": 5.744854468932315e-07,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1445414125919342,
"step": 4290,
"valid_targets_mean": 4603.4,
"valid_targets_min": 810
},
{
"epoch": 6.527355623100304,
"grad_norm": 0.5733777706336946,
"learning_rate": 5.565896695808203e-07,
"loss": 0.1705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16275358200073242,
"step": 4295,
"valid_targets_mean": 4785.0,
"valid_targets_min": 599
},
{
"epoch": 6.5349544072948325,
"grad_norm": 0.8991578623134154,
"learning_rate": 5.389731226090189e-07,
"loss": 0.144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14771892130374908,
"step": 4300,
"valid_targets_mean": 4996.3,
"valid_targets_min": 981
},
{
"epoch": 6.542553191489362,
"grad_norm": 0.4730812664882942,
"learning_rate": 5.216360589722546e-07,
"loss": 0.134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12634432315826416,
"step": 4305,
"valid_targets_mean": 4793.1,
"valid_targets_min": 689
},
{
"epoch": 6.550151975683891,
"grad_norm": 0.7912559796750507,
"learning_rate": 5.045787276512371e-07,
"loss": 0.1406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14239290356636047,
"step": 4310,
"valid_targets_mean": 4268.8,
"valid_targets_min": 558
},
{
"epoch": 6.557750759878419,
"grad_norm": 0.5029546562969596,
"learning_rate": 4.878013736093979e-07,
"loss": 0.1436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1558806449174881,
"step": 4315,
"valid_targets_mean": 4656.5,
"valid_targets_min": 767
},
{
"epoch": 6.565349544072948,
"grad_norm": 0.4604621873568329,
"learning_rate": 4.713042377893562e-07,
"loss": 0.1377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1444740742444992,
"step": 4320,
"valid_targets_mean": 4422.7,
"valid_targets_min": 346
},
{
"epoch": 6.572948328267477,
"grad_norm": 0.4561980791707648,
"learning_rate": 4.550875571094726e-07,
"loss": 0.1712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14359544217586517,
"step": 4325,
"valid_targets_mean": 4979.9,
"valid_targets_min": 2820
},
{
"epoch": 6.580547112462006,
"grad_norm": 0.47209358910428856,
"learning_rate": 4.391515644604383e-07,
"loss": 0.1502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1348213255405426,
"step": 4330,
"valid_targets_mean": 4494.7,
"valid_targets_min": 589
},
{
"epoch": 6.588145896656535,
"grad_norm": 0.4994707929739602,
"learning_rate": 4.2349648870193103e-07,
"loss": 0.1461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15195885300636292,
"step": 4335,
"valid_targets_mean": 4239.8,
"valid_targets_min": 307
},
{
"epoch": 6.595744680851064,
"grad_norm": 0.44042761045131223,
"learning_rate": 4.081225546593337e-07,
"loss": 0.1513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.129265695810318,
"step": 4340,
"valid_targets_mean": 5283.0,
"valid_targets_min": 1159
},
{
"epoch": 6.603343465045593,
"grad_norm": 0.47257646281879734,
"learning_rate": 3.9302998312049865e-07,
"loss": 0.1543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14243176579475403,
"step": 4345,
"valid_targets_mean": 5513.4,
"valid_targets_min": 1072
},
{
"epoch": 6.6109422492401215,
"grad_norm": 0.5058368728464357,
"learning_rate": 3.782189908325817e-07,
"loss": 0.1492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14209382236003876,
"step": 4350,
"valid_targets_mean": 4845.4,
"valid_targets_min": 876
},
{
"epoch": 6.61854103343465,
"grad_norm": 0.7222155225557564,
"learning_rate": 3.636897904989312e-07,
"loss": 0.1581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17290833592414856,
"step": 4355,
"valid_targets_mean": 5422.5,
"valid_targets_min": 833
},
{
"epoch": 6.62613981762918,
"grad_norm": 0.5233180981965705,
"learning_rate": 3.494425907760235e-07,
"loss": 0.1507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1492675244808197,
"step": 4360,
"valid_targets_mean": 4823.8,
"valid_targets_min": 1224
},
{
"epoch": 6.633738601823708,
"grad_norm": 0.5428953839010765,
"learning_rate": 3.3547759627047927e-07,
"loss": 0.1585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16122207045555115,
"step": 4365,
"valid_targets_mean": 3899.6,
"valid_targets_min": 753
},
{
"epoch": 6.641337386018237,
"grad_norm": 0.4419180172745714,
"learning_rate": 3.2179500753611423e-07,
"loss": 0.1436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.135797381401062,
"step": 4370,
"valid_targets_mean": 5275.6,
"valid_targets_min": 861
},
{
"epoch": 6.648936170212766,
"grad_norm": 0.4922555679423693,
"learning_rate": 3.0839502107106625e-07,
"loss": 0.1535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13909777998924255,
"step": 4375,
"valid_targets_mean": 3951.1,
"valid_targets_min": 702
},
{
"epoch": 6.656534954407295,
"grad_norm": 0.5087072512502506,
"learning_rate": 2.952778293149705e-07,
"loss": 0.1534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16498416662216187,
"step": 4380,
"valid_targets_mean": 4312.6,
"valid_targets_min": 429
},
{
"epoch": 6.664133738601824,
"grad_norm": 0.4560459158918358,
"learning_rate": 2.8244362064619777e-07,
"loss": 0.1542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13717833161354065,
"step": 4385,
"valid_targets_mean": 5210.4,
"valid_targets_min": 864
},
{
"epoch": 6.671732522796352,
"grad_norm": 0.5227653302420172,
"learning_rate": 2.698925793791407e-07,
"loss": 0.1476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13961048424243927,
"step": 4390,
"valid_targets_mean": 4236.1,
"valid_targets_min": 534
},
{
"epoch": 6.679331306990882,
"grad_norm": 0.6213258302004528,
"learning_rate": 2.576248857615826e-07,
"loss": 0.148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14259956777095795,
"step": 4395,
"valid_targets_mean": 4035.6,
"valid_targets_min": 752
},
{
"epoch": 6.686930091185411,
"grad_norm": 0.4688652989866426,
"learning_rate": 2.4564071597209304e-07,
"loss": 0.1579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15681865811347961,
"step": 4400,
"valid_targets_mean": 4584.2,
"valid_targets_min": 869
},
{
"epoch": 6.694528875379939,
"grad_norm": 0.44005419382672806,
"learning_rate": 2.3394024211750964e-07,
"loss": 0.1589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1523476541042328,
"step": 4405,
"valid_targets_mean": 4952.2,
"valid_targets_min": 646
},
{
"epoch": 6.702127659574468,
"grad_norm": 0.5205262877358279,
"learning_rate": 2.2252363223045358e-07,
"loss": 0.1474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16646242141723633,
"step": 4410,
"valid_targets_mean": 4151.1,
"valid_targets_min": 820
},
{
"epoch": 6.7097264437689965,
"grad_norm": 0.40766981515095174,
"learning_rate": 2.1139105026693586e-07,
"loss": 0.139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11196255683898926,
"step": 4415,
"valid_targets_mean": 5557.6,
"valid_targets_min": 2410
},
{
"epoch": 6.717325227963526,
"grad_norm": 0.4673986831108265,
"learning_rate": 2.0054265610397916e-07,
"loss": 0.151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1210668534040451,
"step": 4420,
"valid_targets_mean": 3992.8,
"valid_targets_min": 936
},
{
"epoch": 6.724924012158055,
"grad_norm": 0.5619671678982381,
"learning_rate": 1.8997860553733981e-07,
"loss": 0.155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17317882180213928,
"step": 4425,
"valid_targets_mean": 3874.4,
"valid_targets_min": 446
},
{
"epoch": 6.732522796352583,
"grad_norm": 0.4280630319229206,
"learning_rate": 1.7969905027926504e-07,
"loss": 0.1758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1904495656490326,
"step": 4430,
"valid_targets_mean": 6671.5,
"valid_targets_min": 907
},
{
"epoch": 6.740121580547113,
"grad_norm": 0.44122684787277994,
"learning_rate": 1.6970413795631025e-07,
"loss": 0.1528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14559206366539001,
"step": 4435,
"valid_targets_mean": 5373.0,
"valid_targets_min": 595
},
{
"epoch": 6.7477203647416415,
"grad_norm": 0.5080820811124032,
"learning_rate": 1.5999401210722075e-07,
"loss": 0.1423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1340736597776413,
"step": 4440,
"valid_targets_mean": 3668.2,
"valid_targets_min": 694
},
{
"epoch": 6.75531914893617,
"grad_norm": 0.5257059339394762,
"learning_rate": 1.5056881218088016e-07,
"loss": 0.1471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15984541177749634,
"step": 4445,
"valid_targets_mean": 4337.5,
"valid_targets_min": 498
},
{
"epoch": 6.762917933130699,
"grad_norm": 0.43327223465331344,
"learning_rate": 1.4142867353428514e-07,
"loss": 0.1488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.157816082239151,
"step": 4450,
"valid_targets_mean": 5491.9,
"valid_targets_min": 827
},
{
"epoch": 6.770516717325228,
"grad_norm": 0.50219861891989,
"learning_rate": 1.3257372743063157e-07,
"loss": 0.1447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11714717745780945,
"step": 4455,
"valid_targets_mean": 3812.8,
"valid_targets_min": 502
},
{
"epoch": 6.778115501519757,
"grad_norm": 0.45055666905824504,
"learning_rate": 1.2400410103740045e-07,
"loss": 0.136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14584630727767944,
"step": 4460,
"valid_targets_mean": 5178.9,
"valid_targets_min": 516
},
{
"epoch": 6.785714285714286,
"grad_norm": 0.43952764279896794,
"learning_rate": 1.157199174245549e-07,
"loss": 0.1411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13095200061798096,
"step": 4465,
"valid_targets_mean": 5314.9,
"valid_targets_min": 1217
},
{
"epoch": 6.793313069908814,
"grad_norm": 0.4738968512497199,
"learning_rate": 1.0772129556275268e-07,
"loss": 0.1442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12924160063266754,
"step": 4470,
"valid_targets_mean": 4845.8,
"valid_targets_min": 843
},
{
"epoch": 6.800911854103344,
"grad_norm": 0.5060295374260998,
"learning_rate": 1.0000835032165645e-07,
"loss": 0.1536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1658594310283661,
"step": 4475,
"valid_targets_mean": 4230.7,
"valid_targets_min": 915
},
{
"epoch": 6.808510638297872,
"grad_norm": 0.4466023053432,
"learning_rate": 9.258119246826625e-08,
"loss": 0.1447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1489754319190979,
"step": 4480,
"valid_targets_mean": 5316.6,
"valid_targets_min": 2627
},
{
"epoch": 6.816109422492401,
"grad_norm": 0.46338292936158193,
"learning_rate": 8.543992866534734e-08,
"loss": 0.1511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14392951130867004,
"step": 4485,
"valid_targets_mean": 4956.6,
"valid_targets_min": 409
},
{
"epoch": 6.823708206686931,
"grad_norm": 0.5158394667496263,
"learning_rate": 7.858466146988042e-08,
"loss": 0.1488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16497617959976196,
"step": 4490,
"valid_targets_mean": 4279.7,
"valid_targets_min": 775
},
{
"epoch": 6.831306990881459,
"grad_norm": 0.42417696152695383,
"learning_rate": 7.201548933160275e-08,
"loss": 0.1478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14127472043037415,
"step": 4495,
"valid_targets_mean": 5479.2,
"valid_targets_min": 2631
},
{
"epoch": 6.838905775075988,
"grad_norm": 0.5211912905058261,
"learning_rate": 6.573250659158481e-08,
"loss": 0.1543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14878888428211212,
"step": 4500,
"valid_targets_mean": 4435.9,
"valid_targets_min": 2412
},
{
"epoch": 6.8465045592705165,
"grad_norm": 0.43147229360794226,
"learning_rate": 5.973580348088259e-08,
"loss": 0.154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15211549401283264,
"step": 4505,
"valid_targets_mean": 5367.4,
"valid_targets_min": 2364
},
{
"epoch": 6.854103343465045,
"grad_norm": 0.4561025698955299,
"learning_rate": 5.4025466119234094e-08,
"loss": 0.152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13766488432884216,
"step": 4510,
"valid_targets_mean": 5133.6,
"valid_targets_min": 655
},
{
"epoch": 6.861702127659575,
"grad_norm": 0.4670200688124053,
"learning_rate": 4.860157651383146e-08,
"loss": 0.1457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12196432799100876,
"step": 4515,
"valid_targets_mean": 5354.1,
"valid_targets_min": 1941
},
{
"epoch": 6.869300911854103,
"grad_norm": 0.46811141014194185,
"learning_rate": 4.346421255813527e-08,
"loss": 0.1485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1508735716342926,
"step": 4520,
"valid_targets_mean": 4876.9,
"valid_targets_min": 647
},
{
"epoch": 6.876899696048632,
"grad_norm": 0.5309409348069238,
"learning_rate": 3.8613448030759836e-08,
"loss": 0.1449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1319991499185562,
"step": 4525,
"valid_targets_mean": 4153.0,
"valid_targets_min": 558
},
{
"epoch": 6.8844984802431615,
"grad_norm": 0.4583034610783906,
"learning_rate": 3.404935259441633e-08,
"loss": 0.1482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1385440230369568,
"step": 4530,
"valid_targets_mean": 5040.1,
"valid_targets_min": 666
},
{
"epoch": 6.89209726443769,
"grad_norm": 0.5760708842558298,
"learning_rate": 2.977199179490686e-08,
"loss": 0.152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16344650089740753,
"step": 4535,
"valid_targets_mean": 4789.9,
"valid_targets_min": 774
},
{
"epoch": 6.899696048632219,
"grad_norm": 0.5268446726565859,
"learning_rate": 2.5781427060183052e-08,
"loss": 0.1543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1606959104537964,
"step": 4540,
"valid_targets_mean": 4283.8,
"valid_targets_min": 229
},
{
"epoch": 6.907294832826747,
"grad_norm": 0.4734646023589767,
"learning_rate": 2.2077715699468928e-08,
"loss": 0.1558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14003373682498932,
"step": 4545,
"valid_targets_mean": 4974.8,
"valid_targets_min": 773
},
{
"epoch": 6.914893617021277,
"grad_norm": 0.4360796739556199,
"learning_rate": 1.8660910902434936e-08,
"loss": 0.1501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12974536418914795,
"step": 4550,
"valid_targets_mean": 5910.8,
"valid_targets_min": 1114
},
{
"epoch": 6.922492401215806,
"grad_norm": 0.48684145305746557,
"learning_rate": 1.5531061738436327e-08,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15198959410190582,
"step": 4555,
"valid_targets_mean": 3936.3,
"valid_targets_min": 1779
},
{
"epoch": 6.930091185410334,
"grad_norm": 0.5091294127835059,
"learning_rate": 1.2688213155802598e-08,
"loss": 0.1589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1628214567899704,
"step": 4560,
"valid_targets_mean": 4214.5,
"valid_targets_min": 683
},
{
"epoch": 6.937689969604863,
"grad_norm": 0.43005172219863,
"learning_rate": 1.0132405981195804e-08,
"loss": 0.1287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13487809896469116,
"step": 4565,
"valid_targets_mean": 5104.1,
"valid_targets_min": 2548
},
{
"epoch": 6.945288753799392,
"grad_norm": 0.5851616543398429,
"learning_rate": 7.863676919031005e-09,
"loss": 0.1459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13807334005832672,
"step": 4570,
"valid_targets_mean": 4572.6,
"valid_targets_min": 792
},
{
"epoch": 6.952887537993921,
"grad_norm": 0.5007425137471639,
"learning_rate": 5.882058550932268e-09,
"loss": 0.1427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1591353416442871,
"step": 4575,
"valid_targets_mean": 3956.2,
"valid_targets_min": 447
},
{
"epoch": 6.96048632218845,
"grad_norm": 0.5253135197553259,
"learning_rate": 4.187579335281911e-09,
"loss": 0.1618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16565826535224915,
"step": 4580,
"valid_targets_mean": 3869.7,
"valid_targets_min": 1117
},
{
"epoch": 6.968085106382979,
"grad_norm": 0.5136974200238252,
"learning_rate": 2.780263606805278e-09,
"loss": 0.1449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1372585892677307,
"step": 4585,
"valid_targets_mean": 4006.6,
"valid_targets_min": 538
},
{
"epoch": 6.975683890577508,
"grad_norm": 0.5478996499330996,
"learning_rate": 1.6601315762154735e-09,
"loss": 0.1487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1610221564769745,
"step": 4590,
"valid_targets_mean": 4602.3,
"valid_targets_min": 741
},
{
"epoch": 6.9832826747720365,
"grad_norm": 0.48873947966074016,
"learning_rate": 8.271993299358017e-10,
"loss": 0.169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16153308749198914,
"step": 4595,
"valid_targets_mean": 4922.5,
"valid_targets_min": 589
},
{
"epoch": 6.990881458966565,
"grad_norm": 0.484585895107589,
"learning_rate": 2.814788298532989e-10,
"loss": 0.1529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14617104828357697,
"step": 4600,
"valid_targets_mean": 4203.9,
"valid_targets_min": 714
},
{
"epoch": 6.998480243161094,
"grad_norm": 0.4567401537531439,
"learning_rate": 2.2977913158861444e-11,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15201044082641602,
"step": 4605,
"valid_targets_mean": 5189.9,
"valid_targets_min": 511
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1645904779434204,
"step": 4606,
"total_flos": 1702570888593408.0,
"train_loss": 0.19200077259858897,
"train_runtime": 28350.7795,
"train_samples_per_second": 2.597,
"train_steps_per_second": 0.162,
"valid_targets_mean": 3879.8,
"valid_targets_min": 728
}
],
"logging_steps": 5,
"max_steps": 4606,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1702570888593408.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}