a1-stack_rust / trainer_state.json
EtashGuha's picture
Upload folder using huggingface_hub
dfd2831 verified
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 4403,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.00794912559618442,
"grad_norm": 17.84746630996863,
"learning_rate": 3.6281179138322e-07,
"loss": 0.6173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6814424991607666,
"step": 5,
"valid_targets_mean": 4120.6,
"valid_targets_min": 293
},
{
"epoch": 0.01589825119236884,
"grad_norm": 17.156517918811076,
"learning_rate": 8.163265306122449e-07,
"loss": 0.6758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6257226467132568,
"step": 10,
"valid_targets_mean": 3674.1,
"valid_targets_min": 434
},
{
"epoch": 0.02384737678855326,
"grad_norm": 18.01419791342929,
"learning_rate": 1.26984126984127e-06,
"loss": 0.7098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7265408635139465,
"step": 15,
"valid_targets_mean": 3347.9,
"valid_targets_min": 619
},
{
"epoch": 0.03179650238473768,
"grad_norm": 11.167185739612897,
"learning_rate": 1.723356009070295e-06,
"loss": 0.6202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5243589282035828,
"step": 20,
"valid_targets_mean": 4327.7,
"valid_targets_min": 295
},
{
"epoch": 0.0397456279809221,
"grad_norm": 8.22954319900581,
"learning_rate": 2.17687074829932e-06,
"loss": 0.5494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5256298780441284,
"step": 25,
"valid_targets_mean": 3764.8,
"valid_targets_min": 1259
},
{
"epoch": 0.04769475357710652,
"grad_norm": 5.286623836409655,
"learning_rate": 2.6303854875283447e-06,
"loss": 0.5207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5739851593971252,
"step": 30,
"valid_targets_mean": 3315.1,
"valid_targets_min": 936
},
{
"epoch": 0.05564387917329094,
"grad_norm": 3.091625342947559,
"learning_rate": 3.08390022675737e-06,
"loss": 0.4249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46355006098747253,
"step": 35,
"valid_targets_mean": 3561.8,
"valid_targets_min": 557
},
{
"epoch": 0.06359300476947535,
"grad_norm": 1.6120343190128226,
"learning_rate": 3.537414965986395e-06,
"loss": 0.4443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.429388165473938,
"step": 40,
"valid_targets_mean": 4614.9,
"valid_targets_min": 834
},
{
"epoch": 0.07154213036565978,
"grad_norm": 1.1722091804408992,
"learning_rate": 3.99092970521542e-06,
"loss": 0.3702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38033077120780945,
"step": 45,
"valid_targets_mean": 4552.9,
"valid_targets_min": 606
},
{
"epoch": 0.0794912559618442,
"grad_norm": 1.2237202548885548,
"learning_rate": 4.444444444444444e-06,
"loss": 0.4028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39322787523269653,
"step": 50,
"valid_targets_mean": 2935.4,
"valid_targets_min": 654
},
{
"epoch": 0.08744038155802862,
"grad_norm": 0.9959193308010645,
"learning_rate": 4.897959183673469e-06,
"loss": 0.3929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3938031792640686,
"step": 55,
"valid_targets_mean": 3294.7,
"valid_targets_min": 357
},
{
"epoch": 0.09538950715421304,
"grad_norm": 0.7829705793426464,
"learning_rate": 5.3514739229024945e-06,
"loss": 0.3598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37601467967033386,
"step": 60,
"valid_targets_mean": 4138.0,
"valid_targets_min": 266
},
{
"epoch": 0.10333863275039745,
"grad_norm": 0.7891875286042732,
"learning_rate": 5.80498866213152e-06,
"loss": 0.3652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31892889738082886,
"step": 65,
"valid_targets_mean": 3174.8,
"valid_targets_min": 359
},
{
"epoch": 0.11128775834658187,
"grad_norm": 0.5962960338010875,
"learning_rate": 6.258503401360545e-06,
"loss": 0.336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2778470516204834,
"step": 70,
"valid_targets_mean": 4142.1,
"valid_targets_min": 917
},
{
"epoch": 0.1192368839427663,
"grad_norm": 0.6600711718977473,
"learning_rate": 6.71201814058957e-06,
"loss": 0.3393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32065966725349426,
"step": 75,
"valid_targets_mean": 3403.6,
"valid_targets_min": 836
},
{
"epoch": 0.1271860095389507,
"grad_norm": 0.5724896809709736,
"learning_rate": 7.165532879818595e-06,
"loss": 0.3093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3127829134464264,
"step": 80,
"valid_targets_mean": 3913.0,
"valid_targets_min": 241
},
{
"epoch": 0.13513513513513514,
"grad_norm": 0.6797026306142546,
"learning_rate": 7.61904761904762e-06,
"loss": 0.2941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32160434126853943,
"step": 85,
"valid_targets_mean": 3563.1,
"valid_targets_min": 262
},
{
"epoch": 0.14308426073131955,
"grad_norm": 0.7278883756953868,
"learning_rate": 8.072562358276645e-06,
"loss": 0.3035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3462420701980591,
"step": 90,
"valid_targets_mean": 2732.4,
"valid_targets_min": 755
},
{
"epoch": 0.151033386327504,
"grad_norm": 0.5708083904356873,
"learning_rate": 8.52607709750567e-06,
"loss": 0.3008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3244127333164215,
"step": 95,
"valid_targets_mean": 4137.4,
"valid_targets_min": 281
},
{
"epoch": 0.1589825119236884,
"grad_norm": 0.6276207848939579,
"learning_rate": 8.979591836734695e-06,
"loss": 0.3111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26650288701057434,
"step": 100,
"valid_targets_mean": 3918.8,
"valid_targets_min": 679
},
{
"epoch": 0.1669316375198728,
"grad_norm": 0.5159242585947521,
"learning_rate": 9.43310657596372e-06,
"loss": 0.2645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2642788887023926,
"step": 105,
"valid_targets_mean": 4179.4,
"valid_targets_min": 1342
},
{
"epoch": 0.17488076311605724,
"grad_norm": 0.507714398672033,
"learning_rate": 9.886621315192746e-06,
"loss": 0.2774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23547717928886414,
"step": 110,
"valid_targets_mean": 3923.2,
"valid_targets_min": 469
},
{
"epoch": 0.18282988871224165,
"grad_norm": 0.5564144664645884,
"learning_rate": 1.034013605442177e-05,
"loss": 0.2829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28326016664505005,
"step": 115,
"valid_targets_mean": 3575.0,
"valid_targets_min": 269
},
{
"epoch": 0.1907790143084261,
"grad_norm": 0.5695684791526006,
"learning_rate": 1.0793650793650794e-05,
"loss": 0.2816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26167941093444824,
"step": 120,
"valid_targets_mean": 3303.6,
"valid_targets_min": 641
},
{
"epoch": 0.1987281399046105,
"grad_norm": 0.5237201400320065,
"learning_rate": 1.124716553287982e-05,
"loss": 0.2548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28204721212387085,
"step": 125,
"valid_targets_mean": 4681.8,
"valid_targets_min": 569
},
{
"epoch": 0.2066772655007949,
"grad_norm": 0.49001217913037826,
"learning_rate": 1.1700680272108845e-05,
"loss": 0.2632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25121694803237915,
"step": 130,
"valid_targets_mean": 4638.6,
"valid_targets_min": 1821
},
{
"epoch": 0.21462639109697934,
"grad_norm": 0.5448380739456933,
"learning_rate": 1.215419501133787e-05,
"loss": 0.2657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24607300758361816,
"step": 135,
"valid_targets_mean": 3504.9,
"valid_targets_min": 673
},
{
"epoch": 0.22257551669316375,
"grad_norm": 0.5687526210815153,
"learning_rate": 1.2607709750566895e-05,
"loss": 0.2802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2677372694015503,
"step": 140,
"valid_targets_mean": 3854.4,
"valid_targets_min": 1329
},
{
"epoch": 0.23052464228934816,
"grad_norm": 0.6758185299669368,
"learning_rate": 1.3061224489795918e-05,
"loss": 0.2907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31545472145080566,
"step": 145,
"valid_targets_mean": 3157.5,
"valid_targets_min": 748
},
{
"epoch": 0.2384737678855326,
"grad_norm": 0.5061882696731755,
"learning_rate": 1.3514739229024945e-05,
"loss": 0.2698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2856583595275879,
"step": 150,
"valid_targets_mean": 4388.9,
"valid_targets_min": 478
},
{
"epoch": 0.246422893481717,
"grad_norm": 0.5014286356533292,
"learning_rate": 1.3968253968253968e-05,
"loss": 0.2456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2581082582473755,
"step": 155,
"valid_targets_mean": 4534.4,
"valid_targets_min": 891
},
{
"epoch": 0.2543720190779014,
"grad_norm": 0.45068416242985176,
"learning_rate": 1.4421768707482994e-05,
"loss": 0.2487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21287065744400024,
"step": 160,
"valid_targets_mean": 4851.8,
"valid_targets_min": 1754
},
{
"epoch": 0.26232114467408585,
"grad_norm": 0.47658632064664735,
"learning_rate": 1.4875283446712018e-05,
"loss": 0.251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22702300548553467,
"step": 165,
"valid_targets_mean": 4325.5,
"valid_targets_min": 343
},
{
"epoch": 0.2702702702702703,
"grad_norm": 0.5277022645179128,
"learning_rate": 1.5328798185941044e-05,
"loss": 0.2518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2435617595911026,
"step": 170,
"valid_targets_mean": 3762.1,
"valid_targets_min": 581
},
{
"epoch": 0.27821939586645467,
"grad_norm": 0.5760228675809232,
"learning_rate": 1.578231292517007e-05,
"loss": 0.2567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2474684715270996,
"step": 175,
"valid_targets_mean": 4084.1,
"valid_targets_min": 740
},
{
"epoch": 0.2861685214626391,
"grad_norm": 0.6439319078197573,
"learning_rate": 1.6235827664399097e-05,
"loss": 0.2544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3096400797367096,
"step": 180,
"valid_targets_mean": 2994.4,
"valid_targets_min": 273
},
{
"epoch": 0.29411764705882354,
"grad_norm": 0.5928535221147084,
"learning_rate": 1.668934240362812e-05,
"loss": 0.2349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24331536889076233,
"step": 185,
"valid_targets_mean": 3329.2,
"valid_targets_min": 714
},
{
"epoch": 0.302066772655008,
"grad_norm": 1.033627870156792,
"learning_rate": 1.7142857142857142e-05,
"loss": 0.2524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2561456561088562,
"step": 190,
"valid_targets_mean": 3033.4,
"valid_targets_min": 683
},
{
"epoch": 0.31001589825119236,
"grad_norm": 0.669117146581437,
"learning_rate": 1.759637188208617e-05,
"loss": 0.2329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26669400930404663,
"step": 195,
"valid_targets_mean": 3196.8,
"valid_targets_min": 279
},
{
"epoch": 0.3179650238473768,
"grad_norm": 0.5158072838218852,
"learning_rate": 1.8049886621315194e-05,
"loss": 0.2268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20886510610580444,
"step": 200,
"valid_targets_mean": 3514.2,
"valid_targets_min": 230
},
{
"epoch": 0.32591414944356123,
"grad_norm": 0.4417940976227962,
"learning_rate": 1.8503401360544218e-05,
"loss": 0.253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2474132776260376,
"step": 205,
"valid_targets_mean": 5143.9,
"valid_targets_min": 657
},
{
"epoch": 0.3338632750397456,
"grad_norm": 0.5669027262046396,
"learning_rate": 1.8956916099773243e-05,
"loss": 0.2495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2375866174697876,
"step": 210,
"valid_targets_mean": 4060.5,
"valid_targets_min": 787
},
{
"epoch": 0.34181240063593005,
"grad_norm": 0.5058043503905316,
"learning_rate": 1.941043083900227e-05,
"loss": 0.2531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21849530935287476,
"step": 215,
"valid_targets_mean": 4479.1,
"valid_targets_min": 871
},
{
"epoch": 0.3497615262321145,
"grad_norm": 0.7472969855667505,
"learning_rate": 1.9863945578231295e-05,
"loss": 0.2491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22537925839424133,
"step": 220,
"valid_targets_mean": 3716.9,
"valid_targets_min": 1008
},
{
"epoch": 0.35771065182829886,
"grad_norm": 0.4763106253774264,
"learning_rate": 2.031746031746032e-05,
"loss": 0.2318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22549283504486084,
"step": 225,
"valid_targets_mean": 4696.7,
"valid_targets_min": 1345
},
{
"epoch": 0.3656597774244833,
"grad_norm": 0.5870776260460628,
"learning_rate": 2.0770975056689343e-05,
"loss": 0.24,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2403266578912735,
"step": 230,
"valid_targets_mean": 3434.6,
"valid_targets_min": 659
},
{
"epoch": 0.37360890302066774,
"grad_norm": 0.5224207873951022,
"learning_rate": 2.122448979591837e-05,
"loss": 0.2284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20927098393440247,
"step": 235,
"valid_targets_mean": 3761.1,
"valid_targets_min": 233
},
{
"epoch": 0.3815580286168522,
"grad_norm": 0.5356608057317997,
"learning_rate": 2.1678004535147395e-05,
"loss": 0.2234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22495192289352417,
"step": 240,
"valid_targets_mean": 3884.0,
"valid_targets_min": 976
},
{
"epoch": 0.38950715421303655,
"grad_norm": 0.5368634114039467,
"learning_rate": 2.213151927437642e-05,
"loss": 0.2288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.202118381857872,
"step": 245,
"valid_targets_mean": 4109.8,
"valid_targets_min": 366
},
{
"epoch": 0.397456279809221,
"grad_norm": 0.5223166530343325,
"learning_rate": 2.2585034013605444e-05,
"loss": 0.2268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2209833413362503,
"step": 250,
"valid_targets_mean": 4501.5,
"valid_targets_min": 589
},
{
"epoch": 0.40540540540540543,
"grad_norm": 0.6182508332886121,
"learning_rate": 2.3038548752834472e-05,
"loss": 0.2349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25408124923706055,
"step": 255,
"valid_targets_mean": 3629.1,
"valid_targets_min": 601
},
{
"epoch": 0.4133545310015898,
"grad_norm": 0.5912718878361719,
"learning_rate": 2.3492063492063496e-05,
"loss": 0.24,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24555028975009918,
"step": 260,
"valid_targets_mean": 3606.7,
"valid_targets_min": 327
},
{
"epoch": 0.42130365659777425,
"grad_norm": 0.5750322104699228,
"learning_rate": 2.394557823129252e-05,
"loss": 0.2432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21299511194229126,
"step": 265,
"valid_targets_mean": 3439.4,
"valid_targets_min": 314
},
{
"epoch": 0.4292527821939587,
"grad_norm": 0.706039350107576,
"learning_rate": 2.439909297052154e-05,
"loss": 0.2283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22689072787761688,
"step": 270,
"valid_targets_mean": 2713.6,
"valid_targets_min": 614
},
{
"epoch": 0.43720190779014306,
"grad_norm": 0.4645382324491832,
"learning_rate": 2.4852607709750566e-05,
"loss": 0.2247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.186517596244812,
"step": 275,
"valid_targets_mean": 4288.1,
"valid_targets_min": 1067
},
{
"epoch": 0.4451510333863275,
"grad_norm": 0.5461367695964425,
"learning_rate": 2.5306122448979597e-05,
"loss": 0.2365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21831746399402618,
"step": 280,
"valid_targets_mean": 3579.9,
"valid_targets_min": 598
},
{
"epoch": 0.45310015898251194,
"grad_norm": 0.4657927124996843,
"learning_rate": 2.5759637188208618e-05,
"loss": 0.2041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1893748790025711,
"step": 285,
"valid_targets_mean": 4740.9,
"valid_targets_min": 1740
},
{
"epoch": 0.4610492845786963,
"grad_norm": 0.6348763363997716,
"learning_rate": 2.6213151927437642e-05,
"loss": 0.2334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19953399896621704,
"step": 290,
"valid_targets_mean": 2926.6,
"valid_targets_min": 542
},
{
"epoch": 0.46899841017488075,
"grad_norm": 0.625040649676204,
"learning_rate": 2.6666666666666667e-05,
"loss": 0.2139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24280428886413574,
"step": 295,
"valid_targets_mean": 3343.4,
"valid_targets_min": 699
},
{
"epoch": 0.4769475357710652,
"grad_norm": 0.6020091340791197,
"learning_rate": 2.7120181405895694e-05,
"loss": 0.2236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2328951060771942,
"step": 300,
"valid_targets_mean": 3270.6,
"valid_targets_min": 349
},
{
"epoch": 0.4848966613672496,
"grad_norm": 0.5774743472055955,
"learning_rate": 2.757369614512472e-05,
"loss": 0.2074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18854255974292755,
"step": 305,
"valid_targets_mean": 3489.1,
"valid_targets_min": 670
},
{
"epoch": 0.492845786963434,
"grad_norm": 0.5002918848960409,
"learning_rate": 2.8027210884353743e-05,
"loss": 0.1993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20658744871616364,
"step": 310,
"valid_targets_mean": 4087.5,
"valid_targets_min": 646
},
{
"epoch": 0.5007949125596184,
"grad_norm": 0.5258071361084128,
"learning_rate": 2.8480725623582767e-05,
"loss": 0.2287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26666340231895447,
"step": 315,
"valid_targets_mean": 4920.9,
"valid_targets_min": 711
},
{
"epoch": 0.5087440381558028,
"grad_norm": 0.5359657194543509,
"learning_rate": 2.893424036281179e-05,
"loss": 0.2231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2450794130563736,
"step": 320,
"valid_targets_mean": 4277.5,
"valid_targets_min": 811
},
{
"epoch": 0.5166931637519873,
"grad_norm": 0.47155499713480653,
"learning_rate": 2.938775510204082e-05,
"loss": 0.2315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22731101512908936,
"step": 325,
"valid_targets_mean": 4231.8,
"valid_targets_min": 649
},
{
"epoch": 0.5246422893481717,
"grad_norm": 0.5626140591094698,
"learning_rate": 2.9841269841269844e-05,
"loss": 0.2199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24118876457214355,
"step": 330,
"valid_targets_mean": 3969.8,
"valid_targets_min": 614
},
{
"epoch": 0.5325914149443561,
"grad_norm": 0.4432872807332565,
"learning_rate": 3.0294784580498868e-05,
"loss": 0.2225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19566431641578674,
"step": 335,
"valid_targets_mean": 4741.9,
"valid_targets_min": 601
},
{
"epoch": 0.5405405405405406,
"grad_norm": 0.938740381890964,
"learning_rate": 3.074829931972789e-05,
"loss": 0.2466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24197694659233093,
"step": 340,
"valid_targets_mean": 3894.6,
"valid_targets_min": 533
},
{
"epoch": 0.548489666136725,
"grad_norm": 0.5053259602931793,
"learning_rate": 3.1201814058956924e-05,
"loss": 0.2136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2000350058078766,
"step": 345,
"valid_targets_mean": 4115.1,
"valid_targets_min": 639
},
{
"epoch": 0.5564387917329093,
"grad_norm": 0.5110974452473003,
"learning_rate": 3.1655328798185945e-05,
"loss": 0.2078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20815539360046387,
"step": 350,
"valid_targets_mean": 4070.4,
"valid_targets_min": 1042
},
{
"epoch": 0.5643879173290938,
"grad_norm": 0.5374530089049312,
"learning_rate": 3.2108843537414965e-05,
"loss": 0.2073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19174043834209442,
"step": 355,
"valid_targets_mean": 3816.1,
"valid_targets_min": 481
},
{
"epoch": 0.5723370429252782,
"grad_norm": 0.5278680977737629,
"learning_rate": 3.256235827664399e-05,
"loss": 0.216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19281309843063354,
"step": 360,
"valid_targets_mean": 4304.8,
"valid_targets_min": 1126
},
{
"epoch": 0.5802861685214626,
"grad_norm": 0.5556493209390555,
"learning_rate": 3.3015873015873014e-05,
"loss": 0.2157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20964595675468445,
"step": 365,
"valid_targets_mean": 3496.3,
"valid_targets_min": 249
},
{
"epoch": 0.5882352941176471,
"grad_norm": 0.5099107198036154,
"learning_rate": 3.346938775510204e-05,
"loss": 0.2132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1972021907567978,
"step": 370,
"valid_targets_mean": 4024.8,
"valid_targets_min": 644
},
{
"epoch": 0.5961844197138315,
"grad_norm": 0.5259960559393442,
"learning_rate": 3.392290249433107e-05,
"loss": 0.2207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2222093790769577,
"step": 375,
"valid_targets_mean": 3776.1,
"valid_targets_min": 872
},
{
"epoch": 0.604133545310016,
"grad_norm": 0.5644984822926026,
"learning_rate": 3.437641723356009e-05,
"loss": 0.2339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1983184814453125,
"step": 380,
"valid_targets_mean": 3157.5,
"valid_targets_min": 273
},
{
"epoch": 0.6120826709062003,
"grad_norm": 0.526845185443891,
"learning_rate": 3.482993197278912e-05,
"loss": 0.2421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21050560474395752,
"step": 385,
"valid_targets_mean": 4162.3,
"valid_targets_min": 257
},
{
"epoch": 0.6200317965023847,
"grad_norm": 0.5111567928477996,
"learning_rate": 3.5283446712018146e-05,
"loss": 0.2188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2091737687587738,
"step": 390,
"valid_targets_mean": 4373.3,
"valid_targets_min": 1257
},
{
"epoch": 0.6279809220985691,
"grad_norm": 0.4792741938563976,
"learning_rate": 3.573696145124717e-05,
"loss": 0.2098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21705269813537598,
"step": 395,
"valid_targets_mean": 4804.3,
"valid_targets_min": 1353
},
{
"epoch": 0.6359300476947536,
"grad_norm": 0.5918892454757362,
"learning_rate": 3.6190476190476195e-05,
"loss": 0.2108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2312270998954773,
"step": 400,
"valid_targets_mean": 3560.3,
"valid_targets_min": 1152
},
{
"epoch": 0.643879173290938,
"grad_norm": 0.5068901074600425,
"learning_rate": 3.6643990929705216e-05,
"loss": 0.2062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1908341348171234,
"step": 405,
"valid_targets_mean": 3449.1,
"valid_targets_min": 261
},
{
"epoch": 0.6518282988871225,
"grad_norm": 0.5793934181213,
"learning_rate": 3.7097505668934243e-05,
"loss": 0.2184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1862396001815796,
"step": 410,
"valid_targets_mean": 2984.0,
"valid_targets_min": 636
},
{
"epoch": 0.6597774244833068,
"grad_norm": 0.5690118134642445,
"learning_rate": 3.755102040816327e-05,
"loss": 0.2236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23144859075546265,
"step": 415,
"valid_targets_mean": 4501.0,
"valid_targets_min": 1604
},
{
"epoch": 0.6677265500794912,
"grad_norm": 0.5776584245877077,
"learning_rate": 3.800453514739229e-05,
"loss": 0.2179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21334588527679443,
"step": 420,
"valid_targets_mean": 3043.1,
"valid_targets_min": 277
},
{
"epoch": 0.6756756756756757,
"grad_norm": 0.4713962722172494,
"learning_rate": 3.845804988662132e-05,
"loss": 0.2073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.193765789270401,
"step": 425,
"valid_targets_mean": 4792.8,
"valid_targets_min": 1292
},
{
"epoch": 0.6836248012718601,
"grad_norm": 0.43246949767784015,
"learning_rate": 3.891156462585034e-05,
"loss": 0.2252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1918296366930008,
"step": 430,
"valid_targets_mean": 5232.2,
"valid_targets_min": 818
},
{
"epoch": 0.6915739268680445,
"grad_norm": 0.6617748262724793,
"learning_rate": 3.936507936507937e-05,
"loss": 0.2175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21801866590976715,
"step": 435,
"valid_targets_mean": 2876.1,
"valid_targets_min": 1104
},
{
"epoch": 0.699523052464229,
"grad_norm": 0.5970309098523798,
"learning_rate": 3.9818594104308396e-05,
"loss": 0.2228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21752095222473145,
"step": 440,
"valid_targets_mean": 3932.8,
"valid_targets_min": 813
},
{
"epoch": 0.7074721780604134,
"grad_norm": 0.5161262404357317,
"learning_rate": 3.999994341346418e-05,
"loss": 0.2103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.221147358417511,
"step": 445,
"valid_targets_mean": 3660.2,
"valid_targets_min": 736
},
{
"epoch": 0.7154213036565977,
"grad_norm": 0.5628100325252552,
"learning_rate": 3.999959760801596e-05,
"loss": 0.2175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2509196400642395,
"step": 450,
"valid_targets_mean": 3745.4,
"valid_targets_min": 668
},
{
"epoch": 0.7233704292527822,
"grad_norm": 0.4798788268427838,
"learning_rate": 3.999893743951281e-05,
"loss": 0.2223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.249254047870636,
"step": 455,
"valid_targets_mean": 4542.9,
"valid_targets_min": 675
},
{
"epoch": 0.7313195548489666,
"grad_norm": 0.5152240231525378,
"learning_rate": 3.9997962918331554e-05,
"loss": 0.1942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19418257474899292,
"step": 460,
"valid_targets_mean": 3978.0,
"valid_targets_min": 678
},
{
"epoch": 0.739268680445151,
"grad_norm": 0.5512712084043713,
"learning_rate": 3.999667405979019e-05,
"loss": 0.204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20612534880638123,
"step": 465,
"valid_targets_mean": 2988.6,
"valid_targets_min": 618
},
{
"epoch": 0.7472178060413355,
"grad_norm": 0.7851942416001637,
"learning_rate": 3.9995070884147604e-05,
"loss": 0.2296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22632327675819397,
"step": 470,
"valid_targets_mean": 3359.4,
"valid_targets_min": 968
},
{
"epoch": 0.7551669316375199,
"grad_norm": 0.5537518840736152,
"learning_rate": 3.999315341660325e-05,
"loss": 0.2036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21473893523216248,
"step": 475,
"valid_targets_mean": 3244.5,
"valid_targets_min": 581
},
{
"epoch": 0.7631160572337043,
"grad_norm": 0.5088365488324662,
"learning_rate": 3.9990921687296785e-05,
"loss": 0.219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21233266592025757,
"step": 480,
"valid_targets_mean": 4417.6,
"valid_targets_min": 673
},
{
"epoch": 0.7710651828298887,
"grad_norm": 0.5591275224242683,
"learning_rate": 3.998837573130758e-05,
"loss": 0.2236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23937103152275085,
"step": 485,
"valid_targets_mean": 3575.7,
"valid_targets_min": 534
},
{
"epoch": 0.7790143084260731,
"grad_norm": 0.41500354568791326,
"learning_rate": 3.9985515588654166e-05,
"loss": 0.2215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19625945389270782,
"step": 490,
"valid_targets_mean": 4809.2,
"valid_targets_min": 2182
},
{
"epoch": 0.7869634340222575,
"grad_norm": 0.5197016278046811,
"learning_rate": 3.99823413042936e-05,
"loss": 0.1907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16841718554496765,
"step": 495,
"valid_targets_mean": 3910.1,
"valid_targets_min": 1124
},
{
"epoch": 0.794912559618442,
"grad_norm": 0.42605527843070085,
"learning_rate": 3.997885292812078e-05,
"loss": 0.2098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21589577198028564,
"step": 500,
"valid_targets_mean": 5083.4,
"valid_targets_min": 631
},
{
"epoch": 0.8028616852146264,
"grad_norm": 0.6563615392059224,
"learning_rate": 3.997505051496764e-05,
"loss": 0.2244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.269468754529953,
"step": 505,
"valid_targets_mean": 3249.7,
"valid_targets_min": 612
},
{
"epoch": 0.8108108108108109,
"grad_norm": 0.511370927432411,
"learning_rate": 3.997093412460229e-05,
"loss": 0.2204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23530468344688416,
"step": 510,
"valid_targets_mean": 4039.5,
"valid_targets_min": 671
},
{
"epoch": 0.8187599364069952,
"grad_norm": 0.46207600265174703,
"learning_rate": 3.9966503821728074e-05,
"loss": 0.1981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18872712552547455,
"step": 515,
"valid_targets_mean": 3918.5,
"valid_targets_min": 911
},
{
"epoch": 0.8267090620031796,
"grad_norm": 0.518466058860564,
"learning_rate": 3.996175967598258e-05,
"loss": 0.2271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.258210152387619,
"step": 520,
"valid_targets_mean": 3838.6,
"valid_targets_min": 509
},
{
"epoch": 0.834658187599364,
"grad_norm": 0.5496770684162091,
"learning_rate": 3.995670176193651e-05,
"loss": 0.2042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1955585479736328,
"step": 525,
"valid_targets_mean": 3015.4,
"valid_targets_min": 601
},
{
"epoch": 0.8426073131955485,
"grad_norm": 0.5141119419529661,
"learning_rate": 3.9951330159092554e-05,
"loss": 0.2077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1896553933620453,
"step": 530,
"valid_targets_mean": 3632.0,
"valid_targets_min": 235
},
{
"epoch": 0.8505564387917329,
"grad_norm": 0.6019780534491145,
"learning_rate": 3.994564495188405e-05,
"loss": 0.2028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19973322749137878,
"step": 535,
"valid_targets_mean": 3989.1,
"valid_targets_min": 545
},
{
"epoch": 0.8585055643879174,
"grad_norm": 0.43954090925747025,
"learning_rate": 3.9939646229673775e-05,
"loss": 0.2075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1840040683746338,
"step": 540,
"valid_targets_mean": 4522.1,
"valid_targets_min": 1633
},
{
"epoch": 0.8664546899841018,
"grad_norm": 0.5977708417760155,
"learning_rate": 3.993333408675244e-05,
"loss": 0.1873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20497910678386688,
"step": 545,
"valid_targets_mean": 2984.9,
"valid_targets_min": 656
},
{
"epoch": 0.8744038155802861,
"grad_norm": 0.4757849711588045,
"learning_rate": 3.9926708622337285e-05,
"loss": 0.214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24841903150081635,
"step": 550,
"valid_targets_mean": 4137.8,
"valid_targets_min": 556
},
{
"epoch": 0.8823529411764706,
"grad_norm": 0.4822074195433229,
"learning_rate": 3.991976994057046e-05,
"loss": 0.1943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1875840723514557,
"step": 555,
"valid_targets_mean": 4260.8,
"valid_targets_min": 1101
},
{
"epoch": 0.890302066772655,
"grad_norm": 0.5842684547912087,
"learning_rate": 3.991251815051741e-05,
"loss": 0.2006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19977149367332458,
"step": 560,
"valid_targets_mean": 2972.9,
"valid_targets_min": 534
},
{
"epoch": 0.8982511923688394,
"grad_norm": 0.652464883044752,
"learning_rate": 3.990495336616519e-05,
"loss": 0.2,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20372867584228516,
"step": 565,
"valid_targets_mean": 3338.4,
"valid_targets_min": 622
},
{
"epoch": 0.9062003179650239,
"grad_norm": 0.6216148839044923,
"learning_rate": 3.989707570642062e-05,
"loss": 0.204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19672566652297974,
"step": 570,
"valid_targets_mean": 3842.1,
"valid_targets_min": 1334
},
{
"epoch": 0.9141494435612083,
"grad_norm": 0.5103176135370198,
"learning_rate": 3.988888529510844e-05,
"loss": 0.2139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20896919071674347,
"step": 575,
"valid_targets_mean": 3890.2,
"valid_targets_min": 679
},
{
"epoch": 0.9220985691573926,
"grad_norm": 0.5595134395559079,
"learning_rate": 3.988038226096939e-05,
"loss": 0.2112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2230646163225174,
"step": 580,
"valid_targets_mean": 3206.8,
"valid_targets_min": 255
},
{
"epoch": 0.9300476947535771,
"grad_norm": 0.46172488073234735,
"learning_rate": 3.9871566737658144e-05,
"loss": 0.1983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17313021421432495,
"step": 585,
"valid_targets_mean": 3876.9,
"valid_targets_min": 734
},
{
"epoch": 0.9379968203497615,
"grad_norm": 0.4500918322083041,
"learning_rate": 3.986243886374124e-05,
"loss": 0.2054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1883338987827301,
"step": 590,
"valid_targets_mean": 4360.1,
"valid_targets_min": 729
},
{
"epoch": 0.9459459459459459,
"grad_norm": 0.46535487326329783,
"learning_rate": 3.985299878269486e-05,
"loss": 0.21,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.238117516040802,
"step": 595,
"valid_targets_mean": 4255.5,
"valid_targets_min": 1384
},
{
"epoch": 0.9538950715421304,
"grad_norm": 0.49612437665460657,
"learning_rate": 3.9843246642902646e-05,
"loss": 0.1927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22181783616542816,
"step": 600,
"valid_targets_mean": 3831.8,
"valid_targets_min": 305
},
{
"epoch": 0.9618441971383148,
"grad_norm": 0.48706304600729844,
"learning_rate": 3.98331825976533e-05,
"loss": 0.2202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1820496767759323,
"step": 605,
"valid_targets_mean": 3962.2,
"valid_targets_min": 960
},
{
"epoch": 0.9697933227344993,
"grad_norm": 0.4308975740551794,
"learning_rate": 3.98228068051382e-05,
"loss": 0.2069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21952344477176666,
"step": 610,
"valid_targets_mean": 5032.3,
"valid_targets_min": 2134
},
{
"epoch": 0.9777424483306836,
"grad_norm": 0.5474648098644498,
"learning_rate": 3.9812119428448926e-05,
"loss": 0.1955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20172721147537231,
"step": 615,
"valid_targets_mean": 3203.3,
"valid_targets_min": 588
},
{
"epoch": 0.985691573926868,
"grad_norm": 0.4453809222709813,
"learning_rate": 3.9801120635574664e-05,
"loss": 0.1876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1718732863664627,
"step": 620,
"valid_targets_mean": 3914.3,
"valid_targets_min": 560
},
{
"epoch": 0.9936406995230525,
"grad_norm": 0.5334825618659923,
"learning_rate": 3.978981059939961e-05,
"loss": 0.1914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20379891991615295,
"step": 625,
"valid_targets_mean": 3863.4,
"valid_targets_min": 619
},
{
"epoch": 1.0015898251192368,
"grad_norm": 0.5529835485096336,
"learning_rate": 3.977818949770022e-05,
"loss": 0.1867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2112482190132141,
"step": 630,
"valid_targets_mean": 3267.1,
"valid_targets_min": 308
},
{
"epoch": 1.0095389507154213,
"grad_norm": 0.5122916288062801,
"learning_rate": 3.976625751314241e-05,
"loss": 0.1839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2054670751094818,
"step": 635,
"valid_targets_mean": 4767.6,
"valid_targets_min": 908
},
{
"epoch": 1.0174880763116056,
"grad_norm": 0.5068393688463881,
"learning_rate": 3.975401483327871e-05,
"loss": 0.186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1859699785709381,
"step": 640,
"valid_targets_mean": 3215.8,
"valid_targets_min": 691
},
{
"epoch": 1.0254372019077902,
"grad_norm": 0.4145850767881214,
"learning_rate": 3.974146165054532e-05,
"loss": 0.1918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2187093198299408,
"step": 645,
"valid_targets_mean": 4994.4,
"valid_targets_min": 1438
},
{
"epoch": 1.0333863275039745,
"grad_norm": 0.4582537603183787,
"learning_rate": 3.972859816225904e-05,
"loss": 0.193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1593848317861557,
"step": 650,
"valid_targets_mean": 3891.4,
"valid_targets_min": 297
},
{
"epoch": 1.041335453100159,
"grad_norm": 0.4567275257490204,
"learning_rate": 3.97154245706142e-05,
"loss": 0.1871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18935450911521912,
"step": 655,
"valid_targets_mean": 4475.3,
"valid_targets_min": 560
},
{
"epoch": 1.0492845786963434,
"grad_norm": 0.5140859045337463,
"learning_rate": 3.970194108267952e-05,
"loss": 0.1901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18552550673484802,
"step": 660,
"valid_targets_mean": 3475.7,
"valid_targets_min": 240
},
{
"epoch": 1.0572337042925277,
"grad_norm": 0.40778078731763423,
"learning_rate": 3.968814791039477e-05,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18175040185451508,
"step": 665,
"valid_targets_mean": 4828.3,
"valid_targets_min": 781
},
{
"epoch": 1.0651828298887123,
"grad_norm": 0.5263082294572751,
"learning_rate": 3.967404527056751e-05,
"loss": 0.2161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25833356380462646,
"step": 670,
"valid_targets_mean": 4129.8,
"valid_targets_min": 604
},
{
"epoch": 1.0731319554848966,
"grad_norm": 0.4960768768163948,
"learning_rate": 3.9659633384869626e-05,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17353063821792603,
"step": 675,
"valid_targets_mean": 4446.4,
"valid_targets_min": 1213
},
{
"epoch": 1.0810810810810811,
"grad_norm": 0.48100083595612203,
"learning_rate": 3.964491247983392e-05,
"loss": 0.2005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1870320737361908,
"step": 680,
"valid_targets_mean": 3895.7,
"valid_targets_min": 605
},
{
"epoch": 1.0890302066772655,
"grad_norm": 0.61106090311707,
"learning_rate": 3.962988278685047e-05,
"loss": 0.1949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19367003440856934,
"step": 685,
"valid_targets_mean": 3629.8,
"valid_targets_min": 369
},
{
"epoch": 1.09697933227345,
"grad_norm": 0.4365754632817891,
"learning_rate": 3.961454454216305e-05,
"loss": 0.197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19389833509922028,
"step": 690,
"valid_targets_mean": 4258.8,
"valid_targets_min": 197
},
{
"epoch": 1.1049284578696343,
"grad_norm": 0.5262716250941029,
"learning_rate": 3.9598897986865364e-05,
"loss": 0.1979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19017469882965088,
"step": 695,
"valid_targets_mean": 3231.6,
"valid_targets_min": 628
},
{
"epoch": 1.1128775834658187,
"grad_norm": 0.49861602576948466,
"learning_rate": 3.9582943366897316e-05,
"loss": 0.1909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1815868318080902,
"step": 700,
"valid_targets_mean": 3687.8,
"valid_targets_min": 510
},
{
"epoch": 1.1208267090620032,
"grad_norm": 0.48175933314623326,
"learning_rate": 3.956668093304112e-05,
"loss": 0.1856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1780034601688385,
"step": 705,
"valid_targets_mean": 4006.3,
"valid_targets_min": 824
},
{
"epoch": 1.1287758346581875,
"grad_norm": 0.5179802897696733,
"learning_rate": 3.9550110940917313e-05,
"loss": 0.198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20583273470401764,
"step": 710,
"valid_targets_mean": 3334.9,
"valid_targets_min": 598
},
{
"epoch": 1.136724960254372,
"grad_norm": 0.4267427875463337,
"learning_rate": 3.953323365098082e-05,
"loss": 0.188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18678268790245056,
"step": 715,
"valid_targets_mean": 4681.6,
"valid_targets_min": 1042
},
{
"epoch": 1.1446740858505564,
"grad_norm": 0.4891452481904024,
"learning_rate": 3.9516049328516795e-05,
"loss": 0.2026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19785034656524658,
"step": 720,
"valid_targets_mean": 4126.4,
"valid_targets_min": 524
},
{
"epoch": 1.1526232114467407,
"grad_norm": 0.5279349481342677,
"learning_rate": 3.949855824363647e-05,
"loss": 0.1818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19800621271133423,
"step": 725,
"valid_targets_mean": 3239.9,
"valid_targets_min": 846
},
{
"epoch": 1.1605723370429253,
"grad_norm": 0.8095806249907248,
"learning_rate": 3.948076067127294e-05,
"loss": 0.19,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17679157853126526,
"step": 730,
"valid_targets_mean": 3760.4,
"valid_targets_min": 352
},
{
"epoch": 1.1685214626391096,
"grad_norm": 0.7153084766269169,
"learning_rate": 3.946265689117677e-05,
"loss": 0.1968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1971210539340973,
"step": 735,
"valid_targets_mean": 2638.4,
"valid_targets_min": 787
},
{
"epoch": 1.1764705882352942,
"grad_norm": 0.4535582899393148,
"learning_rate": 3.944424718791169e-05,
"loss": 0.1822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16410158574581146,
"step": 740,
"valid_targets_mean": 3738.6,
"valid_targets_min": 1269
},
{
"epoch": 1.1844197138314785,
"grad_norm": 0.47691889948518285,
"learning_rate": 3.942553185085003e-05,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19451865553855896,
"step": 745,
"valid_targets_mean": 3723.2,
"valid_targets_min": 502
},
{
"epoch": 1.192368839427663,
"grad_norm": 0.4783725873079702,
"learning_rate": 3.940651117416824e-05,
"loss": 0.1862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17500782012939453,
"step": 750,
"valid_targets_mean": 3733.9,
"valid_targets_min": 375
},
{
"epoch": 1.2003179650238474,
"grad_norm": 0.45013056800116047,
"learning_rate": 3.9387185456842247e-05,
"loss": 0.1957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1873418688774109,
"step": 755,
"valid_targets_mean": 4532.6,
"valid_targets_min": 649
},
{
"epoch": 1.2082670906200317,
"grad_norm": 0.4513636003405965,
"learning_rate": 3.936755500264274e-05,
"loss": 0.1972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19119738042354584,
"step": 760,
"valid_targets_mean": 3633.2,
"valid_targets_min": 614
},
{
"epoch": 1.2162162162162162,
"grad_norm": 0.43039183768805145,
"learning_rate": 3.9347620120130384e-05,
"loss": 0.1853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19387167692184448,
"step": 765,
"valid_targets_mean": 5013.5,
"valid_targets_min": 671
},
{
"epoch": 1.2241653418124006,
"grad_norm": 0.5545872512419363,
"learning_rate": 3.932738112265103e-05,
"loss": 0.2052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1966329962015152,
"step": 770,
"valid_targets_mean": 3744.9,
"valid_targets_min": 295
},
{
"epoch": 1.232114467408585,
"grad_norm": 0.44088445810305865,
"learning_rate": 3.930683832833073e-05,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1997533142566681,
"step": 775,
"valid_targets_mean": 4225.8,
"valid_targets_min": 1304
},
{
"epoch": 1.2400635930047694,
"grad_norm": 0.5628393929224067,
"learning_rate": 3.928599206007076e-05,
"loss": 0.1894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16368547081947327,
"step": 780,
"valid_targets_mean": 4202.9,
"valid_targets_min": 245
},
{
"epoch": 1.248012718600954,
"grad_norm": 0.5044797716972268,
"learning_rate": 3.926484264554253e-05,
"loss": 0.1978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2036869078874588,
"step": 785,
"valid_targets_mean": 3405.1,
"valid_targets_min": 656
},
{
"epoch": 1.2559618441971383,
"grad_norm": 0.5129578399604017,
"learning_rate": 3.924339041718247e-05,
"loss": 0.2047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19128306210041046,
"step": 790,
"valid_targets_mean": 3456.4,
"valid_targets_min": 658
},
{
"epoch": 1.2639109697933226,
"grad_norm": 0.563159848952125,
"learning_rate": 3.922163571218676e-05,
"loss": 0.1901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2012992799282074,
"step": 795,
"valid_targets_mean": 3187.4,
"valid_targets_min": 987
},
{
"epoch": 1.2718600953895072,
"grad_norm": 0.6173273492357961,
"learning_rate": 3.919957887250606e-05,
"loss": 0.2051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22333335876464844,
"step": 800,
"valid_targets_mean": 2847.9,
"valid_targets_min": 630
},
{
"epoch": 1.2798092209856915,
"grad_norm": 0.44827689109710595,
"learning_rate": 3.917722024484011e-05,
"loss": 0.1978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18572327494621277,
"step": 805,
"valid_targets_mean": 4246.1,
"valid_targets_min": 621
},
{
"epoch": 1.287758346581876,
"grad_norm": 0.6751673561517912,
"learning_rate": 3.915456018063232e-05,
"loss": 0.1854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20056423544883728,
"step": 810,
"valid_targets_mean": 2438.5,
"valid_targets_min": 225
},
{
"epoch": 1.2957074721780604,
"grad_norm": 0.7720325184700507,
"learning_rate": 3.9131599036064204e-05,
"loss": 0.1921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1767432987689972,
"step": 815,
"valid_targets_mean": 3982.4,
"valid_targets_min": 669
},
{
"epoch": 1.303656597774245,
"grad_norm": 0.4366411337881234,
"learning_rate": 3.9108337172049794e-05,
"loss": 0.187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21016202867031097,
"step": 820,
"valid_targets_mean": 4805.6,
"valid_targets_min": 1425
},
{
"epoch": 1.3116057233704292,
"grad_norm": 0.5069327068809399,
"learning_rate": 3.908477495422998e-05,
"loss": 0.1969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19924074411392212,
"step": 825,
"valid_targets_mean": 3997.4,
"valid_targets_min": 286
},
{
"epoch": 1.3195548489666136,
"grad_norm": 0.445873116262987,
"learning_rate": 3.906091275296676e-05,
"loss": 0.1923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17496737837791443,
"step": 830,
"valid_targets_mean": 4272.1,
"valid_targets_min": 1011
},
{
"epoch": 1.3275039745627981,
"grad_norm": 0.9206148708023212,
"learning_rate": 3.903675094333739e-05,
"loss": 0.1951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2181253880262375,
"step": 835,
"valid_targets_mean": 3913.7,
"valid_targets_min": 702
},
{
"epoch": 1.3354531001589824,
"grad_norm": 0.5133359649094603,
"learning_rate": 3.901228990512854e-05,
"loss": 0.1987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2114499807357788,
"step": 840,
"valid_targets_mean": 3686.8,
"valid_targets_min": 308
},
{
"epoch": 1.343402225755167,
"grad_norm": 0.4696592099080785,
"learning_rate": 3.898753002283027e-05,
"loss": 0.1998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.209947407245636,
"step": 845,
"valid_targets_mean": 3526.2,
"valid_targets_min": 619
},
{
"epoch": 1.3513513513513513,
"grad_norm": 0.5149647286915602,
"learning_rate": 3.896247168563004e-05,
"loss": 0.21,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22973836958408356,
"step": 850,
"valid_targets_mean": 4359.3,
"valid_targets_min": 1080
},
{
"epoch": 1.3593004769475359,
"grad_norm": 0.45847358766247315,
"learning_rate": 3.8937115287406524e-05,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20062896609306335,
"step": 855,
"valid_targets_mean": 4928.5,
"valid_targets_min": 434
},
{
"epoch": 1.3672496025437202,
"grad_norm": 0.5460254266383082,
"learning_rate": 3.891146122672349e-05,
"loss": 0.1994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20617523789405823,
"step": 860,
"valid_targets_mean": 3505.1,
"valid_targets_min": 904
},
{
"epoch": 1.3751987281399045,
"grad_norm": 0.5461178071898645,
"learning_rate": 3.8885509906823496e-05,
"loss": 0.1807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19545643031597137,
"step": 865,
"valid_targets_mean": 3159.5,
"valid_targets_min": 1402
},
{
"epoch": 1.383147853736089,
"grad_norm": 0.4558363745882089,
"learning_rate": 3.885926173562157e-05,
"loss": 0.1785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18399888277053833,
"step": 870,
"valid_targets_mean": 3677.1,
"valid_targets_min": 309
},
{
"epoch": 1.3910969793322734,
"grad_norm": 0.3899280590888697,
"learning_rate": 3.883271712569875e-05,
"loss": 0.1944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20818111300468445,
"step": 875,
"valid_targets_mean": 5354.6,
"valid_targets_min": 1826
},
{
"epoch": 1.399046104928458,
"grad_norm": 0.4639547086845976,
"learning_rate": 3.8805876494295694e-05,
"loss": 0.1802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17379283905029297,
"step": 880,
"valid_targets_mean": 4342.3,
"valid_targets_min": 735
},
{
"epoch": 1.4069952305246423,
"grad_norm": 0.39181296096344126,
"learning_rate": 3.877874026330602e-05,
"loss": 0.1913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15908557176589966,
"step": 885,
"valid_targets_mean": 4897.9,
"valid_targets_min": 592
},
{
"epoch": 1.4149443561208268,
"grad_norm": 0.4132604124999311,
"learning_rate": 3.875130885926973e-05,
"loss": 0.1866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18337678909301758,
"step": 890,
"valid_targets_mean": 4757.7,
"valid_targets_min": 330
},
{
"epoch": 1.4228934817170111,
"grad_norm": 0.5105514719522013,
"learning_rate": 3.872358271336651e-05,
"loss": 0.1837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19865591824054718,
"step": 895,
"valid_targets_mean": 3313.8,
"valid_targets_min": 487
},
{
"epoch": 1.4308426073131955,
"grad_norm": 0.5235070348886672,
"learning_rate": 3.8695562261408915e-05,
"loss": 0.2151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1919848918914795,
"step": 900,
"valid_targets_mean": 2859.2,
"valid_targets_min": 549
},
{
"epoch": 1.43879173290938,
"grad_norm": 0.47312190085140265,
"learning_rate": 3.8667247943835555e-05,
"loss": 0.1944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20830847322940826,
"step": 905,
"valid_targets_mean": 4533.8,
"valid_targets_min": 727
},
{
"epoch": 1.4467408585055643,
"grad_norm": 0.5175775434248544,
"learning_rate": 3.863864020570414e-05,
"loss": 0.1871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19121363759040833,
"step": 910,
"valid_targets_mean": 3036.8,
"valid_targets_min": 699
},
{
"epoch": 1.4546899841017489,
"grad_norm": 0.5781223268494494,
"learning_rate": 3.860973949668454e-05,
"loss": 0.1924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20266948640346527,
"step": 915,
"valid_targets_mean": 2671.8,
"valid_targets_min": 254
},
{
"epoch": 1.4626391096979332,
"grad_norm": 0.4567922909167134,
"learning_rate": 3.8580546271051634e-05,
"loss": 0.1908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18493634462356567,
"step": 920,
"valid_targets_mean": 4128.1,
"valid_targets_min": 282
},
{
"epoch": 1.4705882352941178,
"grad_norm": 0.47418699448382096,
"learning_rate": 3.8551060987678236e-05,
"loss": 0.1856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18517082929611206,
"step": 925,
"valid_targets_mean": 3606.5,
"valid_targets_min": 694
},
{
"epoch": 1.478537360890302,
"grad_norm": 0.4220236091213908,
"learning_rate": 3.852128411002787e-05,
"loss": 0.1909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19654536247253418,
"step": 930,
"valid_targets_mean": 5133.6,
"valid_targets_min": 670
},
{
"epoch": 1.4864864864864864,
"grad_norm": 0.4573542025228096,
"learning_rate": 3.849121610614745e-05,
"loss": 0.2062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21628251671791077,
"step": 935,
"valid_targets_mean": 4146.7,
"valid_targets_min": 590
},
{
"epoch": 1.494435612082671,
"grad_norm": 0.455624363723731,
"learning_rate": 3.8460857448659975e-05,
"loss": 0.1815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16024024784564972,
"step": 940,
"valid_targets_mean": 3990.5,
"valid_targets_min": 534
},
{
"epoch": 1.5023847376788553,
"grad_norm": 0.8397075238280883,
"learning_rate": 3.8430208614757044e-05,
"loss": 0.1914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19728557765483856,
"step": 945,
"valid_targets_mean": 3193.9,
"valid_targets_min": 1069
},
{
"epoch": 1.5103338632750396,
"grad_norm": 0.6455640246915216,
"learning_rate": 3.8399270086191425e-05,
"loss": 0.1831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18609043955802917,
"step": 950,
"valid_targets_mean": 3671.4,
"valid_targets_min": 598
},
{
"epoch": 1.5182829888712241,
"grad_norm": 0.4393679011147717,
"learning_rate": 3.8368042349269405e-05,
"loss": 0.1931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18841350078582764,
"step": 955,
"valid_targets_mean": 4189.6,
"valid_targets_min": 1160
},
{
"epoch": 1.5262321144674087,
"grad_norm": 0.4748654125112523,
"learning_rate": 3.83365258948432e-05,
"loss": 0.1856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18544679880142212,
"step": 960,
"valid_targets_mean": 4059.8,
"valid_targets_min": 537
},
{
"epoch": 1.534181240063593,
"grad_norm": 0.44195423356853586,
"learning_rate": 3.830472121830323e-05,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17977693676948547,
"step": 965,
"valid_targets_mean": 4036.9,
"valid_targets_min": 719
},
{
"epoch": 1.5421303656597773,
"grad_norm": 0.4190445460085609,
"learning_rate": 3.82726288195703e-05,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15075984597206116,
"step": 970,
"valid_targets_mean": 3788.1,
"valid_targets_min": 919
},
{
"epoch": 1.550079491255962,
"grad_norm": 0.38824323345082057,
"learning_rate": 3.824024920308781e-05,
"loss": 0.1886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16938742995262146,
"step": 975,
"valid_targets_mean": 4616.4,
"valid_targets_min": 617
},
{
"epoch": 1.5580286168521462,
"grad_norm": 0.4803671121375321,
"learning_rate": 3.820758287781374e-05,
"loss": 0.191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21928074955940247,
"step": 980,
"valid_targets_mean": 4322.5,
"valid_targets_min": 693
},
{
"epoch": 1.5659777424483305,
"grad_norm": 0.4853782041831188,
"learning_rate": 3.8174630357212714e-05,
"loss": 0.1964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17328375577926636,
"step": 985,
"valid_targets_mean": 4317.4,
"valid_targets_min": 690
},
{
"epoch": 1.573926868044515,
"grad_norm": 0.47169665339515204,
"learning_rate": 3.8141392159247905e-05,
"loss": 0.1977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21782585978507996,
"step": 990,
"valid_targets_mean": 3688.9,
"valid_targets_min": 636
},
{
"epoch": 1.5818759936406996,
"grad_norm": 0.4690651486120993,
"learning_rate": 3.81078688063729e-05,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19451123476028442,
"step": 995,
"valid_targets_mean": 3713.2,
"valid_targets_min": 281
},
{
"epoch": 1.589825119236884,
"grad_norm": 0.4346450046592069,
"learning_rate": 3.807406082552348e-05,
"loss": 0.1835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16455082595348358,
"step": 1000,
"valid_targets_mean": 3809.7,
"valid_targets_min": 260
},
{
"epoch": 1.5977742448330683,
"grad_norm": 0.41932684002795517,
"learning_rate": 3.803996874810934e-05,
"loss": 0.1848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17046436667442322,
"step": 1005,
"valid_targets_mean": 4024.4,
"valid_targets_min": 273
},
{
"epoch": 1.6057233704292528,
"grad_norm": 0.3705151557622996,
"learning_rate": 3.800559311000575e-05,
"loss": 0.17,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1598929464817047,
"step": 1010,
"valid_targets_mean": 5066.7,
"valid_targets_min": 570
},
{
"epoch": 1.6136724960254372,
"grad_norm": 0.43289861621038134,
"learning_rate": 3.7970934451545104e-05,
"loss": 0.1925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1886836290359497,
"step": 1015,
"valid_targets_mean": 4769.2,
"valid_targets_min": 651
},
{
"epoch": 1.6216216216216215,
"grad_norm": 0.45330830989766385,
"learning_rate": 3.7935993317508455e-05,
"loss": 0.1924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18560412526130676,
"step": 1020,
"valid_targets_mean": 4132.1,
"valid_targets_min": 622
},
{
"epoch": 1.629570747217806,
"grad_norm": 0.515537997297837,
"learning_rate": 3.790077025711694e-05,
"loss": 0.1839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21635811030864716,
"step": 1025,
"valid_targets_mean": 3410.8,
"valid_targets_min": 233
},
{
"epoch": 1.6375198728139906,
"grad_norm": 0.4946566085078078,
"learning_rate": 3.786526582402313e-05,
"loss": 0.1835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17097623646259308,
"step": 1030,
"valid_targets_mean": 3390.3,
"valid_targets_min": 649
},
{
"epoch": 1.645468998410175,
"grad_norm": 0.4669861404848048,
"learning_rate": 3.782948057630236e-05,
"loss": 0.1712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19812054932117462,
"step": 1035,
"valid_targets_mean": 3441.6,
"valid_targets_min": 624
},
{
"epoch": 1.6534181240063592,
"grad_norm": 0.4939545083568682,
"learning_rate": 3.779341507644394e-05,
"loss": 0.2019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17919695377349854,
"step": 1040,
"valid_targets_mean": 3929.4,
"valid_targets_min": 302
},
{
"epoch": 1.6613672496025438,
"grad_norm": 0.540991144768767,
"learning_rate": 3.775706989134231e-05,
"loss": 0.1857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20103199779987335,
"step": 1045,
"valid_targets_mean": 3738.6,
"valid_targets_min": 709
},
{
"epoch": 1.669316375198728,
"grad_norm": 0.4963684293040473,
"learning_rate": 3.772044559228813e-05,
"loss": 0.1882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19030243158340454,
"step": 1050,
"valid_targets_mean": 3166.8,
"valid_targets_min": 252
},
{
"epoch": 1.6772655007949124,
"grad_norm": 0.501401895351916,
"learning_rate": 3.768354275495933e-05,
"loss": 0.1821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1745380461215973,
"step": 1055,
"valid_targets_mean": 3242.2,
"valid_targets_min": 285
},
{
"epoch": 1.685214626391097,
"grad_norm": 0.4968401136342654,
"learning_rate": 3.764636195941198e-05,
"loss": 0.1831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17797568440437317,
"step": 1060,
"valid_targets_mean": 3188.0,
"valid_targets_min": 262
},
{
"epoch": 1.6931637519872815,
"grad_norm": 0.4884093983436614,
"learning_rate": 3.760890379007129e-05,
"loss": 0.1837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2129162847995758,
"step": 1065,
"valid_targets_mean": 4418.9,
"valid_targets_min": 523
},
{
"epoch": 1.7011128775834659,
"grad_norm": 0.44076053571984003,
"learning_rate": 3.757116883572232e-05,
"loss": 0.1764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1850593388080597,
"step": 1070,
"valid_targets_mean": 4093.6,
"valid_targets_min": 821
},
{
"epoch": 1.7090620031796502,
"grad_norm": 0.542297894741752,
"learning_rate": 3.753315768950079e-05,
"loss": 0.1819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21836097538471222,
"step": 1075,
"valid_targets_mean": 3133.3,
"valid_targets_min": 204
},
{
"epoch": 1.7170111287758347,
"grad_norm": 0.5168670041375298,
"learning_rate": 3.74948709488837e-05,
"loss": 0.1778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18428263068199158,
"step": 1080,
"valid_targets_mean": 3062.6,
"valid_targets_min": 606
},
{
"epoch": 1.724960254372019,
"grad_norm": 0.5653952426228848,
"learning_rate": 3.745630921568004e-05,
"loss": 0.1837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17465798556804657,
"step": 1085,
"valid_targets_mean": 2868.4,
"valid_targets_min": 273
},
{
"epoch": 1.7329093799682034,
"grad_norm": 0.46856535469042454,
"learning_rate": 3.741747309602117e-05,
"loss": 0.2027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20139528810977936,
"step": 1090,
"valid_targets_mean": 4477.7,
"valid_targets_min": 212
},
{
"epoch": 1.740858505564388,
"grad_norm": 0.41928118910953777,
"learning_rate": 3.737836320035146e-05,
"loss": 0.1773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18881118297576904,
"step": 1095,
"valid_targets_mean": 4088.9,
"valid_targets_min": 1217
},
{
"epoch": 1.7488076311605725,
"grad_norm": 0.4251393076302139,
"learning_rate": 3.733898014341858e-05,
"loss": 0.1914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18259574472904205,
"step": 1100,
"valid_targets_mean": 4110.7,
"valid_targets_min": 294
},
{
"epoch": 1.7567567567567568,
"grad_norm": 0.3931735507262585,
"learning_rate": 3.729932454426391e-05,
"loss": 0.1948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18538832664489746,
"step": 1105,
"valid_targets_mean": 5117.2,
"valid_targets_min": 1011
},
{
"epoch": 1.7647058823529411,
"grad_norm": 0.4529514349775154,
"learning_rate": 3.725939702621273e-05,
"loss": 0.1903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18618038296699524,
"step": 1110,
"valid_targets_mean": 4018.2,
"valid_targets_min": 607
},
{
"epoch": 1.7726550079491257,
"grad_norm": 0.4503816594471195,
"learning_rate": 3.72191982168645e-05,
"loss": 0.1998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15615426003932953,
"step": 1115,
"valid_targets_mean": 3476.6,
"valid_targets_min": 679
},
{
"epoch": 1.78060413354531,
"grad_norm": 0.5088702362995737,
"learning_rate": 3.717872874808298e-05,
"loss": 0.1802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21099695563316345,
"step": 1120,
"valid_targets_mean": 3103.6,
"valid_targets_min": 637
},
{
"epoch": 1.7885532591414943,
"grad_norm": 0.7999181539319212,
"learning_rate": 3.713798925598623e-05,
"loss": 0.1929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19236738979816437,
"step": 1125,
"valid_targets_mean": 3830.4,
"valid_targets_min": 612
},
{
"epoch": 1.7965023847376789,
"grad_norm": 0.4307921702238077,
"learning_rate": 3.709698038093671e-05,
"loss": 0.1915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16169005632400513,
"step": 1130,
"valid_targets_mean": 3835.4,
"valid_targets_min": 1344
},
{
"epoch": 1.8044515103338634,
"grad_norm": 0.485741913256061,
"learning_rate": 3.705570276753116e-05,
"loss": 0.1851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18286767601966858,
"step": 1135,
"valid_targets_mean": 3094.0,
"valid_targets_min": 270
},
{
"epoch": 1.8124006359300477,
"grad_norm": 0.5255452896790747,
"learning_rate": 3.701415706459044e-05,
"loss": 0.1662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19145852327346802,
"step": 1140,
"valid_targets_mean": 3693.2,
"valid_targets_min": 555
},
{
"epoch": 1.820349761526232,
"grad_norm": 0.5046926635208234,
"learning_rate": 3.697234392514942e-05,
"loss": 0.1803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2077309787273407,
"step": 1145,
"valid_targets_mean": 3055.6,
"valid_targets_min": 607
},
{
"epoch": 1.8282988871224166,
"grad_norm": 0.4368221113650411,
"learning_rate": 3.693026400644662e-05,
"loss": 0.1795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18555589020252228,
"step": 1150,
"valid_targets_mean": 4117.4,
"valid_targets_min": 279
},
{
"epoch": 1.836248012718601,
"grad_norm": 0.4836963066254356,
"learning_rate": 3.6887917969913944e-05,
"loss": 0.2034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2165643572807312,
"step": 1155,
"valid_targets_mean": 3562.9,
"valid_targets_min": 525
},
{
"epoch": 1.8441971383147853,
"grad_norm": 0.4084280506680083,
"learning_rate": 3.684530648116625e-05,
"loss": 0.1801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17716243863105774,
"step": 1160,
"valid_targets_mean": 4411.1,
"valid_targets_min": 245
},
{
"epoch": 1.8521462639109698,
"grad_norm": 0.44584904009558374,
"learning_rate": 3.68024302099909e-05,
"loss": 0.1894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19152897596359253,
"step": 1165,
"valid_targets_mean": 3953.6,
"valid_targets_min": 450
},
{
"epoch": 1.8600953895071544,
"grad_norm": 0.5649727314954088,
"learning_rate": 3.6759289830337246e-05,
"loss": 0.1871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1756046712398529,
"step": 1170,
"valid_targets_mean": 4100.8,
"valid_targets_min": 1298
},
{
"epoch": 1.8680445151033387,
"grad_norm": 0.49736684064600023,
"learning_rate": 3.6715886020306e-05,
"loss": 0.1743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16673019528388977,
"step": 1175,
"valid_targets_mean": 3085.4,
"valid_targets_min": 551
},
{
"epoch": 1.875993640699523,
"grad_norm": 0.45789796811072,
"learning_rate": 3.6672219462138604e-05,
"loss": 0.1767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1682954877614975,
"step": 1180,
"valid_targets_mean": 4273.3,
"valid_targets_min": 299
},
{
"epoch": 1.8839427662957076,
"grad_norm": 0.4895932235353001,
"learning_rate": 3.6628290842206495e-05,
"loss": 0.1954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19178809225559235,
"step": 1185,
"valid_targets_mean": 3406.9,
"valid_targets_min": 611
},
{
"epoch": 1.8918918918918919,
"grad_norm": 0.45298370929710946,
"learning_rate": 3.658410085100034e-05,
"loss": 0.1898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21535128355026245,
"step": 1190,
"valid_targets_mean": 4193.9,
"valid_targets_min": 1461
},
{
"epoch": 1.8998410174880762,
"grad_norm": 0.44589909041567644,
"learning_rate": 3.6539650183119126e-05,
"loss": 0.181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18020093441009521,
"step": 1195,
"valid_targets_mean": 3717.2,
"valid_targets_min": 651
},
{
"epoch": 1.9077901430842608,
"grad_norm": 0.3600027728462642,
"learning_rate": 3.64949395372593e-05,
"loss": 0.1823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17888964712619781,
"step": 1200,
"valid_targets_mean": 5276.8,
"valid_targets_min": 1291
},
{
"epoch": 1.9157392686804453,
"grad_norm": 0.4993758462348809,
"learning_rate": 3.644996961620378e-05,
"loss": 0.1838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17506229877471924,
"step": 1205,
"valid_targets_mean": 3077.0,
"valid_targets_min": 279
},
{
"epoch": 1.9236883942766294,
"grad_norm": 0.5207237968380335,
"learning_rate": 3.6404741126810854e-05,
"loss": 0.1777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18324558436870575,
"step": 1210,
"valid_targets_mean": 3340.1,
"valid_targets_min": 465
},
{
"epoch": 1.931637519872814,
"grad_norm": 0.5043242801398989,
"learning_rate": 3.635925478000315e-05,
"loss": 0.1955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19553515315055847,
"step": 1215,
"valid_targets_mean": 3118.6,
"valid_targets_min": 625
},
{
"epoch": 1.9395866454689985,
"grad_norm": 0.3968462413963593,
"learning_rate": 3.631351129075638e-05,
"loss": 0.1762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19829094409942627,
"step": 1220,
"valid_targets_mean": 4999.4,
"valid_targets_min": 1898
},
{
"epoch": 1.9475357710651828,
"grad_norm": 0.5208428823666412,
"learning_rate": 3.6267511378088174e-05,
"loss": 0.1718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18420946598052979,
"step": 1225,
"valid_targets_mean": 4461.8,
"valid_targets_min": 735
},
{
"epoch": 1.9554848966613672,
"grad_norm": 0.531760446350055,
"learning_rate": 3.622125576504674e-05,
"loss": 0.1776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2018202245235443,
"step": 1230,
"valid_targets_mean": 2726.6,
"valid_targets_min": 257
},
{
"epoch": 1.9634340222575517,
"grad_norm": 0.5155602824722777,
"learning_rate": 3.6174745178699484e-05,
"loss": 0.1745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20093253254890442,
"step": 1235,
"valid_targets_mean": 2971.2,
"valid_targets_min": 542
},
{
"epoch": 1.9713831478537363,
"grad_norm": 0.48459979840868433,
"learning_rate": 3.612798035012161e-05,
"loss": 0.1876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17393648624420166,
"step": 1240,
"valid_targets_mean": 3234.2,
"valid_targets_min": 269
},
{
"epoch": 1.9793322734499204,
"grad_norm": 0.4476136626874852,
"learning_rate": 3.608096201438465e-05,
"loss": 0.1969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17231547832489014,
"step": 1245,
"valid_targets_mean": 3629.6,
"valid_targets_min": 559
},
{
"epoch": 1.987281399046105,
"grad_norm": 0.430623482890761,
"learning_rate": 3.603369091054484e-05,
"loss": 0.195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1765379011631012,
"step": 1250,
"valid_targets_mean": 3597.4,
"valid_targets_min": 1075
},
{
"epoch": 1.9952305246422894,
"grad_norm": 0.436331980026303,
"learning_rate": 3.5986167781631556e-05,
"loss": 0.1838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1572694480419159,
"step": 1255,
"valid_targets_mean": 4041.3,
"valid_targets_min": 300
},
{
"epoch": 2.0031796502384736,
"grad_norm": 0.43495258070360787,
"learning_rate": 3.5938393374635634e-05,
"loss": 0.1868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17657440900802612,
"step": 1260,
"valid_targets_mean": 3687.1,
"valid_targets_min": 768
},
{
"epoch": 2.011128775834658,
"grad_norm": 0.44734489727626625,
"learning_rate": 3.589036844049762e-05,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16207647323608398,
"step": 1265,
"valid_targets_mean": 3986.1,
"valid_targets_min": 524
},
{
"epoch": 2.0190779014308426,
"grad_norm": 0.46524088697899335,
"learning_rate": 3.584209373409593e-05,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16202375292778015,
"step": 1270,
"valid_targets_mean": 3613.5,
"valid_targets_min": 670
},
{
"epoch": 2.027027027027027,
"grad_norm": 0.45070406893947157,
"learning_rate": 3.579357001423505e-05,
"loss": 0.1664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17059147357940674,
"step": 1275,
"valid_targets_mean": 3577.6,
"valid_targets_min": 665
},
{
"epoch": 2.0349761526232113,
"grad_norm": 0.4499960165350608,
"learning_rate": 3.5744798043633566e-05,
"loss": 0.1668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18004930019378662,
"step": 1280,
"valid_targets_mean": 4093.8,
"valid_targets_min": 566
},
{
"epoch": 2.042925278219396,
"grad_norm": 0.5580419519655596,
"learning_rate": 3.569577858891219e-05,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1862042248249054,
"step": 1285,
"valid_targets_mean": 2967.2,
"valid_targets_min": 673
},
{
"epoch": 2.0508744038155804,
"grad_norm": 0.4779943776711724,
"learning_rate": 3.56465124205817e-05,
"loss": 0.1714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22631016373634338,
"step": 1290,
"valid_targets_mean": 3858.1,
"valid_targets_min": 590
},
{
"epoch": 2.0588235294117645,
"grad_norm": 0.4911452381940732,
"learning_rate": 3.559700031303082e-05,
"loss": 0.1865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16386955976486206,
"step": 1295,
"valid_targets_mean": 3233.1,
"valid_targets_min": 294
},
{
"epoch": 2.066772655007949,
"grad_norm": 0.5288525437496359,
"learning_rate": 3.554724304451411e-05,
"loss": 0.1752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1542258858680725,
"step": 1300,
"valid_targets_mean": 3689.6,
"valid_targets_min": 710
},
{
"epoch": 2.0747217806041336,
"grad_norm": 0.6612223596945518,
"learning_rate": 3.549724139713962e-05,
"loss": 0.1651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17203554511070251,
"step": 1305,
"valid_targets_mean": 3336.7,
"valid_targets_min": 294
},
{
"epoch": 2.082670906200318,
"grad_norm": 0.4373776224124723,
"learning_rate": 3.544699615685671e-05,
"loss": 0.1637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14887259900569916,
"step": 1310,
"valid_targets_mean": 4026.8,
"valid_targets_min": 755
},
{
"epoch": 2.0906200317965022,
"grad_norm": 0.5037762968017296,
"learning_rate": 3.539650811344363e-05,
"loss": 0.1716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1626054346561432,
"step": 1315,
"valid_targets_mean": 3763.6,
"valid_targets_min": 258
},
{
"epoch": 2.098569157392687,
"grad_norm": 0.6313496812038843,
"learning_rate": 3.534577806049512e-05,
"loss": 0.1826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15829899907112122,
"step": 1320,
"valid_targets_mean": 3636.2,
"valid_targets_min": 682
},
{
"epoch": 2.1065182829888713,
"grad_norm": 0.4425905414584769,
"learning_rate": 3.529480679540996e-05,
"loss": 0.1656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15318667888641357,
"step": 1325,
"valid_targets_mean": 4196.6,
"valid_targets_min": 583
},
{
"epoch": 2.1144674085850554,
"grad_norm": 0.6185724943267303,
"learning_rate": 3.524359511937838e-05,
"loss": 0.1786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16072843968868256,
"step": 1330,
"valid_targets_mean": 2547.9,
"valid_targets_min": 263
},
{
"epoch": 2.12241653418124,
"grad_norm": 0.48298978637493106,
"learning_rate": 3.5192143837369523e-05,
"loss": 0.1727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19100898504257202,
"step": 1335,
"valid_targets_mean": 3434.8,
"valid_targets_min": 296
},
{
"epoch": 2.1303656597774245,
"grad_norm": 0.5247741664837559,
"learning_rate": 3.514045375811878e-05,
"loss": 0.18,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16440363228321075,
"step": 1340,
"valid_targets_mean": 2886.7,
"valid_targets_min": 201
},
{
"epoch": 2.138314785373609,
"grad_norm": 0.4645350321366234,
"learning_rate": 3.508852569411506e-05,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16781508922576904,
"step": 1345,
"valid_targets_mean": 3687.1,
"valid_targets_min": 1028
},
{
"epoch": 2.146263910969793,
"grad_norm": 0.4185673015572621,
"learning_rate": 3.503636046158803e-05,
"loss": 0.1605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15546417236328125,
"step": 1350,
"valid_targets_mean": 4516.6,
"valid_targets_min": 876
},
{
"epoch": 2.1542130365659777,
"grad_norm": 0.49044816100084626,
"learning_rate": 3.498395888049526e-05,
"loss": 0.1865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19985926151275635,
"step": 1355,
"valid_targets_mean": 3536.6,
"valid_targets_min": 636
},
{
"epoch": 2.1621621621621623,
"grad_norm": 0.4570482087101892,
"learning_rate": 3.4931321774509396e-05,
"loss": 0.1658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15912221372127533,
"step": 1360,
"valid_targets_mean": 3607.9,
"valid_targets_min": 299
},
{
"epoch": 2.1701112877583464,
"grad_norm": 0.4292180835767507,
"learning_rate": 3.487844997100515e-05,
"loss": 0.1691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19553008675575256,
"step": 1365,
"valid_targets_mean": 4204.5,
"valid_targets_min": 307
},
{
"epoch": 2.178060413354531,
"grad_norm": 0.524906614575372,
"learning_rate": 3.482534430104633e-05,
"loss": 0.1585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.174746572971344,
"step": 1370,
"valid_targets_mean": 3015.8,
"valid_targets_min": 324
},
{
"epoch": 2.1860095389507155,
"grad_norm": 0.460503992627472,
"learning_rate": 3.4772005599372764e-05,
"loss": 0.1667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17967626452445984,
"step": 1375,
"valid_targets_mean": 3896.6,
"valid_targets_min": 821
},
{
"epoch": 2.1939586645469,
"grad_norm": 0.44690523777838326,
"learning_rate": 3.4718434704387174e-05,
"loss": 0.1606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1710180938243866,
"step": 1380,
"valid_targets_mean": 4478.8,
"valid_targets_min": 1388
},
{
"epoch": 2.201907790143084,
"grad_norm": 0.41765151372647924,
"learning_rate": 3.4664632458142016e-05,
"loss": 0.1638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15442225337028503,
"step": 1385,
"valid_targets_mean": 4279.1,
"valid_targets_min": 559
},
{
"epoch": 2.2098569157392687,
"grad_norm": 0.434025285839872,
"learning_rate": 3.461059970632622e-05,
"loss": 0.1681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14256054162979126,
"step": 1390,
"valid_targets_mean": 3645.9,
"valid_targets_min": 682
},
{
"epoch": 2.2178060413354532,
"grad_norm": 0.39810648920310915,
"learning_rate": 3.4556337298251943e-05,
"loss": 0.174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14162832498550415,
"step": 1395,
"valid_targets_mean": 4033.1,
"valid_targets_min": 253
},
{
"epoch": 2.2257551669316373,
"grad_norm": 0.5481937999092757,
"learning_rate": 3.450184608684114e-05,
"loss": 0.1687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1893032193183899,
"step": 1400,
"valid_targets_mean": 2773.9,
"valid_targets_min": 637
},
{
"epoch": 2.233704292527822,
"grad_norm": 0.43591132617223516,
"learning_rate": 3.444712692861224e-05,
"loss": 0.1546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12860910594463348,
"step": 1405,
"valid_targets_mean": 3698.6,
"valid_targets_min": 891
},
{
"epoch": 2.2416534181240064,
"grad_norm": 0.43573783141415084,
"learning_rate": 3.439218068366663e-05,
"loss": 0.1613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1642727553844452,
"step": 1410,
"valid_targets_mean": 3836.3,
"valid_targets_min": 608
},
{
"epoch": 2.249602543720191,
"grad_norm": 0.4326278702113856,
"learning_rate": 3.433700821567516e-05,
"loss": 0.1661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14071246981620789,
"step": 1415,
"valid_targets_mean": 4719.1,
"valid_targets_min": 244
},
{
"epoch": 2.257551669316375,
"grad_norm": 0.5549303616093954,
"learning_rate": 3.428161039186456e-05,
"loss": 0.1737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18680042028427124,
"step": 1420,
"valid_targets_mean": 3738.0,
"valid_targets_min": 327
},
{
"epoch": 2.2655007949125596,
"grad_norm": 0.8319518010193951,
"learning_rate": 3.42259880830038e-05,
"loss": 0.1682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17515277862548828,
"step": 1425,
"valid_targets_mean": 3830.8,
"valid_targets_min": 859
},
{
"epoch": 2.273449920508744,
"grad_norm": 0.4319372849950979,
"learning_rate": 3.417014216339043e-05,
"loss": 0.181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18945015966892242,
"step": 1430,
"valid_targets_mean": 4180.6,
"valid_targets_min": 568
},
{
"epoch": 2.2813990461049283,
"grad_norm": 0.4645369639888501,
"learning_rate": 3.4114073510836794e-05,
"loss": 0.1854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17300865054130554,
"step": 1435,
"valid_targets_mean": 3716.4,
"valid_targets_min": 1337
},
{
"epoch": 2.289348171701113,
"grad_norm": 0.4624581509651132,
"learning_rate": 3.4057783006656274e-05,
"loss": 0.156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1803177446126938,
"step": 1440,
"valid_targets_mean": 3995.3,
"valid_targets_min": 609
},
{
"epoch": 2.2972972972972974,
"grad_norm": 0.3990685274728258,
"learning_rate": 3.400127153564941e-05,
"loss": 0.1632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1542663425207138,
"step": 1445,
"valid_targets_mean": 4452.5,
"valid_targets_min": 1190
},
{
"epoch": 2.3052464228934815,
"grad_norm": 0.6187952481541217,
"learning_rate": 3.394453998609001e-05,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18409979343414307,
"step": 1450,
"valid_targets_mean": 2894.1,
"valid_targets_min": 281
},
{
"epoch": 2.313195548489666,
"grad_norm": 0.49894187881909596,
"learning_rate": 3.388758924971117e-05,
"loss": 0.1743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18296250700950623,
"step": 1455,
"valid_targets_mean": 3416.9,
"valid_targets_min": 703
},
{
"epoch": 2.3211446740858506,
"grad_norm": 0.5357473334854262,
"learning_rate": 3.3830420221691286e-05,
"loss": 0.1803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18557733297348022,
"step": 1460,
"valid_targets_mean": 3307.2,
"valid_targets_min": 591
},
{
"epoch": 2.329093799682035,
"grad_norm": 0.3962622061174984,
"learning_rate": 3.377303380063995e-05,
"loss": 0.1686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14266249537467957,
"step": 1465,
"valid_targets_mean": 4369.6,
"valid_targets_min": 1371
},
{
"epoch": 2.337042925278219,
"grad_norm": 0.3785010810778657,
"learning_rate": 3.371543088858384e-05,
"loss": 0.1587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16492611169815063,
"step": 1470,
"valid_targets_mean": 5120.1,
"valid_targets_min": 621
},
{
"epoch": 2.3449920508744038,
"grad_norm": 0.48881533304790475,
"learning_rate": 3.365761239095253e-05,
"loss": 0.167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16915087401866913,
"step": 1475,
"valid_targets_mean": 3925.3,
"valid_targets_min": 576
},
{
"epoch": 2.3529411764705883,
"grad_norm": 0.48720287373725557,
"learning_rate": 3.3599579216564314e-05,
"loss": 0.1604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17547118663787842,
"step": 1480,
"valid_targets_mean": 3980.4,
"valid_targets_min": 706
},
{
"epoch": 2.360890302066773,
"grad_norm": 0.5303350453029894,
"learning_rate": 3.354133227761181e-05,
"loss": 0.1731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.172575443983078,
"step": 1485,
"valid_targets_mean": 4342.2,
"valid_targets_min": 1065
},
{
"epoch": 2.368839427662957,
"grad_norm": 0.5948787016804042,
"learning_rate": 3.3482872489647745e-05,
"loss": 0.1635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16050350666046143,
"step": 1490,
"valid_targets_mean": 4073.2,
"valid_targets_min": 279
},
{
"epoch": 2.3767885532591415,
"grad_norm": 0.4793825142162827,
"learning_rate": 3.342420077157047e-05,
"loss": 0.1839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1763351708650589,
"step": 1495,
"valid_targets_mean": 3483.2,
"valid_targets_min": 643
},
{
"epoch": 2.384737678855326,
"grad_norm": 0.4530776431878804,
"learning_rate": 3.336531804560957e-05,
"loss": 0.1526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14177027344703674,
"step": 1500,
"valid_targets_mean": 3812.7,
"valid_targets_min": 600
},
{
"epoch": 2.39268680445151,
"grad_norm": 0.48697483476860215,
"learning_rate": 3.330622523731136e-05,
"loss": 0.1662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15083934366703033,
"step": 1505,
"valid_targets_mean": 2873.0,
"valid_targets_min": 224
},
{
"epoch": 2.4006359300476947,
"grad_norm": 0.49665518829864685,
"learning_rate": 3.32469232755243e-05,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1856893002986908,
"step": 1510,
"valid_targets_mean": 3365.2,
"valid_targets_min": 904
},
{
"epoch": 2.4085850556438793,
"grad_norm": 0.45662940616841696,
"learning_rate": 3.318741309238444e-05,
"loss": 0.1697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18095698952674866,
"step": 1515,
"valid_targets_mean": 3817.8,
"valid_targets_min": 671
},
{
"epoch": 2.4165341812400634,
"grad_norm": 0.4040458879915397,
"learning_rate": 3.312769562330075e-05,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1404886543750763,
"step": 1520,
"valid_targets_mean": 4547.6,
"valid_targets_min": 1168
},
{
"epoch": 2.424483306836248,
"grad_norm": 0.4028349948778861,
"learning_rate": 3.306777180694042e-05,
"loss": 0.1697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15197904407978058,
"step": 1525,
"valid_targets_mean": 4536.2,
"valid_targets_min": 731
},
{
"epoch": 2.4324324324324325,
"grad_norm": 0.488660600681927,
"learning_rate": 3.30076425852141e-05,
"loss": 0.1594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18501275777816772,
"step": 1530,
"valid_targets_mean": 3903.4,
"valid_targets_min": 519
},
{
"epoch": 2.440381558028617,
"grad_norm": 0.4360649019785482,
"learning_rate": 3.294730890326109e-05,
"loss": 0.168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14416208863258362,
"step": 1535,
"valid_targets_mean": 3269.1,
"valid_targets_min": 718
},
{
"epoch": 2.448330683624801,
"grad_norm": 0.3987623937481391,
"learning_rate": 3.2886771709434504e-05,
"loss": 0.1559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1603170931339264,
"step": 1540,
"valid_targets_mean": 4707.6,
"valid_targets_min": 1348
},
{
"epoch": 2.4562798092209857,
"grad_norm": 0.5797017322011377,
"learning_rate": 3.282603195528635e-05,
"loss": 0.1523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17639771103858948,
"step": 1545,
"valid_targets_mean": 3203.8,
"valid_targets_min": 568
},
{
"epoch": 2.46422893481717,
"grad_norm": 0.44881682454570193,
"learning_rate": 3.276509059555257e-05,
"loss": 0.1704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15224912762641907,
"step": 1550,
"valid_targets_mean": 4156.8,
"valid_targets_min": 551
},
{
"epoch": 2.4721780604133547,
"grad_norm": 0.4299523456790547,
"learning_rate": 3.270394858813802e-05,
"loss": 0.1693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2051280438899994,
"step": 1555,
"valid_targets_mean": 4095.7,
"valid_targets_min": 621
},
{
"epoch": 2.480127186009539,
"grad_norm": 0.46068757123222875,
"learning_rate": 3.264260689410147e-05,
"loss": 0.1661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15283241868019104,
"step": 1560,
"valid_targets_mean": 3226.4,
"valid_targets_min": 912
},
{
"epoch": 2.4880763116057234,
"grad_norm": 0.47403025787042874,
"learning_rate": 3.2581066477640435e-05,
"loss": 0.1681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15874740481376648,
"step": 1565,
"valid_targets_mean": 3952.1,
"valid_targets_min": 872
},
{
"epoch": 2.496025437201908,
"grad_norm": 0.4626317047147037,
"learning_rate": 3.251932830607603e-05,
"loss": 0.1556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16611367464065552,
"step": 1570,
"valid_targets_mean": 3792.7,
"valid_targets_min": 450
},
{
"epoch": 2.503974562798092,
"grad_norm": 0.48592321395910304,
"learning_rate": 3.245739334983779e-05,
"loss": 0.1577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1791059672832489,
"step": 1575,
"valid_targets_mean": 3011.2,
"valid_targets_min": 305
},
{
"epoch": 2.5119236883942766,
"grad_norm": 0.48642110315097836,
"learning_rate": 3.239526258244842e-05,
"loss": 0.1622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18121963739395142,
"step": 1580,
"valid_targets_mean": 3705.4,
"valid_targets_min": 465
},
{
"epoch": 2.519872813990461,
"grad_norm": 0.4193245496234458,
"learning_rate": 3.233293698050845e-05,
"loss": 0.1638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15967342257499695,
"step": 1585,
"valid_targets_mean": 4023.4,
"valid_targets_min": 548
},
{
"epoch": 2.5278219395866453,
"grad_norm": 0.5640866498973993,
"learning_rate": 3.227041752368091e-05,
"loss": 0.165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17153598368167877,
"step": 1590,
"valid_targets_mean": 2566.8,
"valid_targets_min": 217
},
{
"epoch": 2.53577106518283,
"grad_norm": 0.41665001246607075,
"learning_rate": 3.220770519467597e-05,
"loss": 0.1653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1515938937664032,
"step": 1595,
"valid_targets_mean": 4122.9,
"valid_targets_min": 237
},
{
"epoch": 2.5437201907790143,
"grad_norm": 0.39614139545188226,
"learning_rate": 3.214480097923542e-05,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18220946192741394,
"step": 1600,
"valid_targets_mean": 5175.8,
"valid_targets_min": 705
},
{
"epoch": 2.551669316375199,
"grad_norm": 0.43229505102472626,
"learning_rate": 3.208170586611721e-05,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16309629380702972,
"step": 1605,
"valid_targets_mean": 3784.4,
"valid_targets_min": 584
},
{
"epoch": 2.559618441971383,
"grad_norm": 0.4243434467048783,
"learning_rate": 3.201842084707993e-05,
"loss": 0.1603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1563934087753296,
"step": 1610,
"valid_targets_mean": 4158.7,
"valid_targets_min": 578
},
{
"epoch": 2.5675675675675675,
"grad_norm": 0.43578064511427506,
"learning_rate": 3.195494691686718e-05,
"loss": 0.1736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18895184993743896,
"step": 1615,
"valid_targets_mean": 4406.8,
"valid_targets_min": 1521
},
{
"epoch": 2.575516693163752,
"grad_norm": 0.4519962457233152,
"learning_rate": 3.189128507319197e-05,
"loss": 0.1681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17107641696929932,
"step": 1620,
"valid_targets_mean": 3569.7,
"valid_targets_min": 534
},
{
"epoch": 2.5834658187599366,
"grad_norm": 0.5454247674899096,
"learning_rate": 3.182743631672102e-05,
"loss": 0.1639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17942318320274353,
"step": 1625,
"valid_targets_mean": 2771.4,
"valid_targets_min": 1372
},
{
"epoch": 2.5914149443561207,
"grad_norm": 0.4497356577426226,
"learning_rate": 3.1763401651059025e-05,
"loss": 0.1727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1738359034061432,
"step": 1630,
"valid_targets_mean": 3365.7,
"valid_targets_min": 911
},
{
"epoch": 2.5993640699523053,
"grad_norm": 0.7952703957802248,
"learning_rate": 3.1699182082732886e-05,
"loss": 0.1632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18283095955848694,
"step": 1635,
"valid_targets_mean": 2729.1,
"valid_targets_min": 249
},
{
"epoch": 2.60731319554849,
"grad_norm": 0.39447463509094877,
"learning_rate": 3.1634778621175905e-05,
"loss": 0.1552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14707916975021362,
"step": 1640,
"valid_targets_mean": 4424.3,
"valid_targets_min": 794
},
{
"epoch": 2.615262321144674,
"grad_norm": 0.5826754203242515,
"learning_rate": 3.157019227871189e-05,
"loss": 0.1583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18842703104019165,
"step": 1645,
"valid_targets_mean": 2496.5,
"valid_targets_min": 248
},
{
"epoch": 2.6232114467408585,
"grad_norm": 0.4569413845264777,
"learning_rate": 3.150542407053927e-05,
"loss": 0.1649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15572036802768707,
"step": 1650,
"valid_targets_mean": 3717.3,
"valid_targets_min": 206
},
{
"epoch": 2.631160572337043,
"grad_norm": 0.3769631110508782,
"learning_rate": 3.144047501471511e-05,
"loss": 0.1596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15287700295448303,
"step": 1655,
"valid_targets_mean": 4491.1,
"valid_targets_min": 623
},
{
"epoch": 2.639109697933227,
"grad_norm": 0.3834879165232079,
"learning_rate": 3.1375346132139135e-05,
"loss": 0.1736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14792010188102722,
"step": 1660,
"valid_targets_mean": 4377.1,
"valid_targets_min": 1297
},
{
"epoch": 2.6470588235294117,
"grad_norm": 0.40025749764942126,
"learning_rate": 3.131003844653766e-05,
"loss": 0.175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16569784283638,
"step": 1665,
"valid_targets_mean": 4147.7,
"valid_targets_min": 231
},
{
"epoch": 2.6550079491255962,
"grad_norm": 0.6151639522393043,
"learning_rate": 3.124455298444752e-05,
"loss": 0.1687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18059095740318298,
"step": 1670,
"valid_targets_mean": 3476.2,
"valid_targets_min": 205
},
{
"epoch": 2.6629570747217803,
"grad_norm": 0.4732700696731575,
"learning_rate": 3.1178890775199925e-05,
"loss": 0.169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1820976436138153,
"step": 1675,
"valid_targets_mean": 3768.2,
"valid_targets_min": 671
},
{
"epoch": 2.670906200317965,
"grad_norm": 0.44427708127372323,
"learning_rate": 3.1113052850904275e-05,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14810726046562195,
"step": 1680,
"valid_targets_mean": 3540.6,
"valid_targets_min": 546
},
{
"epoch": 2.6788553259141494,
"grad_norm": 0.47123009484821854,
"learning_rate": 3.1047040246431936e-05,
"loss": 0.1646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17077761888504028,
"step": 1685,
"valid_targets_mean": 3889.4,
"valid_targets_min": 269
},
{
"epoch": 2.686804451510334,
"grad_norm": 0.4318567795086639,
"learning_rate": 3.098085399939998e-05,
"loss": 0.167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1917814016342163,
"step": 1690,
"valid_targets_mean": 4599.8,
"valid_targets_min": 1239
},
{
"epoch": 2.6947535771065185,
"grad_norm": 0.4721685189025569,
"learning_rate": 3.091449515015489e-05,
"loss": 0.1698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17242677509784698,
"step": 1695,
"valid_targets_mean": 3185.9,
"valid_targets_min": 683
},
{
"epoch": 2.7027027027027026,
"grad_norm": 0.4250655218343069,
"learning_rate": 3.084796474175618e-05,
"loss": 0.167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1556561142206192,
"step": 1700,
"valid_targets_mean": 4078.5,
"valid_targets_min": 729
},
{
"epoch": 2.710651828298887,
"grad_norm": 0.4447639847156236,
"learning_rate": 3.078126381996001e-05,
"loss": 0.1565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15216678380966187,
"step": 1705,
"valid_targets_mean": 4152.2,
"valid_targets_min": 513
},
{
"epoch": 2.7186009538950717,
"grad_norm": 0.4579147243616527,
"learning_rate": 3.071439343320274e-05,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1592155396938324,
"step": 1710,
"valid_targets_mean": 3433.2,
"valid_targets_min": 593
},
{
"epoch": 2.726550079491256,
"grad_norm": 0.4407571500778382,
"learning_rate": 3.064735463258449e-05,
"loss": 0.1698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17721107602119446,
"step": 1715,
"valid_targets_mean": 4108.9,
"valid_targets_min": 240
},
{
"epoch": 2.7344992050874404,
"grad_norm": 0.40400452078934607,
"learning_rate": 3.0580148471852544e-05,
"loss": 0.1612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15850304067134857,
"step": 1720,
"valid_targets_mean": 4096.9,
"valid_targets_min": 727
},
{
"epoch": 2.742448330683625,
"grad_norm": 0.37213244183165023,
"learning_rate": 3.0512776007384882e-05,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14977069199085236,
"step": 1725,
"valid_targets_mean": 5645.9,
"valid_targets_min": 1122
},
{
"epoch": 2.750397456279809,
"grad_norm": 0.46209322559956156,
"learning_rate": 3.0445238298173492e-05,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1584990918636322,
"step": 1730,
"valid_targets_mean": 3129.1,
"valid_targets_min": 262
},
{
"epoch": 2.7583465818759936,
"grad_norm": 0.4385757383753134,
"learning_rate": 3.0377536405807753e-05,
"loss": 0.1614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1700027585029602,
"step": 1735,
"valid_targets_mean": 4126.4,
"valid_targets_min": 1038
},
{
"epoch": 2.766295707472178,
"grad_norm": 0.5770273602388422,
"learning_rate": 3.030967139445776e-05,
"loss": 0.163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1636781394481659,
"step": 1740,
"valid_targets_mean": 2366.4,
"valid_targets_min": 330
},
{
"epoch": 2.7742448330683622,
"grad_norm": 0.46564547279320734,
"learning_rate": 3.0241644330857604e-05,
"loss": 0.158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15485122799873352,
"step": 1745,
"valid_targets_mean": 3985.4,
"valid_targets_min": 614
},
{
"epoch": 2.7821939586645468,
"grad_norm": 0.47547498624328677,
"learning_rate": 3.0173456284288565e-05,
"loss": 0.1675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19546955823898315,
"step": 1750,
"valid_targets_mean": 4155.4,
"valid_targets_min": 492
},
{
"epoch": 2.7901430842607313,
"grad_norm": 0.5158856359689629,
"learning_rate": 3.010510832656233e-05,
"loss": 0.1525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.161908358335495,
"step": 1755,
"valid_targets_mean": 3625.6,
"valid_targets_min": 860
},
{
"epoch": 2.798092209856916,
"grad_norm": 0.4471113346837271,
"learning_rate": 3.0036601532004175e-05,
"loss": 0.1605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1580810248851776,
"step": 1760,
"valid_targets_mean": 3677.0,
"valid_targets_min": 413
},
{
"epoch": 2.8060413354531004,
"grad_norm": 0.4114471784729695,
"learning_rate": 2.996793697743601e-05,
"loss": 0.1736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1642129123210907,
"step": 1765,
"valid_targets_mean": 4178.1,
"valid_targets_min": 835
},
{
"epoch": 2.8139904610492845,
"grad_norm": 0.43668170542838514,
"learning_rate": 2.9899115742159512e-05,
"loss": 0.1751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16554221510887146,
"step": 1770,
"valid_targets_mean": 4644.9,
"valid_targets_min": 693
},
{
"epoch": 2.821939586645469,
"grad_norm": 0.5043488707813197,
"learning_rate": 2.9830138907939137e-05,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16675223410129547,
"step": 1775,
"valid_targets_mean": 3199.9,
"valid_targets_min": 304
},
{
"epoch": 2.8298887122416536,
"grad_norm": 0.39898904679988073,
"learning_rate": 2.976100755898511e-05,
"loss": 0.1586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16235503554344177,
"step": 1780,
"valid_targets_mean": 4958.9,
"valid_targets_min": 690
},
{
"epoch": 2.8378378378378377,
"grad_norm": 0.5087094254868092,
"learning_rate": 2.9691722781936398e-05,
"loss": 0.1638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16532549262046814,
"step": 1785,
"valid_targets_mean": 2913.4,
"valid_targets_min": 538
},
{
"epoch": 2.8457869634340223,
"grad_norm": 0.514390244173884,
"learning_rate": 2.962228566584362e-05,
"loss": 0.1911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18927565217018127,
"step": 1790,
"valid_targets_mean": 3447.2,
"valid_targets_min": 623
},
{
"epoch": 2.853736089030207,
"grad_norm": 0.4250826109776861,
"learning_rate": 2.9552697302151937e-05,
"loss": 0.1572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15817922353744507,
"step": 1795,
"valid_targets_mean": 4025.1,
"valid_targets_min": 779
},
{
"epoch": 2.861685214626391,
"grad_norm": 0.4104299314914552,
"learning_rate": 2.9482958784683883e-05,
"loss": 0.1668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1422051340341568,
"step": 1800,
"valid_targets_mean": 3494.4,
"valid_targets_min": 262
},
{
"epoch": 2.8696343402225755,
"grad_norm": 0.41440908629922096,
"learning_rate": 2.9413071209622174e-05,
"loss": 0.1661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14636817574501038,
"step": 1805,
"valid_targets_mean": 4556.1,
"valid_targets_min": 847
},
{
"epoch": 2.87758346581876,
"grad_norm": 0.48515765879460354,
"learning_rate": 2.934303567549251e-05,
"loss": 0.1705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1678956151008606,
"step": 1810,
"valid_targets_mean": 3278.6,
"valid_targets_min": 522
},
{
"epoch": 2.885532591414944,
"grad_norm": 0.514128862513967,
"learning_rate": 2.9272853283146255e-05,
"loss": 0.1739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16510531306266785,
"step": 1815,
"valid_targets_mean": 2977.9,
"valid_targets_min": 355
},
{
"epoch": 2.8934817170111287,
"grad_norm": 0.5493626194079975,
"learning_rate": 2.9202525135743158e-05,
"loss": 0.191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22584211826324463,
"step": 1820,
"valid_targets_mean": 2734.2,
"valid_targets_min": 686
},
{
"epoch": 2.901430842607313,
"grad_norm": 0.4370645426098783,
"learning_rate": 2.9132052338734033e-05,
"loss": 0.1589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16311654448509216,
"step": 1825,
"valid_targets_mean": 3748.9,
"valid_targets_min": 648
},
{
"epoch": 2.9093799682034978,
"grad_norm": 0.45957400888294386,
"learning_rate": 2.9061435999843354e-05,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15466034412384033,
"step": 1830,
"valid_targets_mean": 3323.8,
"valid_targets_min": 699
},
{
"epoch": 2.9173290937996823,
"grad_norm": 0.39548994984246866,
"learning_rate": 2.8990677229051855e-05,
"loss": 0.1451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1540757715702057,
"step": 1835,
"valid_targets_mean": 4090.8,
"valid_targets_min": 889
},
{
"epoch": 2.9252782193958664,
"grad_norm": 0.4905605606999161,
"learning_rate": 2.8919777138579074e-05,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16376616060733795,
"step": 1840,
"valid_targets_mean": 2992.8,
"valid_targets_min": 253
},
{
"epoch": 2.933227344992051,
"grad_norm": 0.39954714024700316,
"learning_rate": 2.8848736842865893e-05,
"loss": 0.168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13295181095600128,
"step": 1845,
"valid_targets_mean": 3622.3,
"valid_targets_min": 534
},
{
"epoch": 2.9411764705882355,
"grad_norm": 0.4109518903334489,
"learning_rate": 2.8777557458556993e-05,
"loss": 0.1554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15689434111118317,
"step": 1850,
"valid_targets_mean": 4599.6,
"valid_targets_min": 1357
},
{
"epoch": 2.9491255961844196,
"grad_norm": 0.4134036810952952,
"learning_rate": 2.870624010448332e-05,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16236630082130432,
"step": 1855,
"valid_targets_mean": 4970.9,
"valid_targets_min": 525
},
{
"epoch": 2.957074721780604,
"grad_norm": 0.44310700881675275,
"learning_rate": 2.8634785901644497e-05,
"loss": 0.174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18711400032043457,
"step": 1860,
"valid_targets_mean": 4005.5,
"valid_targets_min": 368
},
{
"epoch": 2.9650238473767887,
"grad_norm": 0.3717450015352577,
"learning_rate": 2.856319597319119e-05,
"loss": 0.1531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14527782797813416,
"step": 1865,
"valid_targets_mean": 4636.0,
"valid_targets_min": 834
},
{
"epoch": 2.972972972972973,
"grad_norm": 0.4489188113660503,
"learning_rate": 2.849147144440747e-05,
"loss": 0.1744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18267220258712769,
"step": 1870,
"valid_targets_mean": 3598.4,
"valid_targets_min": 272
},
{
"epoch": 2.9809220985691574,
"grad_norm": 0.463504579635663,
"learning_rate": 2.8419613442693127e-05,
"loss": 0.1825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16523773968219757,
"step": 1875,
"valid_targets_mean": 3690.0,
"valid_targets_min": 741
},
{
"epoch": 2.988871224165342,
"grad_norm": 0.42098915439827383,
"learning_rate": 2.834762309754593e-05,
"loss": 0.1758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15425992012023926,
"step": 1880,
"valid_targets_mean": 3851.8,
"valid_targets_min": 1123
},
{
"epoch": 2.996820349761526,
"grad_norm": 0.44087606889969083,
"learning_rate": 2.8275501540543877e-05,
"loss": 0.177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1857764720916748,
"step": 1885,
"valid_targets_mean": 4492.8,
"valid_targets_min": 303
},
{
"epoch": 3.0047694753577106,
"grad_norm": 0.40019519904714795,
"learning_rate": 2.8203249905327434e-05,
"loss": 0.1439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14805257320404053,
"step": 1890,
"valid_targets_mean": 4000.0,
"valid_targets_min": 622
},
{
"epoch": 3.012718600953895,
"grad_norm": 0.3925087002790559,
"learning_rate": 2.81308693275817e-05,
"loss": 0.1421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15407413244247437,
"step": 1895,
"valid_targets_mean": 5172.0,
"valid_targets_min": 717
},
{
"epoch": 3.0206677265500796,
"grad_norm": 0.46275383155041416,
"learning_rate": 2.8058360945018518e-05,
"loss": 0.1496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13890619575977325,
"step": 1900,
"valid_targets_mean": 4028.7,
"valid_targets_min": 560
},
{
"epoch": 3.0286168521462637,
"grad_norm": 0.4551559001740428,
"learning_rate": 2.7985725897358665e-05,
"loss": 0.1543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15436714887619019,
"step": 1905,
"valid_targets_mean": 3797.8,
"valid_targets_min": 565
},
{
"epoch": 3.0365659777424483,
"grad_norm": 0.4842383814763534,
"learning_rate": 2.791296532631389e-05,
"loss": 0.1553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14294975996017456,
"step": 1910,
"valid_targets_mean": 3047.1,
"valid_targets_min": 545
},
{
"epoch": 3.044515103338633,
"grad_norm": 0.5397174824822419,
"learning_rate": 2.7840080375568964e-05,
"loss": 0.1452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1518700122833252,
"step": 1915,
"valid_targets_mean": 3124.6,
"valid_targets_min": 650
},
{
"epoch": 3.0524642289348174,
"grad_norm": 0.5358906602930991,
"learning_rate": 2.7767072190763733e-05,
"loss": 0.1643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1446910947561264,
"step": 1920,
"valid_targets_mean": 2824.1,
"valid_targets_min": 538
},
{
"epoch": 3.0604133545310015,
"grad_norm": 0.40186405732354413,
"learning_rate": 2.7693941919475076e-05,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1320028454065323,
"step": 1925,
"valid_targets_mean": 4311.8,
"valid_targets_min": 1384
},
{
"epoch": 3.068362480127186,
"grad_norm": 0.5420721530535801,
"learning_rate": 2.7620690711198906e-05,
"loss": 0.1525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16763970255851746,
"step": 1930,
"valid_targets_mean": 3246.2,
"valid_targets_min": 678
},
{
"epoch": 3.0763116057233706,
"grad_norm": 0.46354880795162495,
"learning_rate": 2.7547319717332066e-05,
"loss": 0.1454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15304705500602722,
"step": 1935,
"valid_targets_mean": 3665.1,
"valid_targets_min": 304
},
{
"epoch": 3.0842607313195547,
"grad_norm": 0.4230495218281992,
"learning_rate": 2.7473830091154243e-05,
"loss": 0.1475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1243860200047493,
"step": 1940,
"valid_targets_mean": 3626.8,
"valid_targets_min": 568
},
{
"epoch": 3.0922098569157392,
"grad_norm": 0.4361635236789642,
"learning_rate": 2.7400222987809856e-05,
"loss": 0.1448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12188908457756042,
"step": 1945,
"valid_targets_mean": 4010.5,
"valid_targets_min": 498
},
{
"epoch": 3.100158982511924,
"grad_norm": 0.4439974035967091,
"learning_rate": 2.7326499564289867e-05,
"loss": 0.1494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13789242506027222,
"step": 1950,
"valid_targets_mean": 3711.9,
"valid_targets_min": 454
},
{
"epoch": 3.108108108108108,
"grad_norm": 0.41877176013375694,
"learning_rate": 2.725266097941363e-05,
"loss": 0.1395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1316269338130951,
"step": 1955,
"valid_targets_mean": 4314.9,
"valid_targets_min": 1299
},
{
"epoch": 3.1160572337042924,
"grad_norm": 0.527858481472521,
"learning_rate": 2.717870839381066e-05,
"loss": 0.1489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15569709241390228,
"step": 1960,
"valid_targets_mean": 3514.8,
"valid_targets_min": 949
},
{
"epoch": 3.124006359300477,
"grad_norm": 0.3850217928191781,
"learning_rate": 2.7104642969902357e-05,
"loss": 0.1367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1267361342906952,
"step": 1965,
"valid_targets_mean": 4886.9,
"valid_targets_min": 300
},
{
"epoch": 3.1319554848966615,
"grad_norm": 0.44634061646307166,
"learning_rate": 2.7030465871883812e-05,
"loss": 0.1478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15789856016635895,
"step": 1970,
"valid_targets_mean": 4405.6,
"valid_targets_min": 512
},
{
"epoch": 3.1399046104928456,
"grad_norm": 0.44800018132825026,
"learning_rate": 2.6956178265705434e-05,
"loss": 0.1458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1587265133857727,
"step": 1975,
"valid_targets_mean": 4086.9,
"valid_targets_min": 1071
},
{
"epoch": 3.14785373608903,
"grad_norm": 0.4616270378131397,
"learning_rate": 2.688178131905465e-05,
"loss": 0.1431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1500604748725891,
"step": 1980,
"valid_targets_mean": 3678.9,
"valid_targets_min": 683
},
{
"epoch": 3.1558028616852147,
"grad_norm": 0.5790165944659751,
"learning_rate": 2.680727620133757e-05,
"loss": 0.1504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15115083754062653,
"step": 1985,
"valid_targets_mean": 2691.0,
"valid_targets_min": 502
},
{
"epoch": 3.1637519872813993,
"grad_norm": 0.4845439722921149,
"learning_rate": 2.673266408366057e-05,
"loss": 0.1364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12436607480049133,
"step": 1990,
"valid_targets_mean": 3094.4,
"valid_targets_min": 299
},
{
"epoch": 3.1717011128775834,
"grad_norm": 0.49364688977299304,
"learning_rate": 2.6657946138811915e-05,
"loss": 0.1452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1511753499507904,
"step": 1995,
"valid_targets_mean": 3998.1,
"valid_targets_min": 781
},
{
"epoch": 3.179650238473768,
"grad_norm": 0.488321490398884,
"learning_rate": 2.6583123541243302e-05,
"loss": 0.1433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17050573229789734,
"step": 2000,
"valid_targets_mean": 3620.8,
"valid_targets_min": 248
},
{
"epoch": 3.1875993640699525,
"grad_norm": 0.40982555411387517,
"learning_rate": 2.6508197467051406e-05,
"loss": 0.1431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12908829748630524,
"step": 2005,
"valid_targets_mean": 4178.4,
"valid_targets_min": 1472
},
{
"epoch": 3.1955484896661366,
"grad_norm": 0.40055451862255126,
"learning_rate": 2.6433169093959405e-05,
"loss": 0.1441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14281156659126282,
"step": 2010,
"valid_targets_mean": 4660.8,
"valid_targets_min": 685
},
{
"epoch": 3.203497615262321,
"grad_norm": 0.46116477905857267,
"learning_rate": 2.6358039601298454e-05,
"loss": 0.1515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13968366384506226,
"step": 2015,
"valid_targets_mean": 3884.2,
"valid_targets_min": 344
},
{
"epoch": 3.2114467408585057,
"grad_norm": 0.43289954051552515,
"learning_rate": 2.6282810169989158e-05,
"loss": 0.1531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1596599519252777,
"step": 2020,
"valid_targets_mean": 4390.9,
"valid_targets_min": 254
},
{
"epoch": 3.21939586645469,
"grad_norm": 0.5078592423856673,
"learning_rate": 2.6207481982523e-05,
"loss": 0.1546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1573963314294815,
"step": 2025,
"valid_targets_mean": 3303.6,
"valid_targets_min": 1122
},
{
"epoch": 3.2273449920508743,
"grad_norm": 0.5091146694996267,
"learning_rate": 2.6132056222943757e-05,
"loss": 0.154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1862080991268158,
"step": 2030,
"valid_targets_mean": 3232.9,
"valid_targets_min": 481
},
{
"epoch": 3.235294117647059,
"grad_norm": 0.5238546808532447,
"learning_rate": 2.6056534076828883e-05,
"loss": 0.1576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18422989547252655,
"step": 2035,
"valid_targets_mean": 3585.9,
"valid_targets_min": 266
},
{
"epoch": 3.2432432432432434,
"grad_norm": 0.4363636469238868,
"learning_rate": 2.598091673127091e-05,
"loss": 0.1489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14309856295585632,
"step": 2040,
"valid_targets_mean": 3745.1,
"valid_targets_min": 921
},
{
"epoch": 3.2511923688394275,
"grad_norm": 0.4339103556613612,
"learning_rate": 2.5905205374858728e-05,
"loss": 0.1526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14386232197284698,
"step": 2045,
"valid_targets_mean": 4056.8,
"valid_targets_min": 1465
},
{
"epoch": 3.259141494435612,
"grad_norm": 0.42741463506623106,
"learning_rate": 2.5829401197658946e-05,
"loss": 0.1618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20502996444702148,
"step": 2050,
"valid_targets_mean": 5179.3,
"valid_targets_min": 1065
},
{
"epoch": 3.2670906200317966,
"grad_norm": 0.43626977002875506,
"learning_rate": 2.5753505391197173e-05,
"loss": 0.1436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.148350328207016,
"step": 2055,
"valid_targets_mean": 4743.6,
"valid_targets_min": 568
},
{
"epoch": 3.275039745627981,
"grad_norm": 0.46840087217117315,
"learning_rate": 2.5677519148439286e-05,
"loss": 0.1576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15138383209705353,
"step": 2060,
"valid_targets_mean": 3961.1,
"valid_targets_min": 243
},
{
"epoch": 3.2829888712241653,
"grad_norm": 0.507365313224075,
"learning_rate": 2.56014436637727e-05,
"loss": 0.1432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13263681530952454,
"step": 2065,
"valid_targets_mean": 2687.8,
"valid_targets_min": 251
},
{
"epoch": 3.29093799682035,
"grad_norm": 0.4749587295324443,
"learning_rate": 2.5525280132987544e-05,
"loss": 0.1503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13461729884147644,
"step": 2070,
"valid_targets_mean": 3908.1,
"valid_targets_min": 343
},
{
"epoch": 3.2988871224165344,
"grad_norm": 0.5571544935176302,
"learning_rate": 2.544902975325793e-05,
"loss": 0.1547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15287074446678162,
"step": 2075,
"valid_targets_mean": 2425.0,
"valid_targets_min": 205
},
{
"epoch": 3.3068362480127185,
"grad_norm": 0.45571560695399776,
"learning_rate": 2.5372693723123075e-05,
"loss": 0.1445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1337605118751526,
"step": 2080,
"valid_targets_mean": 3706.5,
"valid_targets_min": 448
},
{
"epoch": 3.314785373608903,
"grad_norm": 0.4841238396850524,
"learning_rate": 2.5296273242468514e-05,
"loss": 0.1432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13751645386219025,
"step": 2085,
"valid_targets_mean": 3224.1,
"valid_targets_min": 281
},
{
"epoch": 3.3227344992050876,
"grad_norm": 0.5882557810118016,
"learning_rate": 2.5219769512507202e-05,
"loss": 0.1449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15059013664722443,
"step": 2090,
"valid_targets_mean": 4222.4,
"valid_targets_min": 1837
},
{
"epoch": 3.3306836248012717,
"grad_norm": 0.4355529800792949,
"learning_rate": 2.5143183735760638e-05,
"loss": 0.1401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13719777762889862,
"step": 2095,
"valid_targets_mean": 5038.6,
"valid_targets_min": 692
},
{
"epoch": 3.338632750397456,
"grad_norm": 0.48366910917541367,
"learning_rate": 2.5066517116039978e-05,
"loss": 0.1484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14523795247077942,
"step": 2100,
"valid_targets_mean": 3369.9,
"valid_targets_min": 635
},
{
"epoch": 3.3465818759936408,
"grad_norm": 0.432180761274418,
"learning_rate": 2.4989770858427113e-05,
"loss": 0.1391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14896121621131897,
"step": 2105,
"valid_targets_mean": 4274.6,
"valid_targets_min": 1463
},
{
"epoch": 3.3545310015898253,
"grad_norm": 0.4673043662584066,
"learning_rate": 2.4912946169255722e-05,
"loss": 0.1482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14605014026165009,
"step": 2110,
"valid_targets_mean": 3783.2,
"valid_targets_min": 1054
},
{
"epoch": 3.3624801271860094,
"grad_norm": 0.4743882917216998,
"learning_rate": 2.4836044256092288e-05,
"loss": 0.151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1554591804742813,
"step": 2115,
"valid_targets_mean": 3935.7,
"valid_targets_min": 612
},
{
"epoch": 3.370429252782194,
"grad_norm": 0.4815307642109087,
"learning_rate": 2.475906632771714e-05,
"loss": 0.1478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14014503359794617,
"step": 2120,
"valid_targets_mean": 3164.2,
"valid_targets_min": 373
},
{
"epoch": 3.3783783783783785,
"grad_norm": 0.40589792615723674,
"learning_rate": 2.468201359410548e-05,
"loss": 0.1402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14491534233093262,
"step": 2125,
"valid_targets_mean": 4419.9,
"valid_targets_min": 340
},
{
"epoch": 3.3863275039745626,
"grad_norm": 0.44260667005600757,
"learning_rate": 2.4604887266408304e-05,
"loss": 0.1451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1457509994506836,
"step": 2130,
"valid_targets_mean": 4288.4,
"valid_targets_min": 637
},
{
"epoch": 3.394276629570747,
"grad_norm": 0.4581973653604292,
"learning_rate": 2.4527688556933402e-05,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15415199100971222,
"step": 2135,
"valid_targets_mean": 4045.8,
"valid_targets_min": 977
},
{
"epoch": 3.4022257551669317,
"grad_norm": 0.7140350335944461,
"learning_rate": 2.445041867912629e-05,
"loss": 0.1537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15349167585372925,
"step": 2140,
"valid_targets_mean": 2618.8,
"valid_targets_min": 673
},
{
"epoch": 3.4101748807631163,
"grad_norm": 0.5034625114730497,
"learning_rate": 2.4373078847551154e-05,
"loss": 0.1456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14303407073020935,
"step": 2145,
"valid_targets_mean": 3076.3,
"valid_targets_min": 675
},
{
"epoch": 3.4181240063593004,
"grad_norm": 0.48632708952047105,
"learning_rate": 2.4295670277871736e-05,
"loss": 0.1495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1465069055557251,
"step": 2150,
"valid_targets_mean": 3372.1,
"valid_targets_min": 705
},
{
"epoch": 3.426073131955485,
"grad_norm": 0.4937147781905013,
"learning_rate": 2.4218194186832237e-05,
"loss": 0.1492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17899924516677856,
"step": 2155,
"valid_targets_mean": 3543.7,
"valid_targets_min": 204
},
{
"epoch": 3.4340222575516695,
"grad_norm": 0.446614778026149,
"learning_rate": 2.4140651792238193e-05,
"loss": 0.1502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16787397861480713,
"step": 2160,
"valid_targets_mean": 4232.8,
"valid_targets_min": 1131
},
{
"epoch": 3.4419713831478536,
"grad_norm": 0.5049089497785076,
"learning_rate": 2.4063044312937332e-05,
"loss": 0.1635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1745222806930542,
"step": 2165,
"valid_targets_mean": 3461.6,
"valid_targets_min": 582
},
{
"epoch": 3.449920508744038,
"grad_norm": 0.41955260576113246,
"learning_rate": 2.3985372968800407e-05,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1277008205652237,
"step": 2170,
"valid_targets_mean": 3886.0,
"valid_targets_min": 548
},
{
"epoch": 3.4578696343402227,
"grad_norm": 0.44853544938510986,
"learning_rate": 2.3907638980702043e-05,
"loss": 0.1454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13143455982208252,
"step": 2175,
"valid_targets_mean": 2990.2,
"valid_targets_min": 695
},
{
"epoch": 3.4658187599364068,
"grad_norm": 0.5052915184377108,
"learning_rate": 2.382984357050151e-05,
"loss": 0.1592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1574200838804245,
"step": 2180,
"valid_targets_mean": 3370.8,
"valid_targets_min": 352
},
{
"epoch": 3.4737678855325913,
"grad_norm": 0.44259229283391566,
"learning_rate": 2.3751987961023545e-05,
"loss": 0.1378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13950997591018677,
"step": 2185,
"valid_targets_mean": 3953.6,
"valid_targets_min": 220
},
{
"epoch": 3.481717011128776,
"grad_norm": 0.48788565916051185,
"learning_rate": 2.3674073376039152e-05,
"loss": 0.1493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1728115677833557,
"step": 2190,
"valid_targets_mean": 3669.0,
"valid_targets_min": 671
},
{
"epoch": 3.4896661367249604,
"grad_norm": 0.4492760385555854,
"learning_rate": 2.359610104024631e-05,
"loss": 0.1581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15678560733795166,
"step": 2195,
"valid_targets_mean": 3583.8,
"valid_targets_min": 637
},
{
"epoch": 3.4976152623211445,
"grad_norm": 0.39986255476691307,
"learning_rate": 2.3518072179250753e-05,
"loss": 0.1462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14417177438735962,
"step": 2200,
"valid_targets_mean": 4219.2,
"valid_targets_min": 641
},
{
"epoch": 3.505564387917329,
"grad_norm": 0.384596360059307,
"learning_rate": 2.343998801954673e-05,
"loss": 0.1377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11725412309169769,
"step": 2205,
"valid_targets_mean": 4539.5,
"valid_targets_min": 1403
},
{
"epoch": 3.5135135135135136,
"grad_norm": 0.3726022277230603,
"learning_rate": 2.3361849788497666e-05,
"loss": 0.1467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12121937423944473,
"step": 2210,
"valid_targets_mean": 4714.5,
"valid_targets_min": 1012
},
{
"epoch": 3.521462639109698,
"grad_norm": 0.426941312289138,
"learning_rate": 2.3283658714316935e-05,
"loss": 0.1498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13825076818466187,
"step": 2215,
"valid_targets_mean": 4406.4,
"valid_targets_min": 559
},
{
"epoch": 3.5294117647058822,
"grad_norm": 0.4301504339821543,
"learning_rate": 2.320541602604851e-05,
"loss": 0.1424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13971027731895447,
"step": 2220,
"valid_targets_mean": 3877.9,
"valid_targets_min": 642
},
{
"epoch": 3.537360890302067,
"grad_norm": 0.5113573188300341,
"learning_rate": 2.3127122953547663e-05,
"loss": 0.15,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1780821532011032,
"step": 2225,
"valid_targets_mean": 3525.3,
"valid_targets_min": 738
},
{
"epoch": 3.5453100158982513,
"grad_norm": 0.5063219756936636,
"learning_rate": 2.3048780727461627e-05,
"loss": 0.1625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16249513626098633,
"step": 2230,
"valid_targets_mean": 3025.3,
"valid_targets_min": 627
},
{
"epoch": 3.5532591414944354,
"grad_norm": 0.4792775762459798,
"learning_rate": 2.2970390579210246e-05,
"loss": 0.1414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1491563469171524,
"step": 2235,
"valid_targets_mean": 3644.2,
"valid_targets_min": 568
},
{
"epoch": 3.56120826709062,
"grad_norm": 0.4620771758711201,
"learning_rate": 2.2891953740966643e-05,
"loss": 0.1509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16006189584732056,
"step": 2240,
"valid_targets_mean": 4079.1,
"valid_targets_min": 235
},
{
"epoch": 3.5691573926868045,
"grad_norm": 0.44785087939845997,
"learning_rate": 2.281347144563782e-05,
"loss": 0.1515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1455570012331009,
"step": 2245,
"valid_targets_mean": 4200.4,
"valid_targets_min": 562
},
{
"epoch": 3.5771065182829886,
"grad_norm": 0.5185565156273501,
"learning_rate": 2.273494492684531e-05,
"loss": 0.1497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16593654453754425,
"step": 2250,
"valid_targets_mean": 3104.9,
"valid_targets_min": 309
},
{
"epoch": 3.585055643879173,
"grad_norm": 0.4172228609919065,
"learning_rate": 2.265637541890577e-05,
"loss": 0.1484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1278490126132965,
"step": 2255,
"valid_targets_mean": 3515.1,
"valid_targets_min": 294
},
{
"epoch": 3.5930047694753577,
"grad_norm": 0.4286795679059123,
"learning_rate": 2.2577764156811563e-05,
"loss": 0.1455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14926648139953613,
"step": 2260,
"valid_targets_mean": 4430.3,
"valid_targets_min": 675
},
{
"epoch": 3.6009538950715423,
"grad_norm": 0.560172122368529,
"learning_rate": 2.2499112376211373e-05,
"loss": 0.1631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18510201573371887,
"step": 2265,
"valid_targets_mean": 3477.6,
"valid_targets_min": 794
},
{
"epoch": 3.6089030206677264,
"grad_norm": 0.43226594819787095,
"learning_rate": 2.2420421313390776e-05,
"loss": 0.1498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14725884795188904,
"step": 2270,
"valid_targets_mean": 4508.8,
"valid_targets_min": 1163
},
{
"epoch": 3.616852146263911,
"grad_norm": 0.4437643653037656,
"learning_rate": 2.234169220525282e-05,
"loss": 0.1482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13907790184020996,
"step": 2275,
"valid_targets_mean": 4162.6,
"valid_targets_min": 1468
},
{
"epoch": 3.6248012718600955,
"grad_norm": 0.4837609246828785,
"learning_rate": 2.226292628929853e-05,
"loss": 0.1474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14810554683208466,
"step": 2280,
"valid_targets_mean": 3524.7,
"valid_targets_min": 947
},
{
"epoch": 3.63275039745628,
"grad_norm": 0.4869827211098654,
"learning_rate": 2.2184124803607525e-05,
"loss": 0.1466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15223252773284912,
"step": 2285,
"valid_targets_mean": 3463.3,
"valid_targets_min": 759
},
{
"epoch": 3.640699523052464,
"grad_norm": 0.4108383751418014,
"learning_rate": 2.210528898681851e-05,
"loss": 0.1539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.142578586935997,
"step": 2290,
"valid_targets_mean": 4477.9,
"valid_targets_min": 1006
},
{
"epoch": 3.6486486486486487,
"grad_norm": 0.4566807244274852,
"learning_rate": 2.2026420078109825e-05,
"loss": 0.1373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13954466581344604,
"step": 2295,
"valid_targets_mean": 4329.2,
"valid_targets_min": 1167
},
{
"epoch": 3.6565977742448332,
"grad_norm": 0.4162315487171508,
"learning_rate": 2.1947519317179972e-05,
"loss": 0.1544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11526475101709366,
"step": 2300,
"valid_targets_mean": 4507.4,
"valid_targets_min": 775
},
{
"epoch": 3.6645468998410173,
"grad_norm": 0.4900587733241069,
"learning_rate": 2.1868587944228118e-05,
"loss": 0.1595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15211628377437592,
"step": 2305,
"valid_targets_mean": 3048.8,
"valid_targets_min": 286
},
{
"epoch": 3.672496025437202,
"grad_norm": 0.5187421796257302,
"learning_rate": 2.1789627199934588e-05,
"loss": 0.1605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1537800431251526,
"step": 2310,
"valid_targets_mean": 3951.4,
"valid_targets_min": 723
},
{
"epoch": 3.6804451510333864,
"grad_norm": 0.4523155098757611,
"learning_rate": 2.1710638325441408e-05,
"loss": 0.1445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15439185500144958,
"step": 2315,
"valid_targets_mean": 3848.8,
"valid_targets_min": 468
},
{
"epoch": 3.6883942766295705,
"grad_norm": 0.5113186455328838,
"learning_rate": 2.1631622562332744e-05,
"loss": 0.1497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12993109226226807,
"step": 2320,
"valid_targets_mean": 3168.6,
"valid_targets_min": 203
},
{
"epoch": 3.696343402225755,
"grad_norm": 0.520264446513899,
"learning_rate": 2.155258115261542e-05,
"loss": 0.1453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1672590672969818,
"step": 2325,
"valid_targets_mean": 3197.3,
"valid_targets_min": 538
},
{
"epoch": 3.7042925278219396,
"grad_norm": 0.397858988377642,
"learning_rate": 2.1473515338699383e-05,
"loss": 0.146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13418936729431152,
"step": 2330,
"valid_targets_mean": 4454.8,
"valid_targets_min": 278
},
{
"epoch": 3.7122416534181237,
"grad_norm": 0.47038464892938564,
"learning_rate": 2.1394426363378186e-05,
"loss": 0.1567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14343999326229095,
"step": 2335,
"valid_targets_mean": 3456.6,
"valid_targets_min": 524
},
{
"epoch": 3.7201907790143083,
"grad_norm": 0.4590271298948369,
"learning_rate": 2.1315315469809426e-05,
"loss": 0.1465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15839475393295288,
"step": 2340,
"valid_targets_mean": 3980.2,
"valid_targets_min": 1039
},
{
"epoch": 3.728139904610493,
"grad_norm": 0.526091163735105,
"learning_rate": 2.1236183901495236e-05,
"loss": 0.1668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21831142902374268,
"step": 2345,
"valid_targets_mean": 3343.4,
"valid_targets_min": 578
},
{
"epoch": 3.7360890302066774,
"grad_norm": 0.4487683579294528,
"learning_rate": 2.1157032902262716e-05,
"loss": 0.1424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15747785568237305,
"step": 2350,
"valid_targets_mean": 4185.1,
"valid_targets_min": 834
},
{
"epoch": 3.744038155802862,
"grad_norm": 0.41019128305055114,
"learning_rate": 2.1077863716244388e-05,
"loss": 0.1415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12705016136169434,
"step": 2355,
"valid_targets_mean": 3949.4,
"valid_targets_min": 656
},
{
"epoch": 3.751987281399046,
"grad_norm": 0.446236415640611,
"learning_rate": 2.099867758785866e-05,
"loss": 0.1476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14645332098007202,
"step": 2360,
"valid_targets_mean": 3793.7,
"valid_targets_min": 551
},
{
"epoch": 3.7599364069952306,
"grad_norm": 0.5374551107704829,
"learning_rate": 2.091947576179023e-05,
"loss": 0.1483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1566208451986313,
"step": 2365,
"valid_targets_mean": 3043.1,
"valid_targets_min": 279
},
{
"epoch": 3.767885532591415,
"grad_norm": 0.48392227359646184,
"learning_rate": 2.084025948297055e-05,
"loss": 0.1393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14955100417137146,
"step": 2370,
"valid_targets_mean": 3625.3,
"valid_targets_min": 777
},
{
"epoch": 3.7758346581875992,
"grad_norm": 0.4196458061277742,
"learning_rate": 2.0761029996558233e-05,
"loss": 0.1379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13161495327949524,
"step": 2375,
"valid_targets_mean": 3986.8,
"valid_targets_min": 1095
},
{
"epoch": 3.7837837837837838,
"grad_norm": 0.40047392629967743,
"learning_rate": 2.068178854791951e-05,
"loss": 0.1446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13223011791706085,
"step": 2380,
"valid_targets_mean": 4361.8,
"valid_targets_min": 555
},
{
"epoch": 3.7917329093799683,
"grad_norm": 0.3964855035870811,
"learning_rate": 2.0602536382608638e-05,
"loss": 0.1452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12523694336414337,
"step": 2385,
"valid_targets_mean": 4463.9,
"valid_targets_min": 790
},
{
"epoch": 3.7996820349761524,
"grad_norm": 0.4585272620018194,
"learning_rate": 2.0523274746348315e-05,
"loss": 0.1525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16742074489593506,
"step": 2390,
"valid_targets_mean": 4025.6,
"valid_targets_min": 1296
},
{
"epoch": 3.807631160572337,
"grad_norm": 0.5154964949124577,
"learning_rate": 2.0444004885010114e-05,
"loss": 0.1542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14283734560012817,
"step": 2395,
"valid_targets_mean": 2625.4,
"valid_targets_min": 718
},
{
"epoch": 3.8155802861685215,
"grad_norm": 0.40675149816537554,
"learning_rate": 2.0364728044594897e-05,
"loss": 0.1434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13937920331954956,
"step": 2400,
"valid_targets_mean": 4620.8,
"valid_targets_min": 847
},
{
"epoch": 3.8235294117647056,
"grad_norm": 0.44791101289332774,
"learning_rate": 2.0285445471213218e-05,
"loss": 0.151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11926200985908508,
"step": 2405,
"valid_targets_mean": 3797.2,
"valid_targets_min": 280
},
{
"epoch": 3.83147853736089,
"grad_norm": 0.4690049435912802,
"learning_rate": 2.020615841106575e-05,
"loss": 0.1503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.158674418926239,
"step": 2410,
"valid_targets_mean": 3615.0,
"valid_targets_min": 434
},
{
"epoch": 3.8394276629570747,
"grad_norm": 0.4778625950349475,
"learning_rate": 2.0126868110423685e-05,
"loss": 0.1582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1569017916917801,
"step": 2415,
"valid_targets_mean": 3607.1,
"valid_targets_min": 244
},
{
"epoch": 3.8473767885532593,
"grad_norm": 0.5094399368297139,
"learning_rate": 2.0047575815609166e-05,
"loss": 0.1508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13234496116638184,
"step": 2420,
"valid_targets_mean": 4075.4,
"valid_targets_min": 1276
},
{
"epoch": 3.855325914149444,
"grad_norm": 0.4474580576793741,
"learning_rate": 1.996828277297566e-05,
"loss": 0.1469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1673652082681656,
"step": 2425,
"valid_targets_mean": 3956.6,
"valid_targets_min": 687
},
{
"epoch": 3.863275039745628,
"grad_norm": 0.47557411799173016,
"learning_rate": 1.988899022888841e-05,
"loss": 0.1469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14662069082260132,
"step": 2430,
"valid_targets_mean": 3376.6,
"valid_targets_min": 290
},
{
"epoch": 3.8712241653418125,
"grad_norm": 0.47253918336301953,
"learning_rate": 1.98096994297048e-05,
"loss": 0.156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17109301686286926,
"step": 2435,
"valid_targets_mean": 4009.4,
"valid_targets_min": 621
},
{
"epoch": 3.879173290937997,
"grad_norm": 0.4811824636612629,
"learning_rate": 1.9730411621754798e-05,
"loss": 0.1507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16535258293151855,
"step": 2440,
"valid_targets_mean": 4401.9,
"valid_targets_min": 1153
},
{
"epoch": 3.887122416534181,
"grad_norm": 0.47574278128170894,
"learning_rate": 1.9651128051321376e-05,
"loss": 0.1568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16865494847297668,
"step": 2445,
"valid_targets_mean": 3826.2,
"valid_targets_min": 743
},
{
"epoch": 3.8950715421303657,
"grad_norm": 0.4927720545302061,
"learning_rate": 1.9571849964620858e-05,
"loss": 0.149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1311875879764557,
"step": 2450,
"valid_targets_mean": 2777.1,
"valid_targets_min": 619
},
{
"epoch": 3.90302066772655,
"grad_norm": 0.4520272890103647,
"learning_rate": 1.949257860778339e-05,
"loss": 0.1509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19364655017852783,
"step": 2455,
"valid_targets_mean": 4212.9,
"valid_targets_min": 304
},
{
"epoch": 3.9109697933227343,
"grad_norm": 0.48056289266042657,
"learning_rate": 1.9413315226833343e-05,
"loss": 0.1507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1471574306488037,
"step": 2460,
"valid_targets_mean": 3280.9,
"valid_targets_min": 988
},
{
"epoch": 3.918918918918919,
"grad_norm": 0.44927106422669333,
"learning_rate": 1.9334061067669725e-05,
"loss": 0.161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15913772583007812,
"step": 2465,
"valid_targets_mean": 4163.8,
"valid_targets_min": 525
},
{
"epoch": 3.9268680445151034,
"grad_norm": 0.4047406712647876,
"learning_rate": 1.9254817376046556e-05,
"loss": 0.1628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14912940561771393,
"step": 2470,
"valid_targets_mean": 4459.5,
"valid_targets_min": 1301
},
{
"epoch": 3.9348171701112875,
"grad_norm": 0.48354323358352247,
"learning_rate": 1.9175585397553368e-05,
"loss": 0.1459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14772868156433105,
"step": 2475,
"valid_targets_mean": 3460.9,
"valid_targets_min": 746
},
{
"epoch": 3.942766295707472,
"grad_norm": 0.45165188294145747,
"learning_rate": 1.909636637759554e-05,
"loss": 0.1585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14915470778942108,
"step": 2480,
"valid_targets_mean": 3941.9,
"valid_targets_min": 753
},
{
"epoch": 3.9507154213036566,
"grad_norm": 0.675364427291404,
"learning_rate": 1.9017161561374787e-05,
"loss": 0.1375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14537788927555084,
"step": 2485,
"valid_targets_mean": 3596.5,
"valid_targets_min": 271
},
{
"epoch": 3.958664546899841,
"grad_norm": 0.4529521240142203,
"learning_rate": 1.893797219386957e-05,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14005938172340393,
"step": 2490,
"valid_targets_mean": 3370.2,
"valid_targets_min": 491
},
{
"epoch": 3.9666136724960257,
"grad_norm": 0.43898112823019947,
"learning_rate": 1.885879951981549e-05,
"loss": 0.143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1563473492860794,
"step": 2495,
"valid_targets_mean": 4142.4,
"valid_targets_min": 519
},
{
"epoch": 3.97456279809221,
"grad_norm": 0.4632944157750017,
"learning_rate": 1.877964478368577e-05,
"loss": 0.1581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15442904829978943,
"step": 2500,
"valid_targets_mean": 3855.9,
"valid_targets_min": 302
},
{
"epoch": 3.9825119236883944,
"grad_norm": 0.4422485867941161,
"learning_rate": 1.8700509229671696e-05,
"loss": 0.1462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1370777189731598,
"step": 2505,
"valid_targets_mean": 3780.2,
"valid_targets_min": 1165
},
{
"epoch": 3.990461049284579,
"grad_norm": 0.40877054927258344,
"learning_rate": 1.8621394101663003e-05,
"loss": 0.1471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1423787623643875,
"step": 2510,
"valid_targets_mean": 4734.8,
"valid_targets_min": 519
},
{
"epoch": 3.998410174880763,
"grad_norm": 0.49482609642383296,
"learning_rate": 1.854230064322837e-05,
"loss": 0.1383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15848851203918457,
"step": 2515,
"valid_targets_mean": 3223.8,
"valid_targets_min": 275
},
{
"epoch": 4.006359300476947,
"grad_norm": 0.3675406957911613,
"learning_rate": 1.8463230097595887e-05,
"loss": 0.1376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13189461827278137,
"step": 2520,
"valid_targets_mean": 4952.8,
"valid_targets_min": 1721
},
{
"epoch": 4.014308426073132,
"grad_norm": 0.507020553139243,
"learning_rate": 1.8384183707633475e-05,
"loss": 0.1316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1438116431236267,
"step": 2525,
"valid_targets_mean": 3300.6,
"valid_targets_min": 677
},
{
"epoch": 4.022257551669316,
"grad_norm": 0.47001299296067484,
"learning_rate": 1.8305162715829348e-05,
"loss": 0.139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14781130850315094,
"step": 2530,
"valid_targets_mean": 3934.6,
"valid_targets_min": 921
},
{
"epoch": 4.030206677265501,
"grad_norm": 0.41847190140441093,
"learning_rate": 1.8226168364272534e-05,
"loss": 0.123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11341873556375504,
"step": 2535,
"valid_targets_mean": 4553.1,
"valid_targets_min": 1276
},
{
"epoch": 4.038155802861685,
"grad_norm": 0.5373424873152618,
"learning_rate": 1.8147201894633282e-05,
"loss": 0.1284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10829570144414902,
"step": 2540,
"valid_targets_mean": 4025.9,
"valid_targets_min": 551
},
{
"epoch": 4.046104928457869,
"grad_norm": 0.44151630488419186,
"learning_rate": 1.8068264548143605e-05,
"loss": 0.1361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13234928250312805,
"step": 2545,
"valid_targets_mean": 4406.9,
"valid_targets_min": 290
},
{
"epoch": 4.054054054054054,
"grad_norm": 0.44111473492914083,
"learning_rate": 1.7989357565577746e-05,
"loss": 0.1209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12020754814147949,
"step": 2550,
"valid_targets_mean": 3875.1,
"valid_targets_min": 984
},
{
"epoch": 4.0620031796502385,
"grad_norm": 0.497648457748331,
"learning_rate": 1.7910482187232643e-05,
"loss": 0.1271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13153505325317383,
"step": 2555,
"valid_targets_mean": 3588.8,
"valid_targets_min": 308
},
{
"epoch": 4.069952305246423,
"grad_norm": 0.4466450096417644,
"learning_rate": 1.7831639652908507e-05,
"loss": 0.132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1519913375377655,
"step": 2560,
"valid_targets_mean": 4519.4,
"valid_targets_min": 373
},
{
"epoch": 4.077901430842608,
"grad_norm": 0.5133411375199687,
"learning_rate": 1.775283120188925e-05,
"loss": 0.12,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11747326701879501,
"step": 2565,
"valid_targets_mean": 3593.9,
"valid_targets_min": 696
},
{
"epoch": 4.085850556438792,
"grad_norm": 0.5340060908823832,
"learning_rate": 1.7674058072923075e-05,
"loss": 0.1424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14561407268047333,
"step": 2570,
"valid_targets_mean": 2832.8,
"valid_targets_min": 691
},
{
"epoch": 4.093799682034976,
"grad_norm": 0.5131875664235621,
"learning_rate": 1.7595321504202977e-05,
"loss": 0.1352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13636553287506104,
"step": 2575,
"valid_targets_mean": 3649.6,
"valid_targets_min": 251
},
{
"epoch": 4.101748807631161,
"grad_norm": 0.49807691314048513,
"learning_rate": 1.751662273334725e-05,
"loss": 0.1355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14528346061706543,
"step": 2580,
"valid_targets_mean": 3304.9,
"valid_targets_min": 273
},
{
"epoch": 4.109697933227345,
"grad_norm": 0.5137089285911086,
"learning_rate": 1.7437962997380093e-05,
"loss": 0.1315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12808027863502502,
"step": 2585,
"valid_targets_mean": 3785.6,
"valid_targets_min": 357
},
{
"epoch": 4.117647058823529,
"grad_norm": 0.4503928265620839,
"learning_rate": 1.7359343532712135e-05,
"loss": 0.1379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14875495433807373,
"step": 2590,
"valid_targets_mean": 4586.7,
"valid_targets_min": 270
},
{
"epoch": 4.125596184419714,
"grad_norm": 0.4166285208229854,
"learning_rate": 1.7280765575120992e-05,
"loss": 0.136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11069852113723755,
"step": 2595,
"valid_targets_mean": 4363.1,
"valid_targets_min": 498
},
{
"epoch": 4.133545310015898,
"grad_norm": 0.5155386718641107,
"learning_rate": 1.7202230359731835e-05,
"loss": 0.1373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14892956614494324,
"step": 2600,
"valid_targets_mean": 3399.8,
"valid_targets_min": 592
},
{
"epoch": 4.141494435612083,
"grad_norm": 0.526180170879376,
"learning_rate": 1.7123739120998033e-05,
"loss": 0.1252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.133394256234169,
"step": 2605,
"valid_targets_mean": 3551.6,
"valid_targets_min": 519
},
{
"epoch": 4.149443561208267,
"grad_norm": 0.43448892503799785,
"learning_rate": 1.7045293092681686e-05,
"loss": 0.1308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12770622968673706,
"step": 2610,
"valid_targets_mean": 4312.1,
"valid_targets_min": 278
},
{
"epoch": 4.157392686804451,
"grad_norm": 0.47438188721000024,
"learning_rate": 1.6966893507834242e-05,
"loss": 0.1388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11475702375173569,
"step": 2615,
"valid_targets_mean": 3365.8,
"valid_targets_min": 527
},
{
"epoch": 4.165341812400636,
"grad_norm": 0.4734353597894468,
"learning_rate": 1.6888541598777167e-05,
"loss": 0.1413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14915436506271362,
"step": 2620,
"valid_targets_mean": 3915.1,
"valid_targets_min": 709
},
{
"epoch": 4.17329093799682,
"grad_norm": 0.44954055606792176,
"learning_rate": 1.68102385970825e-05,
"loss": 0.1295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12147843092679977,
"step": 2625,
"valid_targets_mean": 4042.4,
"valid_targets_min": 702
},
{
"epoch": 4.1812400635930045,
"grad_norm": 0.5461716268999647,
"learning_rate": 1.6731985733553545e-05,
"loss": 0.1351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1752236783504486,
"step": 2630,
"valid_targets_mean": 3508.4,
"valid_targets_min": 237
},
{
"epoch": 4.1891891891891895,
"grad_norm": 0.47376122084778394,
"learning_rate": 1.6653784238205525e-05,
"loss": 0.137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13985666632652283,
"step": 2635,
"valid_targets_mean": 3967.4,
"valid_targets_min": 633
},
{
"epoch": 4.197138314785374,
"grad_norm": 0.49860840899961373,
"learning_rate": 1.6575635340246203e-05,
"loss": 0.142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13958841562271118,
"step": 2640,
"valid_targets_mean": 3776.4,
"valid_targets_min": 581
},
{
"epoch": 4.205087440381558,
"grad_norm": 0.5671244632485692,
"learning_rate": 1.649754026805662e-05,
"loss": 0.1334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17595896124839783,
"step": 2645,
"valid_targets_mean": 3767.5,
"valid_targets_min": 239
},
{
"epoch": 4.213036565977743,
"grad_norm": 0.4534522358165292,
"learning_rate": 1.6419500249171737e-05,
"loss": 0.1256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12649832665920258,
"step": 2650,
"valid_targets_mean": 3767.0,
"valid_targets_min": 300
},
{
"epoch": 4.220985691573927,
"grad_norm": 0.48461063763882706,
"learning_rate": 1.634151651026118e-05,
"loss": 0.1253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11336950957775116,
"step": 2655,
"valid_targets_mean": 3496.2,
"valid_targets_min": 337
},
{
"epoch": 4.228934817170111,
"grad_norm": 0.5517432754534229,
"learning_rate": 1.626359027710993e-05,
"loss": 0.1255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12822790443897247,
"step": 2660,
"valid_targets_mean": 2547.8,
"valid_targets_min": 368
},
{
"epoch": 4.236883942766296,
"grad_norm": 0.6506977836059051,
"learning_rate": 1.6185722774599064e-05,
"loss": 0.1323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13393157720565796,
"step": 2665,
"valid_targets_mean": 3280.5,
"valid_targets_min": 611
},
{
"epoch": 4.24483306836248,
"grad_norm": 0.5560817254019538,
"learning_rate": 1.6107915226686504e-05,
"loss": 0.1324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1394142508506775,
"step": 2670,
"valid_targets_mean": 3167.7,
"valid_targets_min": 512
},
{
"epoch": 4.252782193958664,
"grad_norm": 0.531467297115508,
"learning_rate": 1.603016885638779e-05,
"loss": 0.1431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14491944015026093,
"step": 2675,
"valid_targets_mean": 3221.8,
"valid_targets_min": 247
},
{
"epoch": 4.260731319554849,
"grad_norm": 0.4488475679526595,
"learning_rate": 1.5952484885756827e-05,
"loss": 0.1423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13313503563404083,
"step": 2680,
"valid_targets_mean": 3901.4,
"valid_targets_min": 317
},
{
"epoch": 4.268680445151033,
"grad_norm": 0.47568888206678156,
"learning_rate": 1.587486453586669e-05,
"loss": 0.1346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12674440443515778,
"step": 2685,
"valid_targets_mean": 3657.6,
"valid_targets_min": 513
},
{
"epoch": 4.276629570747218,
"grad_norm": 0.46272650057707004,
"learning_rate": 1.579730902679045e-05,
"loss": 0.1339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15541914105415344,
"step": 2690,
"valid_targets_mean": 4025.2,
"valid_targets_min": 502
},
{
"epoch": 4.284578696343402,
"grad_norm": 0.4472468025529375,
"learning_rate": 1.5719819577581982e-05,
"loss": 0.1223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12270389497280121,
"step": 2695,
"valid_targets_mean": 3892.1,
"valid_targets_min": 793
},
{
"epoch": 4.292527821939586,
"grad_norm": 0.5592143714752654,
"learning_rate": 1.5642397406256768e-05,
"loss": 0.1291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15055924654006958,
"step": 2700,
"valid_targets_mean": 2888.4,
"valid_targets_min": 663
},
{
"epoch": 4.300476947535771,
"grad_norm": 0.6380121268077782,
"learning_rate": 1.556504372977283e-05,
"loss": 0.1457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17369496822357178,
"step": 2705,
"valid_targets_mean": 3295.8,
"valid_targets_min": 450
},
{
"epoch": 4.3084260731319555,
"grad_norm": 0.43592849432503594,
"learning_rate": 1.548775976401152e-05,
"loss": 0.1417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12458646297454834,
"step": 2710,
"valid_targets_mean": 4257.1,
"valid_targets_min": 673
},
{
"epoch": 4.31637519872814,
"grad_norm": 0.5249006611498069,
"learning_rate": 1.5410546723758452e-05,
"loss": 0.1429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1341407299041748,
"step": 2715,
"valid_targets_mean": 3361.5,
"valid_targets_min": 260
},
{
"epoch": 4.324324324324325,
"grad_norm": 0.4535416533335133,
"learning_rate": 1.5333405822684428e-05,
"loss": 0.1254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1214504987001419,
"step": 2720,
"valid_targets_mean": 4414.6,
"valid_targets_min": 540
},
{
"epoch": 4.332273449920509,
"grad_norm": 0.4731025497262397,
"learning_rate": 1.5256338273326293e-05,
"loss": 0.127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13752460479736328,
"step": 2725,
"valid_targets_mean": 3609.0,
"valid_targets_min": 1095
},
{
"epoch": 4.340222575516693,
"grad_norm": 0.5291643855694953,
"learning_rate": 1.5179345287067935e-05,
"loss": 0.1349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14532646536827087,
"step": 2730,
"valid_targets_mean": 3274.8,
"valid_targets_min": 736
},
{
"epoch": 4.348171701112878,
"grad_norm": 0.49276963970488963,
"learning_rate": 1.5102428074121222e-05,
"loss": 0.1359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13466641306877136,
"step": 2735,
"valid_targets_mean": 4083.1,
"valid_targets_min": 243
},
{
"epoch": 4.356120826709062,
"grad_norm": 0.5271105291571133,
"learning_rate": 1.5025587843506986e-05,
"loss": 0.1387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13063038885593414,
"step": 2740,
"valid_targets_mean": 3548.1,
"valid_targets_min": 617
},
{
"epoch": 4.364069952305247,
"grad_norm": 0.5029010534111552,
"learning_rate": 1.4948825803035996e-05,
"loss": 0.1302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.115936279296875,
"step": 2745,
"valid_targets_mean": 4106.9,
"valid_targets_min": 581
},
{
"epoch": 4.372019077901431,
"grad_norm": 0.4305157347551604,
"learning_rate": 1.4872143159290016e-05,
"loss": 0.1379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1385708451271057,
"step": 2750,
"valid_targets_mean": 4007.7,
"valid_targets_min": 781
},
{
"epoch": 4.379968203497615,
"grad_norm": 0.5872775238224067,
"learning_rate": 1.4795541117602808e-05,
"loss": 0.131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11982855200767517,
"step": 2755,
"valid_targets_mean": 3377.2,
"valid_targets_min": 646
},
{
"epoch": 4.3879173290938,
"grad_norm": 0.4813077822857676,
"learning_rate": 1.4719020882041175e-05,
"loss": 0.1351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1347476989030838,
"step": 2760,
"valid_targets_mean": 3714.1,
"valid_targets_min": 598
},
{
"epoch": 4.395866454689984,
"grad_norm": 0.5454824004525505,
"learning_rate": 1.4642583655386084e-05,
"loss": 0.1306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12626631557941437,
"step": 2765,
"valid_targets_mean": 3165.4,
"valid_targets_min": 689
},
{
"epoch": 4.403815580286168,
"grad_norm": 0.4885305355016124,
"learning_rate": 1.4566230639113696e-05,
"loss": 0.1332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1025635302066803,
"step": 2770,
"valid_targets_mean": 4869.7,
"valid_targets_min": 683
},
{
"epoch": 4.411764705882353,
"grad_norm": 0.4770935247503296,
"learning_rate": 1.448996303337654e-05,
"loss": 0.134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.124050073325634,
"step": 2775,
"valid_targets_mean": 3172.6,
"valid_targets_min": 720
},
{
"epoch": 4.419713831478537,
"grad_norm": 0.46987397640146145,
"learning_rate": 1.4413782036984616e-05,
"loss": 0.1255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11378094553947449,
"step": 2780,
"valid_targets_mean": 3712.6,
"valid_targets_min": 666
},
{
"epoch": 4.4276629570747215,
"grad_norm": 0.4291495568703118,
"learning_rate": 1.4337688847386542e-05,
"loss": 0.1251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10549108684062958,
"step": 2785,
"valid_targets_mean": 3789.5,
"valid_targets_min": 545
},
{
"epoch": 4.4356120826709065,
"grad_norm": 0.48467330245194035,
"learning_rate": 1.426168466065077e-05,
"loss": 0.1378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14184287190437317,
"step": 2790,
"valid_targets_mean": 4098.1,
"valid_targets_min": 1006
},
{
"epoch": 4.443561208267091,
"grad_norm": 0.4320267387261653,
"learning_rate": 1.4185770671446743e-05,
"loss": 0.1397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11710529029369354,
"step": 2795,
"valid_targets_mean": 4207.4,
"valid_targets_min": 891
},
{
"epoch": 4.451510333863275,
"grad_norm": 0.4899699268579415,
"learning_rate": 1.4109948073026153e-05,
"loss": 0.1378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13632246851921082,
"step": 2800,
"valid_targets_mean": 3296.7,
"valid_targets_min": 635
},
{
"epoch": 4.45945945945946,
"grad_norm": 0.43337393856388357,
"learning_rate": 1.4034218057204165e-05,
"loss": 0.1368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12501519918441772,
"step": 2805,
"valid_targets_mean": 3881.5,
"valid_targets_min": 919
},
{
"epoch": 4.467408585055644,
"grad_norm": 0.4398737794805095,
"learning_rate": 1.3958581814340679e-05,
"loss": 0.1274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11017243564128876,
"step": 2810,
"valid_targets_mean": 3680.9,
"valid_targets_min": 219
},
{
"epoch": 4.475357710651828,
"grad_norm": 0.5233156447822513,
"learning_rate": 1.3883040533321637e-05,
"loss": 0.1281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1441815048456192,
"step": 2815,
"valid_targets_mean": 3133.9,
"valid_targets_min": 341
},
{
"epoch": 4.483306836248013,
"grad_norm": 0.4598890957258285,
"learning_rate": 1.3807595401540322e-05,
"loss": 0.1356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14368480443954468,
"step": 2820,
"valid_targets_mean": 4432.7,
"valid_targets_min": 291
},
{
"epoch": 4.491255961844197,
"grad_norm": 0.5085977500037545,
"learning_rate": 1.3732247604878697e-05,
"loss": 0.1352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12015148252248764,
"step": 2825,
"valid_targets_mean": 3563.8,
"valid_targets_min": 587
},
{
"epoch": 4.499205087440382,
"grad_norm": 0.5315330999004808,
"learning_rate": 1.3656998327688764e-05,
"loss": 0.1392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1353592574596405,
"step": 2830,
"valid_targets_mean": 3689.6,
"valid_targets_min": 204
},
{
"epoch": 4.507154213036566,
"grad_norm": 0.5305726504410712,
"learning_rate": 1.3581848752773961e-05,
"loss": 0.1219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11149744689464569,
"step": 2835,
"valid_targets_mean": 3077.8,
"valid_targets_min": 512
},
{
"epoch": 4.51510333863275,
"grad_norm": 0.5139894765702253,
"learning_rate": 1.3506800061370555e-05,
"loss": 0.1471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14306671917438507,
"step": 2840,
"valid_targets_mean": 3728.9,
"valid_targets_min": 1152
},
{
"epoch": 4.523052464228935,
"grad_norm": 0.4814345025583722,
"learning_rate": 1.3431853433129058e-05,
"loss": 0.1246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11117015779018402,
"step": 2845,
"valid_targets_mean": 3341.5,
"valid_targets_min": 566
},
{
"epoch": 4.531001589825119,
"grad_norm": 0.5079196992633277,
"learning_rate": 1.3357010046095741e-05,
"loss": 0.1378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17309923470020294,
"step": 2850,
"valid_targets_mean": 2918.5,
"valid_targets_min": 816
},
{
"epoch": 4.538950715421303,
"grad_norm": 0.4517165892172054,
"learning_rate": 1.3282271076694052e-05,
"loss": 0.1296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1249191164970398,
"step": 2855,
"valid_targets_mean": 4362.0,
"valid_targets_min": 951
},
{
"epoch": 4.546899841017488,
"grad_norm": 0.47163152664152436,
"learning_rate": 1.3207637699706162e-05,
"loss": 0.1322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13854432106018066,
"step": 2860,
"valid_targets_mean": 3941.9,
"valid_targets_min": 248
},
{
"epoch": 4.5548489666136724,
"grad_norm": 0.4474413787281936,
"learning_rate": 1.3133111088254507e-05,
"loss": 0.1267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11171597242355347,
"step": 2865,
"valid_targets_mean": 3772.6,
"valid_targets_min": 254
},
{
"epoch": 4.5627980922098565,
"grad_norm": 0.5078641249343999,
"learning_rate": 1.3058692413783307e-05,
"loss": 0.1407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13531452417373657,
"step": 2870,
"valid_targets_mean": 3739.0,
"valid_targets_min": 678
},
{
"epoch": 4.5707472178060415,
"grad_norm": 0.7026774408330564,
"learning_rate": 1.2984382846040187e-05,
"loss": 0.1315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1399625539779663,
"step": 2875,
"valid_targets_mean": 4271.8,
"valid_targets_min": 716
},
{
"epoch": 4.578696343402226,
"grad_norm": 0.46761769157477573,
"learning_rate": 1.2910183553057788e-05,
"loss": 0.1426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14058490097522736,
"step": 2880,
"valid_targets_mean": 3651.0,
"valid_targets_min": 310
},
{
"epoch": 4.586645468998411,
"grad_norm": 0.4383231851637327,
"learning_rate": 1.2836095701135398e-05,
"loss": 0.1322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11564694344997406,
"step": 2885,
"valid_targets_mean": 3662.7,
"valid_targets_min": 691
},
{
"epoch": 4.594594594594595,
"grad_norm": 0.46123656999116863,
"learning_rate": 1.2762120454820628e-05,
"loss": 0.1274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1169496402144432,
"step": 2890,
"valid_targets_mean": 3931.8,
"valid_targets_min": 250
},
{
"epoch": 4.602543720190779,
"grad_norm": 0.4338183551025682,
"learning_rate": 1.268825897689108e-05,
"loss": 0.1292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12584465742111206,
"step": 2895,
"valid_targets_mean": 4739.1,
"valid_targets_min": 1044
},
{
"epoch": 4.610492845786963,
"grad_norm": 0.4172369284320454,
"learning_rate": 1.2614512428336105e-05,
"loss": 0.1321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12070607393980026,
"step": 2900,
"valid_targets_mean": 5442.9,
"valid_targets_min": 673
},
{
"epoch": 4.618441971383148,
"grad_norm": 0.47358327667927247,
"learning_rate": 1.254088196833855e-05,
"loss": 0.1318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1363537609577179,
"step": 2905,
"valid_targets_mean": 4575.1,
"valid_targets_min": 524
},
{
"epoch": 4.626391096979332,
"grad_norm": 0.46039621956253657,
"learning_rate": 1.2467368754256513e-05,
"loss": 0.138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1305224895477295,
"step": 2910,
"valid_targets_mean": 4386.9,
"valid_targets_min": 716
},
{
"epoch": 4.634340222575517,
"grad_norm": 0.48832499251309247,
"learning_rate": 1.2393973941605161e-05,
"loss": 0.1308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.125309556722641,
"step": 2915,
"valid_targets_mean": 3788.6,
"valid_targets_min": 988
},
{
"epoch": 4.642289348171701,
"grad_norm": 0.5232937532641884,
"learning_rate": 1.2320698684038599e-05,
"loss": 0.1371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1394532024860382,
"step": 2920,
"valid_targets_mean": 3360.9,
"valid_targets_min": 258
},
{
"epoch": 4.650238473767885,
"grad_norm": 0.4558597876370874,
"learning_rate": 1.2247544133331681e-05,
"loss": 0.1303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11967042088508606,
"step": 2925,
"valid_targets_mean": 4315.3,
"valid_targets_min": 281
},
{
"epoch": 4.65818759936407,
"grad_norm": 0.5566298887502414,
"learning_rate": 1.2174511439361943e-05,
"loss": 0.1467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1408625692129135,
"step": 2930,
"valid_targets_mean": 2664.5,
"valid_targets_min": 744
},
{
"epoch": 4.666136724960254,
"grad_norm": 0.48634223320131703,
"learning_rate": 1.2101601750091528e-05,
"loss": 0.1379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16628813743591309,
"step": 2935,
"valid_targets_mean": 4301.5,
"valid_targets_min": 1436
},
{
"epoch": 4.674085850556438,
"grad_norm": 0.46133307731688006,
"learning_rate": 1.2028816211549117e-05,
"loss": 0.1206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12970274686813354,
"step": 2940,
"valid_targets_mean": 4872.5,
"valid_targets_min": 1521
},
{
"epoch": 4.682034976152623,
"grad_norm": 0.42861468167336814,
"learning_rate": 1.195615596781194e-05,
"loss": 0.1325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1275981068611145,
"step": 2945,
"valid_targets_mean": 4291.4,
"valid_targets_min": 1324
},
{
"epoch": 4.6899841017488075,
"grad_norm": 0.45633412060443734,
"learning_rate": 1.18836221609878e-05,
"loss": 0.123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12598268687725067,
"step": 2950,
"valid_targets_mean": 4175.3,
"valid_targets_min": 839
},
{
"epoch": 4.697933227344992,
"grad_norm": 0.5343832571290266,
"learning_rate": 1.1811215931197084e-05,
"loss": 0.1332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1605256199836731,
"step": 2955,
"valid_targets_mean": 3076.2,
"valid_targets_min": 774
},
{
"epoch": 4.705882352941177,
"grad_norm": 0.4961038270131699,
"learning_rate": 1.1738938416554857e-05,
"loss": 0.134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13582147657871246,
"step": 2960,
"valid_targets_mean": 3582.1,
"valid_targets_min": 267
},
{
"epoch": 4.713831478537361,
"grad_norm": 0.5512004556887968,
"learning_rate": 1.1666790753153009e-05,
"loss": 0.1479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13612379133701324,
"step": 2965,
"valid_targets_mean": 2709.6,
"valid_targets_min": 977
},
{
"epoch": 4.721780604133546,
"grad_norm": 0.5381030618661898,
"learning_rate": 1.1594774075042345e-05,
"loss": 0.1307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1454896181821823,
"step": 2970,
"valid_targets_mean": 3670.9,
"valid_targets_min": 511
},
{
"epoch": 4.72972972972973,
"grad_norm": 0.5509557031574198,
"learning_rate": 1.152288951421478e-05,
"loss": 0.1253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13313612341880798,
"step": 2975,
"valid_targets_mean": 2507.1,
"valid_targets_min": 344
},
{
"epoch": 4.737678855325914,
"grad_norm": 0.5619248692734761,
"learning_rate": 1.1451138200585567e-05,
"loss": 0.1301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13828039169311523,
"step": 2980,
"valid_targets_mean": 3192.6,
"valid_targets_min": 304
},
{
"epoch": 4.745627980922099,
"grad_norm": 0.6067851198602392,
"learning_rate": 1.13795212619755e-05,
"loss": 0.1338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1492369920015335,
"step": 2985,
"valid_targets_mean": 2374.6,
"valid_targets_min": 295
},
{
"epoch": 4.753577106518283,
"grad_norm": 0.4802919158480157,
"learning_rate": 1.1308039824093197e-05,
"loss": 0.1292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1495775282382965,
"step": 2990,
"valid_targets_mean": 3698.0,
"valid_targets_min": 642
},
{
"epoch": 4.761526232114467,
"grad_norm": 0.4709231044726117,
"learning_rate": 1.1236695010517434e-05,
"loss": 0.143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1218520998954773,
"step": 2995,
"valid_targets_mean": 3672.4,
"valid_targets_min": 252
},
{
"epoch": 4.769475357710652,
"grad_norm": 0.43463931612817397,
"learning_rate": 1.116548794267945e-05,
"loss": 0.1253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12758862972259521,
"step": 3000,
"valid_targets_mean": 4420.1,
"valid_targets_min": 413
},
{
"epoch": 4.777424483306836,
"grad_norm": 0.45148983869993,
"learning_rate": 1.109441973984534e-05,
"loss": 0.1288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11758168786764145,
"step": 3005,
"valid_targets_mean": 3833.6,
"valid_targets_min": 199
},
{
"epoch": 4.78537360890302,
"grad_norm": 0.4726760123977448,
"learning_rate": 1.1023491519098439e-05,
"loss": 0.1328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15904685854911804,
"step": 3010,
"valid_targets_mean": 4469.8,
"valid_targets_min": 683
},
{
"epoch": 4.793322734499205,
"grad_norm": 0.5308825581080399,
"learning_rate": 1.0952704395321781e-05,
"loss": 0.1256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13085004687309265,
"step": 3015,
"valid_targets_mean": 3272.6,
"valid_targets_min": 251
},
{
"epoch": 4.801271860095389,
"grad_norm": 0.5180355797993398,
"learning_rate": 1.0882059481180588e-05,
"loss": 0.1264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11950570344924927,
"step": 3020,
"valid_targets_mean": 3030.1,
"valid_targets_min": 349
},
{
"epoch": 4.809220985691574,
"grad_norm": 0.4600006136661297,
"learning_rate": 1.0811557887104747e-05,
"loss": 0.1316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13670320808887482,
"step": 3025,
"valid_targets_mean": 3798.9,
"valid_targets_min": 735
},
{
"epoch": 4.8171701112877585,
"grad_norm": 0.5471165258975516,
"learning_rate": 1.074120072127137e-05,
"loss": 0.139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10859496891498566,
"step": 3030,
"valid_targets_mean": 4030.0,
"valid_targets_min": 285
},
{
"epoch": 4.825119236883943,
"grad_norm": 0.4875896845337796,
"learning_rate": 1.0670989089587395e-05,
"loss": 0.1443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15141701698303223,
"step": 3035,
"valid_targets_mean": 3959.2,
"valid_targets_min": 348
},
{
"epoch": 4.833068362480127,
"grad_norm": 0.46841773833007866,
"learning_rate": 1.0600924095672184e-05,
"loss": 0.1317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1404210776090622,
"step": 3040,
"valid_targets_mean": 4134.9,
"valid_targets_min": 834
},
{
"epoch": 4.841017488076312,
"grad_norm": 0.4822180291377705,
"learning_rate": 1.0531006840840162e-05,
"loss": 0.151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15318647027015686,
"step": 3045,
"valid_targets_mean": 3816.3,
"valid_targets_min": 1540
},
{
"epoch": 4.848966613672496,
"grad_norm": 0.4598922245539829,
"learning_rate": 1.046123842408354e-05,
"loss": 0.1338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.142354816198349,
"step": 3050,
"valid_targets_mean": 4431.2,
"valid_targets_min": 309
},
{
"epoch": 4.856915739268681,
"grad_norm": 0.4289633212386471,
"learning_rate": 1.0391619942055007e-05,
"loss": 0.1313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1268487572669983,
"step": 3055,
"valid_targets_mean": 3981.8,
"valid_targets_min": 806
},
{
"epoch": 4.864864864864865,
"grad_norm": 0.5512192977590487,
"learning_rate": 1.0322152489050508e-05,
"loss": 0.1344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1406165063381195,
"step": 3060,
"valid_targets_mean": 3987.3,
"valid_targets_min": 1264
},
{
"epoch": 4.872813990461049,
"grad_norm": 0.473626788275172,
"learning_rate": 1.0252837156992065e-05,
"loss": 0.1278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12075041234493256,
"step": 3065,
"valid_targets_mean": 3601.8,
"valid_targets_min": 410
},
{
"epoch": 4.880763116057234,
"grad_norm": 0.4208027067707839,
"learning_rate": 1.018367503541057e-05,
"loss": 0.1275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11000724136829376,
"step": 3070,
"valid_targets_mean": 4098.9,
"valid_targets_min": 699
},
{
"epoch": 4.888712241653418,
"grad_norm": 0.4042871962162526,
"learning_rate": 1.0114667211428675e-05,
"loss": 0.1473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12441422045230865,
"step": 3075,
"valid_targets_mean": 5265.6,
"valid_targets_min": 787
},
{
"epoch": 4.896661367249602,
"grad_norm": 0.48474645193150095,
"learning_rate": 1.0045814769743731e-05,
"loss": 0.1372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13803794980049133,
"step": 3080,
"valid_targets_mean": 3752.9,
"valid_targets_min": 725
},
{
"epoch": 4.904610492845787,
"grad_norm": 0.558064394873645,
"learning_rate": 9.977118792610719e-06,
"loss": 0.1415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12287827581167221,
"step": 3085,
"valid_targets_mean": 3135.6,
"valid_targets_min": 673
},
{
"epoch": 4.912559618441971,
"grad_norm": 0.47354314556138427,
"learning_rate": 9.908580359825204e-06,
"loss": 0.136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11178020387887955,
"step": 3090,
"valid_targets_mean": 4488.8,
"valid_targets_min": 466
},
{
"epoch": 4.920508744038155,
"grad_norm": 0.4188496112443199,
"learning_rate": 9.840200548706435e-06,
"loss": 0.1311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1269189715385437,
"step": 3095,
"valid_targets_mean": 4419.6,
"valid_targets_min": 636
},
{
"epoch": 4.92845786963434,
"grad_norm": 0.48069575474565923,
"learning_rate": 9.771980434080348e-06,
"loss": 0.1502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14761850237846375,
"step": 3100,
"valid_targets_mean": 4263.5,
"valid_targets_min": 609
},
{
"epoch": 4.9364069952305245,
"grad_norm": 0.47361836995858364,
"learning_rate": 9.70392108826269e-06,
"loss": 0.1303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1389940083026886,
"step": 3105,
"valid_targets_mean": 3997.1,
"valid_targets_min": 538
},
{
"epoch": 4.9443561208267095,
"grad_norm": 0.502593429400252,
"learning_rate": 9.636023581042191e-06,
"loss": 0.1352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1681274026632309,
"step": 3110,
"valid_targets_mean": 3780.9,
"valid_targets_min": 856
},
{
"epoch": 4.952305246422894,
"grad_norm": 0.6771515271251293,
"learning_rate": 9.5682889796637e-06,
"loss": 0.1403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1500101536512375,
"step": 3115,
"valid_targets_mean": 4520.4,
"valid_targets_min": 549
},
{
"epoch": 4.960254372019078,
"grad_norm": 0.4872072441985026,
"learning_rate": 9.500718348811457e-06,
"loss": 0.1442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1341622769832611,
"step": 3120,
"valid_targets_mean": 3533.3,
"valid_targets_min": 264
},
{
"epoch": 4.968203497615263,
"grad_norm": 0.4872550048404107,
"learning_rate": 9.433312750592337e-06,
"loss": 0.1348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12632372975349426,
"step": 3125,
"valid_targets_mean": 3567.7,
"valid_targets_min": 758
},
{
"epoch": 4.976152623211447,
"grad_norm": 0.4963406118007583,
"learning_rate": 9.366073244519124e-06,
"loss": 0.1262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12338396161794662,
"step": 3130,
"valid_targets_mean": 3381.1,
"valid_targets_min": 551
},
{
"epoch": 4.984101748807631,
"grad_norm": 0.5634271164967108,
"learning_rate": 9.299000887493934e-06,
"loss": 0.13,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14706090092658997,
"step": 3135,
"valid_targets_mean": 3212.7,
"valid_targets_min": 686
},
{
"epoch": 4.992050874403816,
"grad_norm": 0.5169455768152297,
"learning_rate": 9.232096733791518e-06,
"loss": 0.1339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14801155030727386,
"step": 3140,
"valid_targets_mean": 3497.0,
"valid_targets_min": 1131
},
{
"epoch": 5.0,
"grad_norm": 0.4146566743306906,
"learning_rate": 9.165361835042734e-06,
"loss": 0.1386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12379302084445953,
"step": 3145,
"valid_targets_mean": 4029.0,
"valid_targets_min": 281
},
{
"epoch": 5.007949125596184,
"grad_norm": 0.457923014155659,
"learning_rate": 9.098797240218036e-06,
"loss": 0.121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10793712735176086,
"step": 3150,
"valid_targets_mean": 4072.9,
"valid_targets_min": 746
},
{
"epoch": 5.015898251192369,
"grad_norm": 0.5279976098261123,
"learning_rate": 9.032403995610937e-06,
"loss": 0.1228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11182405054569244,
"step": 3155,
"valid_targets_mean": 2553.0,
"valid_targets_min": 538
},
{
"epoch": 5.023847376788553,
"grad_norm": 0.48776564405835493,
"learning_rate": 8.966183144821583e-06,
"loss": 0.1147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10740777850151062,
"step": 3160,
"valid_targets_mean": 3739.8,
"valid_targets_min": 564
},
{
"epoch": 5.031796502384737,
"grad_norm": 0.4595972840148685,
"learning_rate": 8.900135728740373e-06,
"loss": 0.1239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11679710447788239,
"step": 3165,
"valid_targets_mean": 4084.7,
"valid_targets_min": 276
},
{
"epoch": 5.039745627980922,
"grad_norm": 0.47396166912319276,
"learning_rate": 8.83426278553158e-06,
"loss": 0.1073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11660698056221008,
"step": 3170,
"valid_targets_mean": 3834.4,
"valid_targets_min": 644
},
{
"epoch": 5.047694753577106,
"grad_norm": 0.5657974369615991,
"learning_rate": 8.768565350616998e-06,
"loss": 0.1366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16728852689266205,
"step": 3175,
"valid_targets_mean": 3509.4,
"valid_targets_min": 610
},
{
"epoch": 5.0556438791732905,
"grad_norm": 0.4887634707217319,
"learning_rate": 8.703044456659741e-06,
"loss": 0.1238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11223262548446655,
"step": 3180,
"valid_targets_mean": 4200.7,
"valid_targets_min": 598
},
{
"epoch": 5.0635930047694755,
"grad_norm": 0.5536746484103304,
"learning_rate": 8.63770113354794e-06,
"loss": 0.1229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12999343872070312,
"step": 3185,
"valid_targets_mean": 3016.6,
"valid_targets_min": 486
},
{
"epoch": 5.07154213036566,
"grad_norm": 0.43802408737800774,
"learning_rate": 8.572536408378587e-06,
"loss": 0.1221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0922771543264389,
"step": 3190,
"valid_targets_mean": 4741.3,
"valid_targets_min": 285
},
{
"epoch": 5.079491255961845,
"grad_norm": 0.4652049118167889,
"learning_rate": 8.507551305441408e-06,
"loss": 0.1226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12782129645347595,
"step": 3195,
"valid_targets_mean": 4579.9,
"valid_targets_min": 568
},
{
"epoch": 5.087440381558029,
"grad_norm": 0.43604310018158265,
"learning_rate": 8.442746846202711e-06,
"loss": 0.119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09423212707042694,
"step": 3200,
"valid_targets_mean": 4047.1,
"valid_targets_min": 1021
},
{
"epoch": 5.095389507154213,
"grad_norm": 0.49985284842571,
"learning_rate": 8.378124049289394e-06,
"loss": 0.1135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12812739610671997,
"step": 3205,
"valid_targets_mean": 3787.6,
"valid_targets_min": 576
},
{
"epoch": 5.103338632750398,
"grad_norm": 0.5306993606687345,
"learning_rate": 8.313683930472889e-06,
"loss": 0.1259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13846567273139954,
"step": 3210,
"valid_targets_mean": 3789.9,
"valid_targets_min": 537
},
{
"epoch": 5.111287758346582,
"grad_norm": 0.526017364900564,
"learning_rate": 8.249427502653198e-06,
"loss": 0.1231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13277852535247803,
"step": 3215,
"valid_targets_mean": 3243.6,
"valid_targets_min": 623
},
{
"epoch": 5.119236883942766,
"grad_norm": 0.4826797520729495,
"learning_rate": 8.185355775842982e-06,
"loss": 0.1424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1628974825143814,
"step": 3220,
"valid_targets_mean": 4196.1,
"valid_targets_min": 549
},
{
"epoch": 5.127186009538951,
"grad_norm": 0.47266391553239756,
"learning_rate": 8.12146975715171e-06,
"loss": 0.1304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.124434694647789,
"step": 3225,
"valid_targets_mean": 4489.1,
"valid_targets_min": 294
},
{
"epoch": 5.135135135135135,
"grad_norm": 0.5104351929242484,
"learning_rate": 8.057770450769771e-06,
"loss": 0.1269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14183968305587769,
"step": 3230,
"valid_targets_mean": 3486.3,
"valid_targets_min": 660
},
{
"epoch": 5.143084260731319,
"grad_norm": 0.5350401545785989,
"learning_rate": 7.994258857952748e-06,
"loss": 0.1194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14458492398262024,
"step": 3235,
"valid_targets_mean": 3730.2,
"valid_targets_min": 679
},
{
"epoch": 5.151033386327504,
"grad_norm": 0.47568127630523516,
"learning_rate": 7.93093597700564e-06,
"loss": 0.1122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11599075794219971,
"step": 3240,
"valid_targets_mean": 3875.6,
"valid_targets_min": 690
},
{
"epoch": 5.158982511923688,
"grad_norm": 0.5212929399191217,
"learning_rate": 7.867802803267182e-06,
"loss": 0.1249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11911657452583313,
"step": 3245,
"valid_targets_mean": 3369.2,
"valid_targets_min": 221
},
{
"epoch": 5.166931637519872,
"grad_norm": 0.44904326831297614,
"learning_rate": 7.80486032909421e-06,
"loss": 0.1283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13542252779006958,
"step": 3250,
"valid_targets_mean": 5412.6,
"valid_targets_min": 706
},
{
"epoch": 5.174880763116057,
"grad_norm": 0.5816953917270461,
"learning_rate": 7.742109543846063e-06,
"loss": 0.1274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12738856673240662,
"step": 3255,
"valid_targets_mean": 2924.6,
"valid_targets_min": 672
},
{
"epoch": 5.1828298887122415,
"grad_norm": 0.4706987710505265,
"learning_rate": 7.679551433869001e-06,
"loss": 0.1197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11224916577339172,
"step": 3260,
"valid_targets_mean": 4329.3,
"valid_targets_min": 249
},
{
"epoch": 5.1907790143084265,
"grad_norm": 0.4351758065293425,
"learning_rate": 7.617186982480749e-06,
"loss": 0.1186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10177105665206909,
"step": 3265,
"valid_targets_mean": 3785.4,
"valid_targets_min": 1054
},
{
"epoch": 5.198728139904611,
"grad_norm": 0.5015716097475679,
"learning_rate": 7.5550171699549945e-06,
"loss": 0.1219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14602243900299072,
"step": 3270,
"valid_targets_mean": 3782.1,
"valid_targets_min": 663
},
{
"epoch": 5.206677265500795,
"grad_norm": 0.4602593511104768,
"learning_rate": 7.493042973506e-06,
"loss": 0.1194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11888657510280609,
"step": 3275,
"valid_targets_mean": 4810.8,
"valid_targets_min": 1011
},
{
"epoch": 5.21462639109698,
"grad_norm": 0.5526497578097684,
"learning_rate": 7.431265367273268e-06,
"loss": 0.1144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11730851978063583,
"step": 3280,
"valid_targets_mean": 3694.4,
"valid_targets_min": 281
},
{
"epoch": 5.222575516693164,
"grad_norm": 0.5252464567539773,
"learning_rate": 7.36968532230617e-06,
"loss": 0.1428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1225329339504242,
"step": 3285,
"valid_targets_mean": 3195.1,
"valid_targets_min": 258
},
{
"epoch": 5.230524642289348,
"grad_norm": 0.5192954833459635,
"learning_rate": 7.308303806548742e-06,
"loss": 0.129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13095176219940186,
"step": 3290,
"valid_targets_mean": 3724.8,
"valid_targets_min": 636
},
{
"epoch": 5.238473767885533,
"grad_norm": 0.5487669317072835,
"learning_rate": 7.247121784824445e-06,
"loss": 0.1258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13627754151821136,
"step": 3295,
"valid_targets_mean": 3452.6,
"valid_targets_min": 324
},
{
"epoch": 5.246422893481717,
"grad_norm": 0.528698693229382,
"learning_rate": 7.186140218820979e-06,
"loss": 0.1303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12275183945894241,
"step": 3300,
"valid_targets_mean": 4150.6,
"valid_targets_min": 768
},
{
"epoch": 5.254372019077901,
"grad_norm": 0.5046952538958149,
"learning_rate": 7.125360067075196e-06,
"loss": 0.1216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13393549621105194,
"step": 3305,
"valid_targets_mean": 3828.8,
"valid_targets_min": 262
},
{
"epoch": 5.262321144674086,
"grad_norm": 0.5275289393785,
"learning_rate": 7.0647822849580385e-06,
"loss": 0.1117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11984727531671524,
"step": 3310,
"valid_targets_mean": 2990.9,
"valid_targets_min": 465
},
{
"epoch": 5.27027027027027,
"grad_norm": 0.5986098211183422,
"learning_rate": 7.004407824659491e-06,
"loss": 0.1223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12287823855876923,
"step": 3315,
"valid_targets_mean": 2975.7,
"valid_targets_min": 733
},
{
"epoch": 5.278219395866454,
"grad_norm": 0.493508460343489,
"learning_rate": 6.944237635173627e-06,
"loss": 0.1373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1410299688577652,
"step": 3320,
"valid_targets_mean": 4679.4,
"valid_targets_min": 542
},
{
"epoch": 5.286168521462639,
"grad_norm": 0.5340963975918633,
"learning_rate": 6.88427266228372e-06,
"loss": 0.1258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11206860840320587,
"step": 3325,
"valid_targets_mean": 2824.8,
"valid_targets_min": 548
},
{
"epoch": 5.294117647058823,
"grad_norm": 0.5288120769728034,
"learning_rate": 6.824513848547323e-06,
"loss": 0.1258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13739335536956787,
"step": 3330,
"valid_targets_mean": 2994.0,
"valid_targets_min": 774
},
{
"epoch": 5.302066772655008,
"grad_norm": 0.4460570196931101,
"learning_rate": 6.764962133281503e-06,
"loss": 0.1161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0984058827161789,
"step": 3335,
"valid_targets_mean": 4019.4,
"valid_targets_min": 657
},
{
"epoch": 5.3100158982511925,
"grad_norm": 0.47811950799417524,
"learning_rate": 6.705618452548057e-06,
"loss": 0.1267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11787131428718567,
"step": 3340,
"valid_targets_mean": 4479.8,
"valid_targets_min": 557
},
{
"epoch": 5.317965023847377,
"grad_norm": 0.4666566027641988,
"learning_rate": 6.646483739138778e-06,
"loss": 0.1112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12056516110897064,
"step": 3345,
"valid_targets_mean": 3949.9,
"valid_targets_min": 1048
},
{
"epoch": 5.325914149443562,
"grad_norm": 0.4975374351704887,
"learning_rate": 6.5875589225608376e-06,
"loss": 0.1224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11528253555297852,
"step": 3350,
"valid_targets_mean": 3459.3,
"valid_targets_min": 671
},
{
"epoch": 5.333863275039746,
"grad_norm": 0.4880004851265583,
"learning_rate": 6.528844929022134e-06,
"loss": 0.1219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10715194791555405,
"step": 3355,
"valid_targets_mean": 3779.9,
"valid_targets_min": 555
},
{
"epoch": 5.34181240063593,
"grad_norm": 0.5375997285477788,
"learning_rate": 6.4703426814167434e-06,
"loss": 0.1247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12751339375972748,
"step": 3360,
"valid_targets_mean": 3645.8,
"valid_targets_min": 635
},
{
"epoch": 5.349761526232115,
"grad_norm": 0.5313239520073082,
"learning_rate": 6.412053099310449e-06,
"loss": 0.1167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12041355669498444,
"step": 3365,
"valid_targets_mean": 4356.8,
"valid_targets_min": 730
},
{
"epoch": 5.357710651828299,
"grad_norm": 0.5428782069622755,
"learning_rate": 6.353977098926225e-06,
"loss": 0.1278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13842326402664185,
"step": 3370,
"valid_targets_mean": 3841.1,
"valid_targets_min": 279
},
{
"epoch": 5.365659777424483,
"grad_norm": 0.5475098794287568,
"learning_rate": 6.296115593129888e-06,
"loss": 0.1177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12307454645633698,
"step": 3375,
"valid_targets_mean": 4148.9,
"valid_targets_min": 519
},
{
"epoch": 5.373608903020668,
"grad_norm": 0.797877703342453,
"learning_rate": 6.238469491415728e-06,
"loss": 0.1184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13038906455039978,
"step": 3380,
"valid_targets_mean": 2991.3,
"valid_targets_min": 369
},
{
"epoch": 5.381558028616852,
"grad_norm": 0.48617214325748453,
"learning_rate": 6.181039699892206e-06,
"loss": 0.1255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11232590675354004,
"step": 3385,
"valid_targets_mean": 3804.4,
"valid_targets_min": 591
},
{
"epoch": 5.389507154213036,
"grad_norm": 0.5086690584311961,
"learning_rate": 6.123827121267709e-06,
"loss": 0.1151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12465276569128036,
"step": 3390,
"valid_targets_mean": 4029.9,
"valid_targets_min": 821
},
{
"epoch": 5.397456279809221,
"grad_norm": 0.4123929559301535,
"learning_rate": 6.066832654836396e-06,
"loss": 0.1228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10203292965888977,
"step": 3395,
"valid_targets_mean": 4760.1,
"valid_targets_min": 591
},
{
"epoch": 5.405405405405405,
"grad_norm": 0.5479065770064241,
"learning_rate": 6.010057196464012e-06,
"loss": 0.1323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11120990663766861,
"step": 3400,
"valid_targets_mean": 3094.6,
"valid_targets_min": 221
},
{
"epoch": 5.413354531001589,
"grad_norm": 0.48420485798613333,
"learning_rate": 5.9535016385738335e-06,
"loss": 0.1226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10648505389690399,
"step": 3405,
"valid_targets_mean": 4042.4,
"valid_targets_min": 1384
},
{
"epoch": 5.421303656597774,
"grad_norm": 0.48392218431147466,
"learning_rate": 5.897166870132658e-06,
"loss": 0.116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11931923776865005,
"step": 3410,
"valid_targets_mean": 3597.8,
"valid_targets_min": 665
},
{
"epoch": 5.4292527821939585,
"grad_norm": 0.5393253911493405,
"learning_rate": 5.841053776636781e-06,
"loss": 0.1157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12923894822597504,
"step": 3415,
"valid_targets_mean": 3682.3,
"valid_targets_min": 693
},
{
"epoch": 5.4372019077901435,
"grad_norm": 0.5792385751129733,
"learning_rate": 5.7851632400981285e-06,
"loss": 0.1149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10763402283191681,
"step": 3420,
"valid_targets_mean": 4127.3,
"valid_targets_min": 687
},
{
"epoch": 5.4451510333863276,
"grad_norm": 0.48182773969358605,
"learning_rate": 5.729496139030377e-06,
"loss": 0.1222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1422126591205597,
"step": 3425,
"valid_targets_mean": 4550.5,
"valid_targets_min": 1598
},
{
"epoch": 5.453100158982512,
"grad_norm": 0.41697301913199153,
"learning_rate": 5.67405334843512e-06,
"loss": 0.1165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10176099836826324,
"step": 3430,
"valid_targets_mean": 5134.2,
"valid_targets_min": 581
},
{
"epoch": 5.461049284578697,
"grad_norm": 0.5513948557355665,
"learning_rate": 5.618835739788136e-06,
"loss": 0.1175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12029505521059036,
"step": 3435,
"valid_targets_mean": 2973.1,
"valid_targets_min": 312
},
{
"epoch": 5.468998410174881,
"grad_norm": 0.5035419846944795,
"learning_rate": 5.563844181025706e-06,
"loss": 0.1216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11482226848602295,
"step": 3440,
"valid_targets_mean": 3700.4,
"valid_targets_min": 993
},
{
"epoch": 5.476947535771065,
"grad_norm": 0.5134434569519974,
"learning_rate": 5.509079536530939e-06,
"loss": 0.1313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14722689986228943,
"step": 3445,
"valid_targets_mean": 4011.1,
"valid_targets_min": 1226
},
{
"epoch": 5.48489666136725,
"grad_norm": 0.6045299385441325,
"learning_rate": 5.4545426671201905e-06,
"loss": 0.1411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12199525535106659,
"step": 3450,
"valid_targets_mean": 3293.1,
"valid_targets_min": 563
},
{
"epoch": 5.492845786963434,
"grad_norm": 0.550935705887857,
"learning_rate": 5.400234430029561e-06,
"loss": 0.136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14424438774585724,
"step": 3455,
"valid_targets_mean": 3206.7,
"valid_targets_min": 688
},
{
"epoch": 5.500794912559618,
"grad_norm": 0.4951329559478596,
"learning_rate": 5.346155678901392e-06,
"loss": 0.1175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12117502838373184,
"step": 3460,
"valid_targets_mean": 3883.6,
"valid_targets_min": 679
},
{
"epoch": 5.508744038155803,
"grad_norm": 0.531009459855668,
"learning_rate": 5.292307263770859e-06,
"loss": 0.1244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1292455941438675,
"step": 3465,
"valid_targets_mean": 3177.2,
"valid_targets_min": 636
},
{
"epoch": 5.516693163751987,
"grad_norm": 0.5665502788954249,
"learning_rate": 5.238690031052603e-06,
"loss": 0.1166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11746140569448471,
"step": 3470,
"valid_targets_mean": 2960.9,
"valid_targets_min": 290
},
{
"epoch": 5.524642289348172,
"grad_norm": 0.47470831904665967,
"learning_rate": 5.185304823527426e-06,
"loss": 0.1122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11849209666252136,
"step": 3475,
"valid_targets_mean": 4295.4,
"valid_targets_min": 574
},
{
"epoch": 5.532591414944356,
"grad_norm": 0.5348564893263684,
"learning_rate": 5.132152480329072e-06,
"loss": 0.1252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13434147834777832,
"step": 3480,
"valid_targets_mean": 3653.6,
"valid_targets_min": 593
},
{
"epoch": 5.54054054054054,
"grad_norm": 0.45313684699490947,
"learning_rate": 5.07923383693099e-06,
"loss": 0.1123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10309700667858124,
"step": 3485,
"valid_targets_mean": 3730.9,
"valid_targets_min": 545
},
{
"epoch": 5.548489666136725,
"grad_norm": 0.5594176484506791,
"learning_rate": 5.0265497251332314e-06,
"loss": 0.1159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11101377010345459,
"step": 3490,
"valid_targets_mean": 3820.3,
"valid_targets_min": 269
},
{
"epoch": 5.556438791732909,
"grad_norm": 0.45166597844599227,
"learning_rate": 4.974100973049385e-06,
"loss": 0.1247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10583409667015076,
"step": 3495,
"valid_targets_mean": 4374.6,
"valid_targets_min": 275
},
{
"epoch": 5.5643879173290935,
"grad_norm": 0.5180648698026142,
"learning_rate": 4.921888405093525e-06,
"loss": 0.1212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11158320307731628,
"step": 3500,
"valid_targets_mean": 3499.5,
"valid_targets_min": 749
},
{
"epoch": 5.5723370429252785,
"grad_norm": 0.4509178468225708,
"learning_rate": 4.869912841967286e-06,
"loss": 0.1149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11846384406089783,
"step": 3505,
"valid_targets_mean": 4619.4,
"valid_targets_min": 982
},
{
"epoch": 5.580286168521463,
"grad_norm": 0.5462056280603287,
"learning_rate": 4.818175100646952e-06,
"loss": 0.1288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12996745109558105,
"step": 3510,
"valid_targets_mean": 3452.2,
"valid_targets_min": 715
},
{
"epoch": 5.588235294117647,
"grad_norm": 0.4452887332184351,
"learning_rate": 4.766675994370598e-06,
"loss": 0.1148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12007399648427963,
"step": 3515,
"valid_targets_mean": 3976.9,
"valid_targets_min": 528
},
{
"epoch": 5.596184419713832,
"grad_norm": 0.4955106517830543,
"learning_rate": 4.7154163326253265e-06,
"loss": 0.1311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1265922635793686,
"step": 3520,
"valid_targets_mean": 4157.2,
"valid_targets_min": 639
},
{
"epoch": 5.604133545310016,
"grad_norm": 0.4967818054308162,
"learning_rate": 4.664396921134551e-06,
"loss": 0.1307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12537996470928192,
"step": 3525,
"valid_targets_mean": 3731.1,
"valid_targets_min": 711
},
{
"epoch": 5.6120826709062,
"grad_norm": 0.5922113133845275,
"learning_rate": 4.613618561845306e-06,
"loss": 0.128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18149852752685547,
"step": 3530,
"valid_targets_mean": 3075.6,
"valid_targets_min": 717
},
{
"epoch": 5.620031796502385,
"grad_norm": 0.4486775225512763,
"learning_rate": 4.563082052915649e-06,
"loss": 0.1233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10791641473770142,
"step": 3535,
"valid_targets_mean": 4184.4,
"valid_targets_min": 1044
},
{
"epoch": 5.627980922098569,
"grad_norm": 0.47196647754075016,
"learning_rate": 4.512788188702135e-06,
"loss": 0.1074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10782913118600845,
"step": 3540,
"valid_targets_mean": 4232.4,
"valid_targets_min": 286
},
{
"epoch": 5.635930047694753,
"grad_norm": 0.40473591866365777,
"learning_rate": 4.462737759747315e-06,
"loss": 0.1143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09814178198575974,
"step": 3545,
"valid_targets_mean": 5018.9,
"valid_targets_min": 534
},
{
"epoch": 5.643879173290938,
"grad_norm": 0.4970418048544055,
"learning_rate": 4.412931552767295e-06,
"loss": 0.1194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12168466299772263,
"step": 3550,
"valid_targets_mean": 3969.1,
"valid_targets_min": 908
},
{
"epoch": 5.651828298887122,
"grad_norm": 0.4466747416437135,
"learning_rate": 4.363370350639405e-06,
"loss": 0.1236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11409342288970947,
"step": 3555,
"valid_targets_mean": 4624.2,
"valid_targets_min": 668
},
{
"epoch": 5.659777424483307,
"grad_norm": 0.548867935644448,
"learning_rate": 4.314054932389859e-06,
"loss": 0.1214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13996033370494843,
"step": 3560,
"valid_targets_mean": 4342.4,
"valid_targets_min": 668
},
{
"epoch": 5.667726550079491,
"grad_norm": 0.48475073547335606,
"learning_rate": 4.2649860731815255e-06,
"loss": 0.1262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12767939269542694,
"step": 3565,
"valid_targets_mean": 3903.4,
"valid_targets_min": 580
},
{
"epoch": 5.675675675675675,
"grad_norm": 0.5810018741448055,
"learning_rate": 4.216164544301755e-06,
"loss": 0.1234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12019410729408264,
"step": 3570,
"valid_targets_mean": 2819.9,
"valid_targets_min": 277
},
{
"epoch": 5.68362480127186,
"grad_norm": 0.45812190476555054,
"learning_rate": 4.167591113150225e-06,
"loss": 0.1177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0970279797911644,
"step": 3575,
"valid_targets_mean": 3835.1,
"valid_targets_min": 606
},
{
"epoch": 5.6915739268680445,
"grad_norm": 0.4583758611151626,
"learning_rate": 4.119266543226921e-06,
"loss": 0.1146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11823764443397522,
"step": 3580,
"valid_targets_mean": 4078.4,
"valid_targets_min": 686
},
{
"epoch": 5.699523052464229,
"grad_norm": 0.5300561778832891,
"learning_rate": 4.071191594120081e-06,
"loss": 0.1311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1100766509771347,
"step": 3585,
"valid_targets_mean": 3071.7,
"valid_targets_min": 259
},
{
"epoch": 5.707472178060414,
"grad_norm": 0.5096830083092221,
"learning_rate": 4.023367021494313e-06,
"loss": 0.1224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13244731724262238,
"step": 3590,
"valid_targets_mean": 3879.1,
"valid_targets_min": 709
},
{
"epoch": 5.715421303656598,
"grad_norm": 0.6172482897906679,
"learning_rate": 3.975793577078682e-06,
"loss": 0.1147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11370215564966202,
"step": 3595,
"valid_targets_mean": 3879.4,
"valid_targets_min": 1163
},
{
"epoch": 5.723370429252782,
"grad_norm": 0.5043378824343994,
"learning_rate": 3.928472008654891e-06,
"loss": 0.1105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1176089495420456,
"step": 3600,
"valid_targets_mean": 4378.8,
"valid_targets_min": 819
},
{
"epoch": 5.731319554848967,
"grad_norm": 0.5132872802234864,
"learning_rate": 3.881403060045545e-06,
"loss": 0.1217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10852010548114777,
"step": 3605,
"valid_targets_mean": 3407.3,
"valid_targets_min": 859
},
{
"epoch": 5.739268680445151,
"grad_norm": 0.5063474175192859,
"learning_rate": 3.834587471102464e-06,
"loss": 0.1203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11489781737327576,
"step": 3610,
"valid_targets_mean": 3358.4,
"valid_targets_min": 724
},
{
"epoch": 5.747217806041336,
"grad_norm": 0.44741625934657075,
"learning_rate": 3.7880259776950224e-06,
"loss": 0.1189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11125510931015015,
"step": 3615,
"valid_targets_mean": 4725.9,
"valid_targets_min": 935
},
{
"epoch": 5.75516693163752,
"grad_norm": 0.5622460074052544,
"learning_rate": 3.741719311698608e-06,
"loss": 0.1254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1445854902267456,
"step": 3620,
"valid_targets_mean": 3845.8,
"valid_targets_min": 326
},
{
"epoch": 5.763116057233704,
"grad_norm": 0.5095441924194869,
"learning_rate": 3.69566820098312e-06,
"loss": 0.118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11811588704586029,
"step": 3625,
"valid_targets_mean": 3504.1,
"valid_targets_min": 499
},
{
"epoch": 5.771065182829888,
"grad_norm": 0.6091555550332428,
"learning_rate": 3.6498733694015197e-06,
"loss": 0.1204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15617358684539795,
"step": 3630,
"valid_targets_mean": 3396.4,
"valid_targets_min": 219
},
{
"epoch": 5.779014308426073,
"grad_norm": 0.5229211609685805,
"learning_rate": 3.604335536778434e-06,
"loss": 0.1146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13374817371368408,
"step": 3635,
"valid_targets_mean": 4108.9,
"valid_targets_min": 625
},
{
"epoch": 5.786963434022257,
"grad_norm": 0.5225267465274916,
"learning_rate": 3.559055418898887e-06,
"loss": 0.1323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1492437720298767,
"step": 3640,
"valid_targets_mean": 3701.8,
"valid_targets_min": 262
},
{
"epoch": 5.794912559618442,
"grad_norm": 0.49027694616246914,
"learning_rate": 3.5140337274970014e-06,
"loss": 0.1205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12383852899074554,
"step": 3645,
"valid_targets_mean": 5302.7,
"valid_targets_min": 992
},
{
"epoch": 5.802861685214626,
"grad_norm": 0.49546019569767785,
"learning_rate": 3.469271170244832e-06,
"loss": 0.1157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11465057730674744,
"step": 3650,
"valid_targets_mean": 3762.5,
"valid_targets_min": 1734
},
{
"epoch": 5.8108108108108105,
"grad_norm": 0.6328363349278949,
"learning_rate": 3.4247684507412605e-06,
"loss": 0.1242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13153359293937683,
"step": 3655,
"valid_targets_mean": 2784.2,
"valid_targets_min": 294
},
{
"epoch": 5.8187599364069955,
"grad_norm": 0.502167626760723,
"learning_rate": 3.380526268500892e-06,
"loss": 0.1181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12254327535629272,
"step": 3660,
"valid_targets_mean": 3786.4,
"valid_targets_min": 193
},
{
"epoch": 5.82670906200318,
"grad_norm": 0.45125186924627153,
"learning_rate": 3.3365453189430984e-06,
"loss": 0.1226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10970175266265869,
"step": 3665,
"valid_targets_mean": 4506.9,
"valid_targets_min": 1367
},
{
"epoch": 5.834658187599364,
"grad_norm": 0.5205657434846551,
"learning_rate": 3.292826293381071e-06,
"loss": 0.1272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13056659698486328,
"step": 3670,
"valid_targets_mean": 4076.0,
"valid_targets_min": 1257
},
{
"epoch": 5.842607313195549,
"grad_norm": 0.5429453705327059,
"learning_rate": 3.2493698790109664e-06,
"loss": 0.1225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12193150818347931,
"step": 3675,
"valid_targets_mean": 3906.0,
"valid_targets_min": 444
},
{
"epoch": 5.850556438791733,
"grad_norm": 0.6227078505185998,
"learning_rate": 3.2061767589010763e-06,
"loss": 0.1258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13154500722885132,
"step": 3680,
"valid_targets_mean": 2870.4,
"valid_targets_min": 255
},
{
"epoch": 5.858505564387917,
"grad_norm": 0.49948300350719843,
"learning_rate": 3.1632476119811285e-06,
"loss": 0.1214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11474519222974777,
"step": 3685,
"valid_targets_mean": 4023.4,
"valid_targets_min": 737
},
{
"epoch": 5.866454689984102,
"grad_norm": 0.5200212537952184,
"learning_rate": 3.120583113031579e-06,
"loss": 0.1275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13559041917324066,
"step": 3690,
"valid_targets_mean": 3464.1,
"valid_targets_min": 203
},
{
"epoch": 5.874403815580286,
"grad_norm": 0.46446067076843983,
"learning_rate": 3.07818393267304e-06,
"loss": 0.1177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09316763281822205,
"step": 3695,
"valid_targets_mean": 3673.7,
"valid_targets_min": 231
},
{
"epoch": 5.882352941176471,
"grad_norm": 0.4404533791714637,
"learning_rate": 3.036050737355709e-06,
"loss": 0.1165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09938673675060272,
"step": 3700,
"valid_targets_mean": 4383.9,
"valid_targets_min": 1208
},
{
"epoch": 5.890302066772655,
"grad_norm": 0.5161902873588942,
"learning_rate": 2.9941841893489075e-06,
"loss": 0.1276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1233370378613472,
"step": 3705,
"valid_targets_mean": 4478.1,
"valid_targets_min": 1631
},
{
"epoch": 5.898251192368839,
"grad_norm": 0.49950014205727683,
"learning_rate": 2.9525849467306766e-06,
"loss": 0.1286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1349901705980301,
"step": 3710,
"valid_targets_mean": 4360.8,
"valid_targets_min": 1207
},
{
"epoch": 5.906200317965024,
"grad_norm": 0.6255270102689031,
"learning_rate": 2.9112536633774245e-06,
"loss": 0.1297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14242327213287354,
"step": 3715,
"valid_targets_mean": 2748.8,
"valid_targets_min": 566
},
{
"epoch": 5.914149443561208,
"grad_norm": 0.4795827841967414,
"learning_rate": 2.8701909889536384e-06,
"loss": 0.1223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12320660799741745,
"step": 3720,
"valid_targets_mean": 3648.8,
"valid_targets_min": 1105
},
{
"epoch": 5.922098569157392,
"grad_norm": 0.46609837304180957,
"learning_rate": 2.8293975689017018e-06,
"loss": 0.121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09863148629665375,
"step": 3725,
"valid_targets_mean": 3843.1,
"valid_targets_min": 1049
},
{
"epoch": 5.930047694753577,
"grad_norm": 0.5299211238306798,
"learning_rate": 2.788874044431722e-06,
"loss": 0.1191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11683914065361023,
"step": 3730,
"valid_targets_mean": 3052.8,
"valid_targets_min": 357
},
{
"epoch": 5.9379968203497615,
"grad_norm": 0.5208980690753293,
"learning_rate": 2.7486210525114533e-06,
"loss": 0.1133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12761931121349335,
"step": 3735,
"valid_targets_mean": 3831.2,
"valid_targets_min": 468
},
{
"epoch": 5.945945945945946,
"grad_norm": 0.6678323734362,
"learning_rate": 2.708639225856311e-06,
"loss": 0.1237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12598900496959686,
"step": 3740,
"valid_targets_mean": 3501.5,
"valid_targets_min": 668
},
{
"epoch": 5.953895071542131,
"grad_norm": 0.5264094063837836,
"learning_rate": 2.6689291929193962e-06,
"loss": 0.1282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13515892624855042,
"step": 3745,
"valid_targets_mean": 3571.8,
"valid_targets_min": 744
},
{
"epoch": 5.961844197138315,
"grad_norm": 0.42300031769118174,
"learning_rate": 2.629491577881622e-06,
"loss": 0.1131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10418035089969635,
"step": 3750,
"valid_targets_mean": 4830.2,
"valid_targets_min": 658
},
{
"epoch": 5.9697933227345,
"grad_norm": 0.4877715372350325,
"learning_rate": 2.5903270006419236e-06,
"loss": 0.1276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11131057143211365,
"step": 3755,
"valid_targets_mean": 3662.4,
"valid_targets_min": 384
},
{
"epoch": 5.977742448330684,
"grad_norm": 0.4822345208975422,
"learning_rate": 2.551436076807501e-06,
"loss": 0.1206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10331891477108002,
"step": 3760,
"valid_targets_mean": 3850.6,
"valid_targets_min": 1253
},
{
"epoch": 5.985691573926868,
"grad_norm": 0.5405507727305193,
"learning_rate": 2.5128194176841226e-06,
"loss": 0.1208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11677927523851395,
"step": 3765,
"valid_targets_mean": 3175.6,
"valid_targets_min": 560
},
{
"epoch": 5.993640699523052,
"grad_norm": 0.6454948139161141,
"learning_rate": 2.4744776302665563e-06,
"loss": 0.1213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13788512349128723,
"step": 3770,
"valid_targets_mean": 3206.7,
"valid_targets_min": 452
},
{
"epoch": 6.001589825119237,
"grad_norm": 0.44867451795140395,
"learning_rate": 2.436411317228997e-06,
"loss": 0.1413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1155017837882042,
"step": 3775,
"valid_targets_mean": 3869.2,
"valid_targets_min": 717
},
{
"epoch": 6.009538950715421,
"grad_norm": 0.48596893402956937,
"learning_rate": 2.3986210769155994e-06,
"loss": 0.1215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11859863996505737,
"step": 3780,
"valid_targets_mean": 3937.1,
"valid_targets_min": 790
},
{
"epoch": 6.017488076311606,
"grad_norm": 0.522552014133015,
"learning_rate": 2.361107503331095e-06,
"loss": 0.1206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13054189085960388,
"step": 3785,
"valid_targets_mean": 3340.6,
"valid_targets_min": 649
},
{
"epoch": 6.02543720190779,
"grad_norm": 0.5187257820275404,
"learning_rate": 2.3238711861314165e-06,
"loss": 0.1164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0982595682144165,
"step": 3790,
"valid_targets_mean": 3887.9,
"valid_targets_min": 225
},
{
"epoch": 6.033386327503974,
"grad_norm": 0.492221911506423,
"learning_rate": 2.2869127106144663e-06,
"loss": 0.1223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10179409384727478,
"step": 3795,
"valid_targets_mean": 3659.4,
"valid_targets_min": 581
},
{
"epoch": 6.041335453100159,
"grad_norm": 0.5706240801694208,
"learning_rate": 2.2502326577109e-06,
"loss": 0.1247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14859774708747864,
"step": 3800,
"valid_targets_mean": 3022.1,
"valid_targets_min": 576
},
{
"epoch": 6.049284578696343,
"grad_norm": 0.4903458403444158,
"learning_rate": 2.213831603974985e-06,
"loss": 0.1208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12874770164489746,
"step": 3805,
"valid_targets_mean": 3873.9,
"valid_targets_min": 1757
},
{
"epoch": 6.0572337042925275,
"grad_norm": 0.6672892423704999,
"learning_rate": 2.1777101215755624e-06,
"loss": 0.124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14127162098884583,
"step": 3810,
"valid_targets_mean": 2096.2,
"valid_targets_min": 307
},
{
"epoch": 6.0651828298887125,
"grad_norm": 0.4545999025709332,
"learning_rate": 2.1418687782870284e-06,
"loss": 0.115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1308123916387558,
"step": 3815,
"valid_targets_mean": 4371.7,
"valid_targets_min": 911
},
{
"epoch": 6.073131955484897,
"grad_norm": 0.487382004726638,
"learning_rate": 2.1063081374804263e-06,
"loss": 0.1156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11653155088424683,
"step": 3820,
"valid_targets_mean": 4370.7,
"valid_targets_min": 716
},
{
"epoch": 6.081081081081081,
"grad_norm": 0.5230128586154896,
"learning_rate": 2.0710287581145884e-06,
"loss": 0.1107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11809296905994415,
"step": 3825,
"valid_targets_mean": 3450.1,
"valid_targets_min": 468
},
{
"epoch": 6.089030206677266,
"grad_norm": 0.5190144803094725,
"learning_rate": 2.036031194727346e-06,
"loss": 0.1299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13838720321655273,
"step": 3830,
"valid_targets_mean": 3676.1,
"valid_targets_min": 623
},
{
"epoch": 6.09697933227345,
"grad_norm": 0.46738733555474804,
"learning_rate": 2.0013159974268094e-06,
"loss": 0.1182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11170323193073273,
"step": 3835,
"valid_targets_mean": 4278.0,
"valid_targets_min": 709
},
{
"epoch": 6.104928457869635,
"grad_norm": 0.4624128199722627,
"learning_rate": 1.9668837118827346e-06,
"loss": 0.1101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09756626933813095,
"step": 3840,
"valid_targets_mean": 4007.2,
"valid_targets_min": 678
},
{
"epoch": 6.112877583465819,
"grad_norm": 0.5119513810750553,
"learning_rate": 1.932734879317937e-06,
"loss": 0.1265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10754363238811493,
"step": 3845,
"valid_targets_mean": 3588.8,
"valid_targets_min": 295
},
{
"epoch": 6.120826709062003,
"grad_norm": 0.41100363613961804,
"learning_rate": 1.8988700364997758e-06,
"loss": 0.117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10548628866672516,
"step": 3850,
"valid_targets_mean": 4552.5,
"valid_targets_min": 1126
},
{
"epoch": 6.128775834658188,
"grad_norm": 0.5133116111241467,
"learning_rate": 1.8652897157317395e-06,
"loss": 0.1165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14871114492416382,
"step": 3855,
"valid_targets_mean": 3678.9,
"valid_targets_min": 652
},
{
"epoch": 6.136724960254372,
"grad_norm": 0.5261537871220848,
"learning_rate": 1.8319944448450578e-06,
"loss": 0.1073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10628058761358261,
"step": 3860,
"valid_targets_mean": 3190.5,
"valid_targets_min": 257
},
{
"epoch": 6.144674085850556,
"grad_norm": 0.4713576235713761,
"learning_rate": 1.7989847471904065e-06,
"loss": 0.1097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09839437156915665,
"step": 3865,
"valid_targets_mean": 4262.8,
"valid_targets_min": 614
},
{
"epoch": 6.152623211446741,
"grad_norm": 0.6149608619383016,
"learning_rate": 1.766261141629706e-06,
"loss": 0.1184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10006123036146164,
"step": 3870,
"valid_targets_mean": 4775.4,
"valid_targets_min": 1547
},
{
"epoch": 6.160572337042925,
"grad_norm": 0.5676332722536679,
"learning_rate": 1.7338241425279244e-06,
"loss": 0.116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1152639240026474,
"step": 3875,
"valid_targets_mean": 2869.9,
"valid_targets_min": 253
},
{
"epoch": 6.168521462639109,
"grad_norm": 0.43406528581225035,
"learning_rate": 1.7016742597450341e-06,
"loss": 0.1035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0894886776804924,
"step": 3880,
"valid_targets_mean": 4228.3,
"valid_targets_min": 889
},
{
"epoch": 6.176470588235294,
"grad_norm": 0.4391775601429534,
"learning_rate": 1.6698119986279726e-06,
"loss": 0.1302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1086900532245636,
"step": 3885,
"valid_targets_mean": 4487.6,
"valid_targets_min": 1009
},
{
"epoch": 6.1844197138314785,
"grad_norm": 0.43257145105765316,
"learning_rate": 1.6382378600026982e-06,
"loss": 0.1129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09367109835147858,
"step": 3890,
"valid_targets_mean": 4436.7,
"valid_targets_min": 672
},
{
"epoch": 6.192368839427663,
"grad_norm": 0.46585023110175705,
"learning_rate": 1.60695234016633e-06,
"loss": 0.1239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11722202599048615,
"step": 3895,
"valid_targets_mean": 4294.6,
"valid_targets_min": 580
},
{
"epoch": 6.200317965023848,
"grad_norm": 0.4902572872103629,
"learning_rate": 1.5759559308793448e-06,
"loss": 0.1081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10776770859956741,
"step": 3900,
"valid_targets_mean": 3943.4,
"valid_targets_min": 271
},
{
"epoch": 6.208267090620032,
"grad_norm": 0.5594670199155989,
"learning_rate": 1.5452491193578412e-06,
"loss": 0.1202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12497895956039429,
"step": 3905,
"valid_targets_mean": 3098.4,
"valid_targets_min": 735
},
{
"epoch": 6.216216216216216,
"grad_norm": 0.5219935562912217,
"learning_rate": 1.5148323882658767e-06,
"loss": 0.1158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10808251798152924,
"step": 3910,
"valid_targets_mean": 4122.3,
"valid_targets_min": 283
},
{
"epoch": 6.224165341812401,
"grad_norm": 0.5005990647111696,
"learning_rate": 1.484706215707905e-06,
"loss": 0.1206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10552050173282623,
"step": 3915,
"valid_targets_mean": 3699.5,
"valid_targets_min": 699
},
{
"epoch": 6.232114467408585,
"grad_norm": 0.6045839092717541,
"learning_rate": 1.4548710752212292e-06,
"loss": 0.1085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11157447099685669,
"step": 3920,
"valid_targets_mean": 2340.5,
"valid_targets_min": 254
},
{
"epoch": 6.24006359300477,
"grad_norm": 0.5250995042813899,
"learning_rate": 1.425327435768582e-06,
"loss": 0.1204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13459616899490356,
"step": 3925,
"valid_targets_mean": 3940.4,
"valid_targets_min": 699
},
{
"epoch": 6.248012718600954,
"grad_norm": 0.472579910076907,
"learning_rate": 1.3960757617307486e-06,
"loss": 0.1204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12376942485570908,
"step": 3930,
"valid_targets_mean": 4687.8,
"valid_targets_min": 876
},
{
"epoch": 6.255961844197138,
"grad_norm": 0.4618301620060851,
"learning_rate": 1.3671165128992514e-06,
"loss": 0.1095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10723580420017242,
"step": 3935,
"valid_targets_mean": 4437.8,
"valid_targets_min": 543
},
{
"epoch": 6.263910969793323,
"grad_norm": 0.4999776109608244,
"learning_rate": 1.3384501444691544e-06,
"loss": 0.1047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10837283730506897,
"step": 3940,
"valid_targets_mean": 3520.4,
"valid_targets_min": 295
},
{
"epoch": 6.271860095389507,
"grad_norm": 0.5126636237250259,
"learning_rate": 1.3100771070318796e-06,
"loss": 0.1176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11529883742332458,
"step": 3945,
"valid_targets_mean": 4288.9,
"valid_targets_min": 251
},
{
"epoch": 6.279809220985691,
"grad_norm": 0.47848229996426966,
"learning_rate": 1.2819978465681283e-06,
"loss": 0.1236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0940292477607727,
"step": 3950,
"valid_targets_mean": 3521.3,
"valid_targets_min": 498
},
{
"epoch": 6.287758346581876,
"grad_norm": 0.5732393529239456,
"learning_rate": 1.254212804440893e-06,
"loss": 0.1244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1338890790939331,
"step": 3955,
"valid_targets_mean": 3135.6,
"valid_targets_min": 312
},
{
"epoch": 6.29570747217806,
"grad_norm": 0.5326295342711036,
"learning_rate": 1.2267224173884929e-06,
"loss": 0.1145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13209447264671326,
"step": 3960,
"valid_targets_mean": 3774.2,
"valid_targets_min": 571
},
{
"epoch": 6.3036565977742445,
"grad_norm": 0.4711791669124887,
"learning_rate": 1.199527117517727e-06,
"loss": 0.113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11155182123184204,
"step": 3965,
"valid_targets_mean": 3798.5,
"valid_targets_min": 276
},
{
"epoch": 6.3116057233704295,
"grad_norm": 0.4818693237836275,
"learning_rate": 1.172627332297076e-06,
"loss": 0.1146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10713420063257217,
"step": 3970,
"valid_targets_mean": 3704.2,
"valid_targets_min": 651
},
{
"epoch": 6.319554848966614,
"grad_norm": 0.5058735177237607,
"learning_rate": 1.1460234845499763e-06,
"loss": 0.1135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.132293701171875,
"step": 3975,
"valid_targets_mean": 4033.2,
"valid_targets_min": 868
},
{
"epoch": 6.327503974562799,
"grad_norm": 0.48180321982015545,
"learning_rate": 1.1197159924481804e-06,
"loss": 0.125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11559031903743744,
"step": 3980,
"valid_targets_mean": 4418.4,
"valid_targets_min": 649
},
{
"epoch": 6.335453100158983,
"grad_norm": 0.6108262295945303,
"learning_rate": 1.0937052695051965e-06,
"loss": 0.1185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14231693744659424,
"step": 3985,
"valid_targets_mean": 4821.4,
"valid_targets_min": 1296
},
{
"epoch": 6.343402225755167,
"grad_norm": 0.5735633688087327,
"learning_rate": 1.067991724569759e-06,
"loss": 0.1169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12734287977218628,
"step": 3990,
"valid_targets_mean": 3712.1,
"valid_targets_min": 578
},
{
"epoch": 6.351351351351352,
"grad_norm": 0.4962186042387327,
"learning_rate": 1.0425757618194265e-06,
"loss": 0.1143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11310100555419922,
"step": 3995,
"valid_targets_mean": 4223.6,
"valid_targets_min": 307
},
{
"epoch": 6.359300476947536,
"grad_norm": 0.4808255029002646,
"learning_rate": 1.0174577807542273e-06,
"loss": 0.1242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10521212220191956,
"step": 4000,
"valid_targets_mean": 3883.7,
"valid_targets_min": 1113
},
{
"epoch": 6.36724960254372,
"grad_norm": 0.4740602995913292,
"learning_rate": 9.926381761903614e-07,
"loss": 0.1121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11520376056432724,
"step": 4005,
"valid_targets_mean": 4185.7,
"valid_targets_min": 1471
},
{
"epoch": 6.375198728139905,
"grad_norm": 0.4470619298701318,
"learning_rate": 9.681173382540177e-07,
"loss": 0.118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10057910531759262,
"step": 4010,
"valid_targets_mean": 4749.6,
"valid_targets_min": 771
},
{
"epoch": 6.383147853736089,
"grad_norm": 0.5582730349142845,
"learning_rate": 9.438956523752263e-07,
"loss": 0.1194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14447925984859467,
"step": 4015,
"valid_targets_mean": 3494.1,
"valid_targets_min": 699
},
{
"epoch": 6.391096979332273,
"grad_norm": 0.4602774808448654,
"learning_rate": 9.199734992818099e-07,
"loss": 0.1045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10162511467933655,
"step": 4020,
"valid_targets_mean": 4045.6,
"valid_targets_min": 615
},
{
"epoch": 6.399046104928458,
"grad_norm": 0.9217957425599271,
"learning_rate": 8.963512549933795e-07,
"loss": 0.1213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10582847148180008,
"step": 4025,
"valid_targets_mean": 3972.8,
"valid_targets_min": 797
},
{
"epoch": 6.406995230524642,
"grad_norm": 0.48625229787458,
"learning_rate": 8.730292908154614e-07,
"loss": 0.1203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13875703513622284,
"step": 4030,
"valid_targets_mean": 3860.8,
"valid_targets_min": 218
},
{
"epoch": 6.414944356120826,
"grad_norm": 0.4648812460273993,
"learning_rate": 8.500079733336175e-07,
"loss": 0.1114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1072784960269928,
"step": 4035,
"valid_targets_mean": 3870.5,
"valid_targets_min": 841
},
{
"epoch": 6.422893481717011,
"grad_norm": 0.5971157428394955,
"learning_rate": 8.272876644077188e-07,
"loss": 0.1207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16263656318187714,
"step": 4040,
"valid_targets_mean": 3596.1,
"valid_targets_min": 248
},
{
"epoch": 6.4308426073131955,
"grad_norm": 0.4392492224710974,
"learning_rate": 8.048687211662343e-07,
"loss": 0.1076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0819651186466217,
"step": 4045,
"valid_targets_mean": 3597.6,
"valid_targets_min": 296
},
{
"epoch": 6.43879173290938,
"grad_norm": 0.5349233453433273,
"learning_rate": 7.827514960006266e-07,
"loss": 0.1304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.153071790933609,
"step": 4050,
"valid_targets_mean": 4198.1,
"valid_targets_min": 203
},
{
"epoch": 6.4467408585055646,
"grad_norm": 0.5485637315230164,
"learning_rate": 7.609363365598165e-07,
"loss": 0.1192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09980130195617676,
"step": 4055,
"valid_targets_mean": 3078.7,
"valid_targets_min": 266
},
{
"epoch": 6.454689984101749,
"grad_norm": 0.568411168151065,
"learning_rate": 7.394235857447119e-07,
"loss": 0.1233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12002958357334137,
"step": 4060,
"valid_targets_mean": 3055.5,
"valid_targets_min": 277
},
{
"epoch": 6.462639109697934,
"grad_norm": 0.5213091406213507,
"learning_rate": 7.182135817028157e-07,
"loss": 0.109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11195459216833115,
"step": 4065,
"valid_targets_mean": 3587.9,
"valid_targets_min": 839
},
{
"epoch": 6.470588235294118,
"grad_norm": 0.5134486003820178,
"learning_rate": 6.973066578229248e-07,
"loss": 0.121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11719434708356857,
"step": 4070,
"valid_targets_mean": 4122.6,
"valid_targets_min": 848
},
{
"epoch": 6.478537360890302,
"grad_norm": 0.4962383127871119,
"learning_rate": 6.767031427298687e-07,
"loss": 0.1113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11477995663881302,
"step": 4075,
"valid_targets_mean": 3880.5,
"valid_targets_min": 553
},
{
"epoch": 6.486486486486487,
"grad_norm": 0.5116829216283925,
"learning_rate": 6.564033602793584e-07,
"loss": 0.112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10865809768438339,
"step": 4080,
"valid_targets_mean": 3936.4,
"valid_targets_min": 203
},
{
"epoch": 6.494435612082671,
"grad_norm": 0.49006467961889066,
"learning_rate": 6.364076295529042e-07,
"loss": 0.1224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11683492362499237,
"step": 4085,
"valid_targets_mean": 4282.9,
"valid_targets_min": 655
},
{
"epoch": 6.502384737678855,
"grad_norm": 0.6452016504816608,
"learning_rate": 6.167162648527703e-07,
"loss": 0.1167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14076688885688782,
"step": 4090,
"valid_targets_mean": 3114.0,
"valid_targets_min": 562
},
{
"epoch": 6.51033386327504,
"grad_norm": 0.581962945018844,
"learning_rate": 5.973295756970653e-07,
"loss": 0.1153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12058502435684204,
"step": 4095,
"valid_targets_mean": 2951.9,
"valid_targets_min": 215
},
{
"epoch": 6.518282988871224,
"grad_norm": 0.5276399869645112,
"learning_rate": 5.782478668148672e-07,
"loss": 0.1185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12663058936595917,
"step": 4100,
"valid_targets_mean": 3469.2,
"valid_targets_min": 883
},
{
"epoch": 6.526232114467408,
"grad_norm": 0.47852804567749874,
"learning_rate": 5.59471438141419e-07,
"loss": 0.1063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09485980868339539,
"step": 4105,
"valid_targets_mean": 3878.8,
"valid_targets_min": 671
},
{
"epoch": 6.534181240063593,
"grad_norm": 0.4656719855928257,
"learning_rate": 5.410005848134315e-07,
"loss": 0.1125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11063895374536514,
"step": 4110,
"valid_targets_mean": 4169.6,
"valid_targets_min": 555
},
{
"epoch": 6.542130365659777,
"grad_norm": 0.582805206984922,
"learning_rate": 5.228355971644461e-07,
"loss": 0.1196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14886021614074707,
"step": 4115,
"valid_targets_mean": 3361.9,
"valid_targets_min": 205
},
{
"epoch": 6.550079491255962,
"grad_norm": 0.4719462940844744,
"learning_rate": 5.049767607202549e-07,
"loss": 0.1179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10012765973806381,
"step": 4120,
"valid_targets_mean": 4136.4,
"valid_targets_min": 490
},
{
"epoch": 6.558028616852146,
"grad_norm": 1.3556535238795349,
"learning_rate": 4.874243561944214e-07,
"loss": 0.1142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12124701589345932,
"step": 4125,
"valid_targets_mean": 3717.2,
"valid_targets_min": 281
},
{
"epoch": 6.5659777424483305,
"grad_norm": 0.5426225357284815,
"learning_rate": 4.701786594838753e-07,
"loss": 0.1227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13302527368068695,
"step": 4130,
"valid_targets_mean": 3212.1,
"valid_targets_min": 519
},
{
"epoch": 6.573926868044515,
"grad_norm": 0.5217934884004445,
"learning_rate": 4.532399416645694e-07,
"loss": 0.1255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12307184189558029,
"step": 4135,
"valid_targets_mean": 3814.6,
"valid_targets_min": 692
},
{
"epoch": 6.5818759936407,
"grad_norm": 0.46337006848354445,
"learning_rate": 4.366084689872074e-07,
"loss": 0.1306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.146135151386261,
"step": 4140,
"valid_targets_mean": 4986.4,
"valid_targets_min": 1521
},
{
"epoch": 6.589825119236884,
"grad_norm": 0.5660661020795137,
"learning_rate": 4.202845028730829e-07,
"loss": 0.1106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14232556521892548,
"step": 4145,
"valid_targets_mean": 3666.0,
"valid_targets_min": 748
},
{
"epoch": 6.597774244833069,
"grad_norm": 0.5103188227448534,
"learning_rate": 4.0426829990994677e-07,
"loss": 0.109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10854796320199966,
"step": 4150,
"valid_targets_mean": 3345.2,
"valid_targets_min": 706
},
{
"epoch": 6.605723370429253,
"grad_norm": 0.5531875415363303,
"learning_rate": 3.885601118479909e-07,
"loss": 0.1201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13567741215229034,
"step": 4155,
"valid_targets_mean": 3677.8,
"valid_targets_min": 728
},
{
"epoch": 6.613672496025437,
"grad_norm": 0.5680532693391935,
"learning_rate": 3.731601855958844e-07,
"loss": 0.1155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10990526527166367,
"step": 4160,
"valid_targets_mean": 3246.2,
"valid_targets_min": 577
},
{
"epoch": 6.621621621621622,
"grad_norm": 0.8069806110549206,
"learning_rate": 3.5806876321688553e-07,
"loss": 0.1153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15170586109161377,
"step": 4165,
"valid_targets_mean": 3854.2,
"valid_targets_min": 522
},
{
"epoch": 6.629570747217806,
"grad_norm": 0.5399036381526361,
"learning_rate": 3.4328608192505164e-07,
"loss": 0.1269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1231968104839325,
"step": 4170,
"valid_targets_mean": 3397.2,
"valid_targets_min": 324
},
{
"epoch": 6.63751987281399,
"grad_norm": 0.43662516483746666,
"learning_rate": 3.288123740814997e-07,
"loss": 0.1229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11871956288814545,
"step": 4175,
"valid_targets_mean": 5077.1,
"valid_targets_min": 1399
},
{
"epoch": 6.645468998410175,
"grad_norm": 0.52274643112803,
"learning_rate": 3.1464786719075825e-07,
"loss": 0.1063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09565606713294983,
"step": 4180,
"valid_targets_mean": 3180.1,
"valid_targets_min": 220
},
{
"epoch": 6.653418124006359,
"grad_norm": 0.5634216558721306,
"learning_rate": 3.0079278389719246e-07,
"loss": 0.1169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10372507572174072,
"step": 4185,
"valid_targets_mean": 3673.8,
"valid_targets_min": 290
},
{
"epoch": 6.661367249602543,
"grad_norm": 0.6083528281521314,
"learning_rate": 2.8724734198149585e-07,
"loss": 0.1228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09832460433244705,
"step": 4190,
"valid_targets_mean": 3061.6,
"valid_targets_min": 691
},
{
"epoch": 6.669316375198728,
"grad_norm": 0.4419979233676959,
"learning_rate": 2.7401175435727735e-07,
"loss": 0.1118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09950825572013855,
"step": 4195,
"valid_targets_mean": 4492.2,
"valid_targets_min": 591
},
{
"epoch": 6.677265500794912,
"grad_norm": 0.504982275604603,
"learning_rate": 2.61086229067713e-07,
"loss": 0.1111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10245563834905624,
"step": 4200,
"valid_targets_mean": 3867.2,
"valid_targets_min": 1379
},
{
"epoch": 6.685214626391097,
"grad_norm": 0.5140544947040371,
"learning_rate": 2.4847096928226846e-07,
"loss": 0.1193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10791807621717453,
"step": 4205,
"valid_targets_mean": 3571.3,
"valid_targets_min": 891
},
{
"epoch": 6.6931637519872815,
"grad_norm": 0.5413468567786459,
"learning_rate": 2.3616617329351499e-07,
"loss": 0.1141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11113090813159943,
"step": 4210,
"valid_targets_mean": 3172.6,
"valid_targets_min": 281
},
{
"epoch": 6.701112877583466,
"grad_norm": 0.49989740724965176,
"learning_rate": 2.2417203451400749e-07,
"loss": 0.118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11632831394672394,
"step": 4215,
"valid_targets_mean": 3993.2,
"valid_targets_min": 293
},
{
"epoch": 6.709062003179651,
"grad_norm": 0.5360781888423928,
"learning_rate": 2.124887414732424e-07,
"loss": 0.1151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1259898841381073,
"step": 4220,
"valid_targets_mean": 3856.2,
"valid_targets_min": 578
},
{
"epoch": 6.717011128775835,
"grad_norm": 0.5026442130672338,
"learning_rate": 2.0111647781470233e-07,
"loss": 0.1178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10925573855638504,
"step": 4225,
"valid_targets_mean": 3679.4,
"valid_targets_min": 249
},
{
"epoch": 6.724960254372019,
"grad_norm": 0.5622738756387758,
"learning_rate": 1.9005542229295848e-07,
"loss": 0.1117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11003442853689194,
"step": 4230,
"valid_targets_mean": 2934.6,
"valid_targets_min": 533
},
{
"epoch": 6.732909379968204,
"grad_norm": 0.5361206317257745,
"learning_rate": 1.793057487708705e-07,
"loss": 0.1173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11059747636318207,
"step": 4235,
"valid_targets_mean": 3127.6,
"valid_targets_min": 251
},
{
"epoch": 6.740858505564388,
"grad_norm": 0.48942654254164564,
"learning_rate": 1.688676262168465e-07,
"loss": 0.1137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11752250790596008,
"step": 4240,
"valid_targets_mean": 3818.7,
"valid_targets_min": 739
},
{
"epoch": 6.748807631160572,
"grad_norm": 0.45231885595248883,
"learning_rate": 1.5874121870219415e-07,
"loss": 0.1154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11548950523138046,
"step": 4245,
"valid_targets_mean": 4585.7,
"valid_targets_min": 308
},
{
"epoch": 6.756756756756757,
"grad_norm": 0.47395667412902187,
"learning_rate": 1.4892668539853606e-07,
"loss": 0.1143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1214282214641571,
"step": 4250,
"valid_targets_mean": 4161.2,
"valid_targets_min": 765
},
{
"epoch": 6.764705882352941,
"grad_norm": 0.43529395808289495,
"learning_rate": 1.3942418057530714e-07,
"loss": 0.1038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09696638584136963,
"step": 4255,
"valid_targets_mean": 4235.6,
"valid_targets_min": 531
},
{
"epoch": 6.772655007949125,
"grad_norm": 0.4448513095931578,
"learning_rate": 1.3023385359733687e-07,
"loss": 0.1119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10132372379302979,
"step": 4260,
"valid_targets_mean": 4057.3,
"valid_targets_min": 703
},
{
"epoch": 6.78060413354531,
"grad_norm": 0.5547672548578956,
"learning_rate": 1.213558489224953e-07,
"loss": 0.1241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12664559483528137,
"step": 4265,
"valid_targets_mean": 3385.1,
"valid_targets_min": 349
},
{
"epoch": 6.788553259141494,
"grad_norm": 0.4670519878770078,
"learning_rate": 1.1279030609942177e-07,
"loss": 0.1339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12070097029209137,
"step": 4270,
"valid_targets_mean": 5304.9,
"valid_targets_min": 2131
},
{
"epoch": 6.796502384737678,
"grad_norm": 1.1700155137729815,
"learning_rate": 1.0453735976533985e-07,
"loss": 0.1216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12248082458972931,
"step": 4275,
"valid_targets_mean": 4182.2,
"valid_targets_min": 584
},
{
"epoch": 6.804451510333863,
"grad_norm": 0.5171523736974354,
"learning_rate": 9.659713964392358e-08,
"loss": 0.1097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10080324113368988,
"step": 4280,
"valid_targets_mean": 3404.8,
"valid_targets_min": 304
},
{
"epoch": 6.8124006359300475,
"grad_norm": 0.51183917876764,
"learning_rate": 8.896977054328349e-08,
"loss": 0.1078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08926388621330261,
"step": 4285,
"valid_targets_mean": 3781.9,
"valid_targets_min": 334
},
{
"epoch": 6.8203497615262325,
"grad_norm": 0.5317954705582983,
"learning_rate": 8.165537235398146e-08,
"loss": 0.1094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10373544692993164,
"step": 4290,
"valid_targets_mean": 3098.6,
"valid_targets_min": 576
},
{
"epoch": 6.828298887122417,
"grad_norm": 0.46554008682031195,
"learning_rate": 7.465406004715903e-08,
"loss": 0.1124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11525758355855942,
"step": 4295,
"valid_targets_mean": 4444.8,
"valid_targets_min": 834
},
{
"epoch": 6.836248012718601,
"grad_norm": 0.45846708598172736,
"learning_rate": 6.796594367272535e-08,
"loss": 0.1077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09519517421722412,
"step": 4300,
"valid_targets_mean": 3990.9,
"valid_targets_min": 559
},
{
"epoch": 6.844197138314786,
"grad_norm": 0.542174177410134,
"learning_rate": 6.159112835763204e-08,
"loss": 0.1073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09634318947792053,
"step": 4305,
"valid_targets_mean": 3841.8,
"valid_targets_min": 289
},
{
"epoch": 6.85214626391097,
"grad_norm": 0.5687137465211649,
"learning_rate": 5.552971430421439e-08,
"loss": 0.1136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11241281777620316,
"step": 4310,
"valid_targets_mean": 2990.4,
"valid_targets_min": 469
},
{
"epoch": 6.860095389507154,
"grad_norm": 0.4978344358648119,
"learning_rate": 4.9781796788621605e-08,
"loss": 0.1135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11623929440975189,
"step": 4315,
"valid_targets_mean": 3618.5,
"valid_targets_min": 671
},
{
"epoch": 6.868044515103339,
"grad_norm": 0.5297908608971749,
"learning_rate": 4.434746615932018e-08,
"loss": 0.123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11995728313922882,
"step": 4320,
"valid_targets_mean": 3083.2,
"valid_targets_min": 737
},
{
"epoch": 6.875993640699523,
"grad_norm": 0.61054223355744,
"learning_rate": 3.922680783566168e-08,
"loss": 0.1114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11064666509628296,
"step": 4325,
"valid_targets_mean": 3176.7,
"valid_targets_min": 558
},
{
"epoch": 6.883942766295707,
"grad_norm": 0.522298631432037,
"learning_rate": 3.441990230656167e-08,
"loss": 0.1108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11717766523361206,
"step": 4330,
"valid_targets_mean": 3661.9,
"valid_targets_min": 565
},
{
"epoch": 6.891891891891892,
"grad_norm": 0.49498352702719756,
"learning_rate": 2.992682512921175e-08,
"loss": 0.1336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12047946453094482,
"step": 4335,
"valid_targets_mean": 3766.9,
"valid_targets_min": 250
},
{
"epoch": 6.899841017488076,
"grad_norm": 0.5212865153023899,
"learning_rate": 2.574764692790499e-08,
"loss": 0.1193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12060309201478958,
"step": 4340,
"valid_targets_mean": 4045.0,
"valid_targets_min": 1740
},
{
"epoch": 6.907790143084261,
"grad_norm": 0.53810487124348,
"learning_rate": 2.188243339292795e-08,
"loss": 0.1131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11383530497550964,
"step": 4345,
"valid_targets_mean": 4394.4,
"valid_targets_min": 607
},
{
"epoch": 6.915739268680445,
"grad_norm": 0.44962307621678405,
"learning_rate": 1.8331245279517017e-08,
"loss": 0.109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09446686506271362,
"step": 4350,
"valid_targets_mean": 4012.4,
"valid_targets_min": 444
},
{
"epoch": 6.923688394276629,
"grad_norm": 0.5374076189204164,
"learning_rate": 1.509413840691476e-08,
"loss": 0.1113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11552655696868896,
"step": 4355,
"valid_targets_mean": 3191.7,
"valid_targets_min": 280
},
{
"epoch": 6.9316375198728135,
"grad_norm": 0.53179013058553,
"learning_rate": 1.2171163657481722e-08,
"loss": 0.1229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1528531163930893,
"step": 4360,
"valid_targets_mean": 3466.8,
"valid_targets_min": 564
},
{
"epoch": 6.9395866454689985,
"grad_norm": 0.5741198365523206,
"learning_rate": 9.562366975910397e-09,
"loss": 0.1247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1264297068119049,
"step": 4365,
"valid_targets_mean": 3148.3,
"valid_targets_min": 594
},
{
"epoch": 6.947535771065183,
"grad_norm": 0.5093734832614514,
"learning_rate": 7.2677893684880425e-09,
"loss": 0.1153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12815840542316437,
"step": 4370,
"valid_targets_mean": 3770.9,
"valid_targets_min": 295
},
{
"epoch": 6.955484896661368,
"grad_norm": 0.5049584504832715,
"learning_rate": 5.2874669024616246e-09,
"loss": 0.1168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1203048899769783,
"step": 4375,
"valid_targets_mean": 4105.9,
"valid_targets_min": 649
},
{
"epoch": 6.963434022257552,
"grad_norm": 0.5411424955946904,
"learning_rate": 3.621430705467166e-09,
"loss": 0.118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1432824283838272,
"step": 4380,
"valid_targets_mean": 3633.6,
"valid_targets_min": 834
},
{
"epoch": 6.971383147853736,
"grad_norm": 0.508251429943314,
"learning_rate": 2.2697069650456927e-09,
"loss": 0.1183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11797773092985153,
"step": 4385,
"valid_targets_mean": 3701.4,
"valid_targets_min": 610
},
{
"epoch": 6.979332273449921,
"grad_norm": 0.48126946316204494,
"learning_rate": 1.2323169282257852e-09,
"loss": 0.1223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12007807195186615,
"step": 4390,
"valid_targets_mean": 4153.2,
"valid_targets_min": 614
},
{
"epoch": 6.987281399046105,
"grad_norm": 0.5042572172371226,
"learning_rate": 5.092769011860732e-10,
"loss": 0.1192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13380548357963562,
"step": 4395,
"valid_targets_mean": 3818.6,
"valid_targets_min": 1226
},
{
"epoch": 6.995230524642289,
"grad_norm": 0.5243147413835153,
"learning_rate": 1.0059824901098581e-10,
"loss": 0.106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10705508291721344,
"step": 4400,
"valid_targets_mean": 3303.4,
"valid_targets_min": 802
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10637553036212921,
"step": 4403,
"total_flos": 1578618973913088.0,
"train_loss": 0.16220748680723057,
"train_runtime": 24708.9634,
"train_samples_per_second": 2.847,
"train_steps_per_second": 0.178,
"valid_targets_mean": 4107.2,
"valid_targets_min": 717
}
],
"logging_steps": 5,
"max_steps": 4403,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1578618973913088.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}