{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 4739, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.007385524372230428, "grad_norm": 19.97872360716285, "learning_rate": 3.3755274261603377e-07, "loss": 0.624, "loss_nan_ranks": 0, "loss_rank_avg": 0.7236873507499695, "step": 5, "valid_targets_mean": 4191.2, "valid_targets_min": 560 }, { "epoch": 0.014771048744460856, "grad_norm": 16.297750328748872, "learning_rate": 7.59493670886076e-07, "loss": 0.6447, "loss_nan_ranks": 0, "loss_rank_avg": 0.6396403312683105, "step": 10, "valid_targets_mean": 3906.9, "valid_targets_min": 617 }, { "epoch": 0.022156573116691284, "grad_norm": 13.56762186389351, "learning_rate": 1.1814345991561182e-06, "loss": 0.6682, "loss_nan_ranks": 0, "loss_rank_avg": 0.5922929048538208, "step": 15, "valid_targets_mean": 5468.2, "valid_targets_min": 573 }, { "epoch": 0.029542097488921712, "grad_norm": 11.653889962740626, "learning_rate": 1.6033755274261605e-06, "loss": 0.5585, "loss_nan_ranks": 0, "loss_rank_avg": 0.5627623796463013, "step": 20, "valid_targets_mean": 4871.1, "valid_targets_min": 581 }, { "epoch": 0.03692762186115214, "grad_norm": 8.00562953617597, "learning_rate": 2.0253164556962026e-06, "loss": 0.5008, "loss_nan_ranks": 0, "loss_rank_avg": 0.5002298355102539, "step": 25, "valid_targets_mean": 4081.2, "valid_targets_min": 400 }, { "epoch": 0.04431314623338257, "grad_norm": 4.397412308851758, "learning_rate": 2.447257383966245e-06, "loss": 0.4932, "loss_nan_ranks": 0, "loss_rank_avg": 0.4381677806377411, "step": 30, "valid_targets_mean": 5501.4, "valid_targets_min": 638 }, { "epoch": 0.051698670605613, "grad_norm": 2.3819720550400656, "learning_rate": 2.8691983122362873e-06, "loss": 0.4548, "loss_nan_ranks": 0, "loss_rank_avg": 0.4095567464828491, "step": 35, "valid_targets_mean": 6018.8, "valid_targets_min": 479 }, { "epoch": 0.059084194977843424, "grad_norm": 1.5356961908394742, "learning_rate": 3.2911392405063294e-06, "loss": 0.4411, "loss_nan_ranks": 0, "loss_rank_avg": 0.3926240801811218, "step": 40, "valid_targets_mean": 4400.6, "valid_targets_min": 517 }, { "epoch": 0.06646971935007386, "grad_norm": 1.0870293491792131, "learning_rate": 3.713080168776372e-06, "loss": 0.4433, "loss_nan_ranks": 0, "loss_rank_avg": 0.417349636554718, "step": 45, "valid_targets_mean": 5836.1, "valid_targets_min": 762 }, { "epoch": 0.07385524372230429, "grad_norm": 0.943385047160246, "learning_rate": 4.135021097046414e-06, "loss": 0.4154, "loss_nan_ranks": 0, "loss_rank_avg": 0.41143539547920227, "step": 50, "valid_targets_mean": 5084.6, "valid_targets_min": 639 }, { "epoch": 0.08124076809453472, "grad_norm": 1.011998448398478, "learning_rate": 4.556962025316456e-06, "loss": 0.4151, "loss_nan_ranks": 0, "loss_rank_avg": 0.39654070138931274, "step": 55, "valid_targets_mean": 5247.8, "valid_targets_min": 681 }, { "epoch": 0.08862629246676514, "grad_norm": 0.686487046735958, "learning_rate": 4.978902953586498e-06, "loss": 0.3792, "loss_nan_ranks": 0, "loss_rank_avg": 0.33487510681152344, "step": 60, "valid_targets_mean": 5221.6, "valid_targets_min": 490 }, { "epoch": 0.09601181683899557, "grad_norm": 0.571553738713959, "learning_rate": 5.40084388185654e-06, "loss": 0.3743, "loss_nan_ranks": 0, "loss_rank_avg": 0.3575626313686371, "step": 65, "valid_targets_mean": 6041.3, "valid_targets_min": 618 }, { "epoch": 0.103397341211226, "grad_norm": 0.49365785429432335, "learning_rate": 5.8227848101265824e-06, "loss": 0.3463, "loss_nan_ranks": 0, "loss_rank_avg": 0.30460304021835327, "step": 70, "valid_targets_mean": 5298.4, "valid_targets_min": 535 }, { "epoch": 0.11078286558345643, "grad_norm": 0.5050364830057085, "learning_rate": 6.244725738396625e-06, "loss": 0.3399, "loss_nan_ranks": 0, "loss_rank_avg": 0.3081740140914917, "step": 75, "valid_targets_mean": 5255.7, "valid_targets_min": 652 }, { "epoch": 0.11816838995568685, "grad_norm": 0.5226990318037864, "learning_rate": 6.666666666666667e-06, "loss": 0.3904, "loss_nan_ranks": 0, "loss_rank_avg": 0.3145563006401062, "step": 80, "valid_targets_mean": 4663.9, "valid_targets_min": 392 }, { "epoch": 0.1255539143279173, "grad_norm": 0.4881100768231626, "learning_rate": 7.08860759493671e-06, "loss": 0.3726, "loss_nan_ranks": 0, "loss_rank_avg": 0.30497312545776367, "step": 85, "valid_targets_mean": 5632.1, "valid_targets_min": 719 }, { "epoch": 0.1329394387001477, "grad_norm": 0.5237726651638548, "learning_rate": 7.510548523206752e-06, "loss": 0.3544, "loss_nan_ranks": 0, "loss_rank_avg": 0.3278190791606903, "step": 90, "valid_targets_mean": 6220.0, "valid_targets_min": 751 }, { "epoch": 0.14032496307237813, "grad_norm": 0.4650280516019618, "learning_rate": 7.932489451476793e-06, "loss": 0.3182, "loss_nan_ranks": 0, "loss_rank_avg": 0.28953981399536133, "step": 95, "valid_targets_mean": 5031.3, "valid_targets_min": 642 }, { "epoch": 0.14771048744460857, "grad_norm": 0.46371951812182943, "learning_rate": 8.354430379746837e-06, "loss": 0.3099, "loss_nan_ranks": 0, "loss_rank_avg": 0.33909645676612854, "step": 100, "valid_targets_mean": 6196.9, "valid_targets_min": 545 }, { "epoch": 0.155096011816839, "grad_norm": 0.4568538569230339, "learning_rate": 8.776371308016879e-06, "loss": 0.3471, "loss_nan_ranks": 0, "loss_rank_avg": 0.2957189679145813, "step": 105, "valid_targets_mean": 6063.0, "valid_targets_min": 584 }, { "epoch": 0.16248153618906944, "grad_norm": 0.4578520750020651, "learning_rate": 9.198312236286921e-06, "loss": 0.3276, "loss_nan_ranks": 0, "loss_rank_avg": 0.29967236518859863, "step": 110, "valid_targets_mean": 6171.0, "valid_targets_min": 540 }, { "epoch": 0.16986706056129985, "grad_norm": 0.4955996123561873, "learning_rate": 9.620253164556963e-06, "loss": 0.3176, "loss_nan_ranks": 0, "loss_rank_avg": 0.2830328941345215, "step": 115, "valid_targets_mean": 4840.9, "valid_targets_min": 454 }, { "epoch": 0.17725258493353027, "grad_norm": 0.5471230185393541, "learning_rate": 1.0042194092827005e-05, "loss": 0.3219, "loss_nan_ranks": 0, "loss_rank_avg": 0.36016958951950073, "step": 120, "valid_targets_mean": 4376.1, "valid_targets_min": 605 }, { "epoch": 0.18463810930576072, "grad_norm": 0.5075473057243887, "learning_rate": 1.0464135021097049e-05, "loss": 0.3135, "loss_nan_ranks": 0, "loss_rank_avg": 0.314586877822876, "step": 125, "valid_targets_mean": 4974.8, "valid_targets_min": 615 }, { "epoch": 0.19202363367799113, "grad_norm": 0.4679315871943788, "learning_rate": 1.088607594936709e-05, "loss": 0.2943, "loss_nan_ranks": 0, "loss_rank_avg": 0.27506357431411743, "step": 130, "valid_targets_mean": 5003.4, "valid_targets_min": 309 }, { "epoch": 0.19940915805022155, "grad_norm": 0.5203002455514378, "learning_rate": 1.1308016877637132e-05, "loss": 0.3111, "loss_nan_ranks": 0, "loss_rank_avg": 0.3530064821243286, "step": 135, "valid_targets_mean": 4744.3, "valid_targets_min": 380 }, { "epoch": 0.206794682422452, "grad_norm": 0.508532245402902, "learning_rate": 1.1729957805907175e-05, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.26319918036460876, "step": 140, "valid_targets_mean": 4969.9, "valid_targets_min": 298 }, { "epoch": 0.21418020679468242, "grad_norm": 0.4977333684095323, "learning_rate": 1.2151898734177216e-05, "loss": 0.2864, "loss_nan_ranks": 0, "loss_rank_avg": 0.281037300825119, "step": 145, "valid_targets_mean": 4680.9, "valid_targets_min": 553 }, { "epoch": 0.22156573116691286, "grad_norm": 0.5700488921766971, "learning_rate": 1.2573839662447258e-05, "loss": 0.3138, "loss_nan_ranks": 0, "loss_rank_avg": 0.3317258059978485, "step": 150, "valid_targets_mean": 4780.8, "valid_targets_min": 613 }, { "epoch": 0.22895125553914328, "grad_norm": 0.5049210471064856, "learning_rate": 1.29957805907173e-05, "loss": 0.2939, "loss_nan_ranks": 0, "loss_rank_avg": 0.31507956981658936, "step": 155, "valid_targets_mean": 4951.3, "valid_targets_min": 648 }, { "epoch": 0.2363367799113737, "grad_norm": 0.48733685753987915, "learning_rate": 1.3417721518987344e-05, "loss": 0.3144, "loss_nan_ranks": 0, "loss_rank_avg": 0.3532077670097351, "step": 160, "valid_targets_mean": 5704.9, "valid_targets_min": 615 }, { "epoch": 0.24372230428360414, "grad_norm": 0.478477178779921, "learning_rate": 1.3839662447257384e-05, "loss": 0.2889, "loss_nan_ranks": 0, "loss_rank_avg": 0.25617825984954834, "step": 165, "valid_targets_mean": 5201.0, "valid_targets_min": 614 }, { "epoch": 0.2511078286558346, "grad_norm": 0.6185796972171613, "learning_rate": 1.4261603375527426e-05, "loss": 0.2979, "loss_nan_ranks": 0, "loss_rank_avg": 0.3018920421600342, "step": 170, "valid_targets_mean": 4082.6, "valid_targets_min": 595 }, { "epoch": 0.258493353028065, "grad_norm": 0.5575122691401694, "learning_rate": 1.468354430379747e-05, "loss": 0.2849, "loss_nan_ranks": 0, "loss_rank_avg": 0.2911016345024109, "step": 175, "valid_targets_mean": 4299.9, "valid_targets_min": 662 }, { "epoch": 0.2658788774002954, "grad_norm": 0.6276828580042122, "learning_rate": 1.5105485232067512e-05, "loss": 0.2649, "loss_nan_ranks": 0, "loss_rank_avg": 0.25065547227859497, "step": 180, "valid_targets_mean": 4217.5, "valid_targets_min": 388 }, { "epoch": 0.27326440177252587, "grad_norm": 0.4696050024959157, "learning_rate": 1.5527426160337554e-05, "loss": 0.2938, "loss_nan_ranks": 0, "loss_rank_avg": 0.2493332028388977, "step": 185, "valid_targets_mean": 5711.5, "valid_targets_min": 679 }, { "epoch": 0.28064992614475626, "grad_norm": 0.5623419824234117, "learning_rate": 1.5949367088607598e-05, "loss": 0.2589, "loss_nan_ranks": 0, "loss_rank_avg": 0.27796900272369385, "step": 190, "valid_targets_mean": 4589.1, "valid_targets_min": 592 }, { "epoch": 0.2880354505169867, "grad_norm": 0.45269545432048147, "learning_rate": 1.637130801687764e-05, "loss": 0.243, "loss_nan_ranks": 0, "loss_rank_avg": 0.23348630964756012, "step": 195, "valid_targets_mean": 6195.4, "valid_targets_min": 1406 }, { "epoch": 0.29542097488921715, "grad_norm": 0.5800039153836231, "learning_rate": 1.679324894514768e-05, "loss": 0.2751, "loss_nan_ranks": 0, "loss_rank_avg": 0.3133583664894104, "step": 200, "valid_targets_mean": 4379.1, "valid_targets_min": 577 }, { "epoch": 0.30280649926144754, "grad_norm": 0.4475247352688734, "learning_rate": 1.7215189873417723e-05, "loss": 0.2688, "loss_nan_ranks": 0, "loss_rank_avg": 0.2346859574317932, "step": 205, "valid_targets_mean": 5674.9, "valid_targets_min": 516 }, { "epoch": 0.310192023633678, "grad_norm": 0.6043039588064852, "learning_rate": 1.7637130801687767e-05, "loss": 0.284, "loss_nan_ranks": 0, "loss_rank_avg": 0.2985689640045166, "step": 210, "valid_targets_mean": 3230.7, "valid_targets_min": 451 }, { "epoch": 0.3175775480059084, "grad_norm": 0.46608512023497484, "learning_rate": 1.8059071729957807e-05, "loss": 0.2621, "loss_nan_ranks": 0, "loss_rank_avg": 0.2667817175388336, "step": 215, "valid_targets_mean": 5615.9, "valid_targets_min": 608 }, { "epoch": 0.3249630723781389, "grad_norm": 0.6393799102975143, "learning_rate": 1.848101265822785e-05, "loss": 0.2857, "loss_nan_ranks": 0, "loss_rank_avg": 0.3485134243965149, "step": 220, "valid_targets_mean": 5232.9, "valid_targets_min": 551 }, { "epoch": 0.33234859675036926, "grad_norm": 0.4985956967264833, "learning_rate": 1.890295358649789e-05, "loss": 0.2504, "loss_nan_ranks": 0, "loss_rank_avg": 0.22727638483047485, "step": 225, "valid_targets_mean": 5186.1, "valid_targets_min": 557 }, { "epoch": 0.3397341211225997, "grad_norm": 0.698867408214604, "learning_rate": 1.9324894514767935e-05, "loss": 0.277, "loss_nan_ranks": 0, "loss_rank_avg": 0.28445443511009216, "step": 230, "valid_targets_mean": 4395.3, "valid_targets_min": 613 }, { "epoch": 0.34711964549483015, "grad_norm": 0.4699161647524185, "learning_rate": 1.974683544303798e-05, "loss": 0.2863, "loss_nan_ranks": 0, "loss_rank_avg": 0.27419084310531616, "step": 235, "valid_targets_mean": 6050.6, "valid_targets_min": 697 }, { "epoch": 0.35450516986706054, "grad_norm": 0.49712308816298567, "learning_rate": 2.0168776371308016e-05, "loss": 0.2654, "loss_nan_ranks": 0, "loss_rank_avg": 0.2411026805639267, "step": 240, "valid_targets_mean": 6215.0, "valid_targets_min": 375 }, { "epoch": 0.361890694239291, "grad_norm": 0.4755998361435196, "learning_rate": 2.0590717299578063e-05, "loss": 0.2812, "loss_nan_ranks": 0, "loss_rank_avg": 0.31807953119277954, "step": 245, "valid_targets_mean": 5977.3, "valid_targets_min": 222 }, { "epoch": 0.36927621861152143, "grad_norm": 0.5522737703807714, "learning_rate": 2.1012658227848103e-05, "loss": 0.2728, "loss_nan_ranks": 0, "loss_rank_avg": 0.2637110650539398, "step": 250, "valid_targets_mean": 4707.1, "valid_targets_min": 424 }, { "epoch": 0.3766617429837518, "grad_norm": 0.5752807812899275, "learning_rate": 2.1434599156118144e-05, "loss": 0.2675, "loss_nan_ranks": 0, "loss_rank_avg": 0.252408891916275, "step": 255, "valid_targets_mean": 4646.9, "valid_targets_min": 620 }, { "epoch": 0.38404726735598227, "grad_norm": 0.4839304938690229, "learning_rate": 2.1856540084388188e-05, "loss": 0.2899, "loss_nan_ranks": 0, "loss_rank_avg": 0.311644971370697, "step": 260, "valid_targets_mean": 6014.4, "valid_targets_min": 320 }, { "epoch": 0.3914327917282127, "grad_norm": 0.3679428184390633, "learning_rate": 2.2278481012658228e-05, "loss": 0.2603, "loss_nan_ranks": 0, "loss_rank_avg": 0.1715935468673706, "step": 265, "valid_targets_mean": 7149.1, "valid_targets_min": 708 }, { "epoch": 0.3988183161004431, "grad_norm": 0.4388882366281187, "learning_rate": 2.270042194092827e-05, "loss": 0.2662, "loss_nan_ranks": 0, "loss_rank_avg": 0.21887677907943726, "step": 270, "valid_targets_mean": 5259.7, "valid_targets_min": 462 }, { "epoch": 0.40620384047267355, "grad_norm": 0.45156140818813745, "learning_rate": 2.3122362869198316e-05, "loss": 0.243, "loss_nan_ranks": 0, "loss_rank_avg": 0.1979508399963379, "step": 275, "valid_targets_mean": 5245.2, "valid_targets_min": 370 }, { "epoch": 0.413589364844904, "grad_norm": 0.5635183886045622, "learning_rate": 2.3544303797468356e-05, "loss": 0.2644, "loss_nan_ranks": 0, "loss_rank_avg": 0.2971973419189453, "step": 280, "valid_targets_mean": 4294.6, "valid_targets_min": 250 }, { "epoch": 0.42097488921713444, "grad_norm": 0.6003559911338966, "learning_rate": 2.39662447257384e-05, "loss": 0.2701, "loss_nan_ranks": 0, "loss_rank_avg": 0.27018484473228455, "step": 285, "valid_targets_mean": 4037.1, "valid_targets_min": 530 }, { "epoch": 0.42836041358936483, "grad_norm": 0.519146451009721, "learning_rate": 2.438818565400844e-05, "loss": 0.2749, "loss_nan_ranks": 0, "loss_rank_avg": 0.25247296690940857, "step": 290, "valid_targets_mean": 5198.4, "valid_targets_min": 757 }, { "epoch": 0.4357459379615953, "grad_norm": 0.5295365016140835, "learning_rate": 2.481012658227848e-05, "loss": 0.2734, "loss_nan_ranks": 0, "loss_rank_avg": 0.30645301938056946, "step": 295, "valid_targets_mean": 5075.9, "valid_targets_min": 586 }, { "epoch": 0.4431314623338257, "grad_norm": 0.5064359925137679, "learning_rate": 2.5232067510548524e-05, "loss": 0.2615, "loss_nan_ranks": 0, "loss_rank_avg": 0.27146783471107483, "step": 300, "valid_targets_mean": 5670.0, "valid_targets_min": 510 }, { "epoch": 0.4505169867060561, "grad_norm": 0.4807884411055291, "learning_rate": 2.5654008438818568e-05, "loss": 0.2637, "loss_nan_ranks": 0, "loss_rank_avg": 0.245832160115242, "step": 305, "valid_targets_mean": 4988.6, "valid_targets_min": 758 }, { "epoch": 0.45790251107828656, "grad_norm": 0.4874621524760727, "learning_rate": 2.6075949367088612e-05, "loss": 0.2355, "loss_nan_ranks": 0, "loss_rank_avg": 0.22424304485321045, "step": 310, "valid_targets_mean": 4865.2, "valid_targets_min": 690 }, { "epoch": 0.465288035450517, "grad_norm": 0.5241781469793773, "learning_rate": 2.6497890295358652e-05, "loss": 0.2674, "loss_nan_ranks": 0, "loss_rank_avg": 0.2541046142578125, "step": 315, "valid_targets_mean": 4655.8, "valid_targets_min": 303 }, { "epoch": 0.4726735598227474, "grad_norm": 0.6693714356739207, "learning_rate": 2.6919831223628693e-05, "loss": 0.2598, "loss_nan_ranks": 0, "loss_rank_avg": 0.3150583803653717, "step": 320, "valid_targets_mean": 3789.6, "valid_targets_min": 323 }, { "epoch": 0.48005908419497784, "grad_norm": 0.4049583166705286, "learning_rate": 2.7341772151898737e-05, "loss": 0.2634, "loss_nan_ranks": 0, "loss_rank_avg": 0.19988644123077393, "step": 325, "valid_targets_mean": 6250.1, "valid_targets_min": 565 }, { "epoch": 0.4874446085672083, "grad_norm": 0.5683986043691779, "learning_rate": 2.7763713080168777e-05, "loss": 0.2955, "loss_nan_ranks": 0, "loss_rank_avg": 0.30885380506515503, "step": 330, "valid_targets_mean": 4539.6, "valid_targets_min": 511 }, { "epoch": 0.4948301329394387, "grad_norm": 0.4293798580209713, "learning_rate": 2.8185654008438824e-05, "loss": 0.2476, "loss_nan_ranks": 0, "loss_rank_avg": 0.2373587191104889, "step": 335, "valid_targets_mean": 6893.3, "valid_targets_min": 540 }, { "epoch": 0.5022156573116692, "grad_norm": 0.5051385898465901, "learning_rate": 2.8607594936708865e-05, "loss": 0.2575, "loss_nan_ranks": 0, "loss_rank_avg": 0.2349412590265274, "step": 340, "valid_targets_mean": 5513.8, "valid_targets_min": 348 }, { "epoch": 0.5096011816838996, "grad_norm": 0.453650649705282, "learning_rate": 2.9029535864978905e-05, "loss": 0.2487, "loss_nan_ranks": 0, "loss_rank_avg": 0.24615350365638733, "step": 345, "valid_targets_mean": 5636.8, "valid_targets_min": 632 }, { "epoch": 0.51698670605613, "grad_norm": 0.5026094522177535, "learning_rate": 2.945147679324895e-05, "loss": 0.2865, "loss_nan_ranks": 0, "loss_rank_avg": 0.25473105907440186, "step": 350, "valid_targets_mean": 4648.2, "valid_targets_min": 618 }, { "epoch": 0.5243722304283605, "grad_norm": 0.5473929641026576, "learning_rate": 2.987341772151899e-05, "loss": 0.2454, "loss_nan_ranks": 0, "loss_rank_avg": 0.25512436032295227, "step": 355, "valid_targets_mean": 4888.8, "valid_targets_min": 455 }, { "epoch": 0.5317577548005908, "grad_norm": 0.6818407765763758, "learning_rate": 3.029535864978903e-05, "loss": 0.251, "loss_nan_ranks": 0, "loss_rank_avg": 0.26583975553512573, "step": 360, "valid_targets_mean": 3901.6, "valid_targets_min": 393 }, { "epoch": 0.5391432791728212, "grad_norm": 0.43264528877861325, "learning_rate": 3.0717299578059074e-05, "loss": 0.248, "loss_nan_ranks": 0, "loss_rank_avg": 0.2336602509021759, "step": 365, "valid_targets_mean": 6759.1, "valid_targets_min": 654 }, { "epoch": 0.5465288035450517, "grad_norm": 0.4786744793085355, "learning_rate": 3.113924050632912e-05, "loss": 0.2568, "loss_nan_ranks": 0, "loss_rank_avg": 0.23913979530334473, "step": 370, "valid_targets_mean": 5128.6, "valid_targets_min": 436 }, { "epoch": 0.5539143279172821, "grad_norm": 0.6098930815067188, "learning_rate": 3.156118143459916e-05, "loss": 0.2664, "loss_nan_ranks": 0, "loss_rank_avg": 0.27685385942459106, "step": 375, "valid_targets_mean": 4722.4, "valid_targets_min": 547 }, { "epoch": 0.5612998522895125, "grad_norm": 0.4884326875060275, "learning_rate": 3.19831223628692e-05, "loss": 0.2529, "loss_nan_ranks": 0, "loss_rank_avg": 0.269244909286499, "step": 380, "valid_targets_mean": 5746.3, "valid_targets_min": 649 }, { "epoch": 0.568685376661743, "grad_norm": 0.6966159287505779, "learning_rate": 3.240506329113924e-05, "loss": 0.2452, "loss_nan_ranks": 0, "loss_rank_avg": 0.25672098994255066, "step": 385, "valid_targets_mean": 5211.0, "valid_targets_min": 451 }, { "epoch": 0.5760709010339734, "grad_norm": 0.4826433803477916, "learning_rate": 3.282700421940928e-05, "loss": 0.2588, "loss_nan_ranks": 0, "loss_rank_avg": 0.21904008090496063, "step": 390, "valid_targets_mean": 4840.0, "valid_targets_min": 614 }, { "epoch": 0.5834564254062038, "grad_norm": 0.5161328067549831, "learning_rate": 3.324894514767932e-05, "loss": 0.2401, "loss_nan_ranks": 0, "loss_rank_avg": 0.21546295285224915, "step": 395, "valid_targets_mean": 5000.8, "valid_targets_min": 474 }, { "epoch": 0.5908419497784343, "grad_norm": 0.441903839632028, "learning_rate": 3.367088607594937e-05, "loss": 0.2326, "loss_nan_ranks": 0, "loss_rank_avg": 0.2418462634086609, "step": 400, "valid_targets_mean": 6752.2, "valid_targets_min": 526 }, { "epoch": 0.5982274741506647, "grad_norm": 0.4263460620059315, "learning_rate": 3.409282700421941e-05, "loss": 0.2489, "loss_nan_ranks": 0, "loss_rank_avg": 0.2564152479171753, "step": 405, "valid_targets_mean": 5806.5, "valid_targets_min": 581 }, { "epoch": 0.6056129985228951, "grad_norm": 0.4114391570850889, "learning_rate": 3.451476793248946e-05, "loss": 0.2561, "loss_nan_ranks": 0, "loss_rank_avg": 0.19688798487186432, "step": 410, "valid_targets_mean": 5193.4, "valid_targets_min": 765 }, { "epoch": 0.6129985228951256, "grad_norm": 0.560472208109208, "learning_rate": 3.49367088607595e-05, "loss": 0.3089, "loss_nan_ranks": 0, "loss_rank_avg": 0.3748968243598938, "step": 415, "valid_targets_mean": 6106.8, "valid_targets_min": 673 }, { "epoch": 0.620384047267356, "grad_norm": 0.4389773616307953, "learning_rate": 3.535864978902954e-05, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.25939327478408813, "step": 420, "valid_targets_mean": 5600.4, "valid_targets_min": 587 }, { "epoch": 0.6277695716395865, "grad_norm": 0.49005945851489136, "learning_rate": 3.578059071729958e-05, "loss": 0.2352, "loss_nan_ranks": 0, "loss_rank_avg": 0.2415715903043747, "step": 425, "valid_targets_mean": 5480.6, "valid_targets_min": 557 }, { "epoch": 0.6351550960118169, "grad_norm": 0.6120232650144795, "learning_rate": 3.6202531645569626e-05, "loss": 0.2384, "loss_nan_ranks": 0, "loss_rank_avg": 0.27258408069610596, "step": 430, "valid_targets_mean": 4020.8, "valid_targets_min": 575 }, { "epoch": 0.6425406203840472, "grad_norm": 0.5517761299010163, "learning_rate": 3.6624472573839666e-05, "loss": 0.248, "loss_nan_ranks": 0, "loss_rank_avg": 0.2571716904640198, "step": 435, "valid_targets_mean": 3986.9, "valid_targets_min": 570 }, { "epoch": 0.6499261447562777, "grad_norm": 0.4519259500134533, "learning_rate": 3.704641350210971e-05, "loss": 0.2584, "loss_nan_ranks": 0, "loss_rank_avg": 0.23544706404209137, "step": 440, "valid_targets_mean": 5446.1, "valid_targets_min": 798 }, { "epoch": 0.6573116691285081, "grad_norm": 0.4627225505498187, "learning_rate": 3.746835443037975e-05, "loss": 0.2572, "loss_nan_ranks": 0, "loss_rank_avg": 0.22768300771713257, "step": 445, "valid_targets_mean": 5305.9, "valid_targets_min": 612 }, { "epoch": 0.6646971935007385, "grad_norm": 0.5459862764397345, "learning_rate": 3.7890295358649794e-05, "loss": 0.2509, "loss_nan_ranks": 0, "loss_rank_avg": 0.2680595815181732, "step": 450, "valid_targets_mean": 3753.4, "valid_targets_min": 637 }, { "epoch": 0.672082717872969, "grad_norm": 0.5037347511570361, "learning_rate": 3.8312236286919835e-05, "loss": 0.2492, "loss_nan_ranks": 0, "loss_rank_avg": 0.2467479407787323, "step": 455, "valid_targets_mean": 5501.6, "valid_targets_min": 310 }, { "epoch": 0.6794682422451994, "grad_norm": 0.4327775289602796, "learning_rate": 3.873417721518988e-05, "loss": 0.2367, "loss_nan_ranks": 0, "loss_rank_avg": 0.19664692878723145, "step": 460, "valid_targets_mean": 5931.2, "valid_targets_min": 913 }, { "epoch": 0.6868537666174298, "grad_norm": 0.4409637060996679, "learning_rate": 3.915611814345992e-05, "loss": 0.2239, "loss_nan_ranks": 0, "loss_rank_avg": 0.21506735682487488, "step": 465, "valid_targets_mean": 6059.1, "valid_targets_min": 647 }, { "epoch": 0.6942392909896603, "grad_norm": 0.5504576504647792, "learning_rate": 3.957805907172996e-05, "loss": 0.2497, "loss_nan_ranks": 0, "loss_rank_avg": 0.2300184667110443, "step": 470, "valid_targets_mean": 3839.0, "valid_targets_min": 557 }, { "epoch": 0.7016248153618907, "grad_norm": 0.429274562141855, "learning_rate": 4e-05, "loss": 0.2322, "loss_nan_ranks": 0, "loss_rank_avg": 0.2237507700920105, "step": 475, "valid_targets_mean": 6357.5, "valid_targets_min": 742 }, { "epoch": 0.7090103397341211, "grad_norm": 0.7536006693457217, "learning_rate": 3.9999864355811366e-05, "loss": 0.2377, "loss_nan_ranks": 0, "loss_rank_avg": 0.22905516624450684, "step": 480, "valid_targets_mean": 4381.5, "valid_targets_min": 729 }, { "epoch": 0.7163958641063516, "grad_norm": 0.43953758941215776, "learning_rate": 3.99994574250854e-05, "loss": 0.2316, "loss_nan_ranks": 0, "loss_rank_avg": 0.20200951397418976, "step": 485, "valid_targets_mean": 5644.1, "valid_targets_min": 683 }, { "epoch": 0.723781388478582, "grad_norm": 0.4723664561759756, "learning_rate": 3.999877921334187e-05, "loss": 0.2475, "loss_nan_ranks": 0, "loss_rank_avg": 0.26116621494293213, "step": 490, "valid_targets_mean": 5649.9, "valid_targets_min": 598 }, { "epoch": 0.7311669128508124, "grad_norm": 0.5372942073144541, "learning_rate": 3.999782972978035e-05, "loss": 0.2515, "loss_nan_ranks": 0, "loss_rank_avg": 0.2597278356552124, "step": 495, "valid_targets_mean": 4376.8, "valid_targets_min": 711 }, { "epoch": 0.7385524372230429, "grad_norm": 0.4923885109877066, "learning_rate": 3.9996608987280005e-05, "loss": 0.2537, "loss_nan_ranks": 0, "loss_rank_avg": 0.3310204744338989, "step": 500, "valid_targets_mean": 5373.9, "valid_targets_min": 362 }, { "epoch": 0.7459379615952733, "grad_norm": 0.4360411302968856, "learning_rate": 3.999511700239951e-05, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.23595163226127625, "step": 505, "valid_targets_mean": 5867.7, "valid_targets_min": 747 }, { "epoch": 0.7533234859675036, "grad_norm": 0.4125019822494474, "learning_rate": 3.999335379537677e-05, "loss": 0.2542, "loss_nan_ranks": 0, "loss_rank_avg": 0.22982177138328552, "step": 510, "valid_targets_mean": 5860.2, "valid_targets_min": 284 }, { "epoch": 0.7607090103397341, "grad_norm": 0.4816111850196653, "learning_rate": 3.999131939012866e-05, "loss": 0.2421, "loss_nan_ranks": 0, "loss_rank_avg": 0.23170827329158783, "step": 515, "valid_targets_mean": 5939.9, "valid_targets_min": 573 }, { "epoch": 0.7680945347119645, "grad_norm": 0.5607421617686298, "learning_rate": 3.998901381425072e-05, "loss": 0.2555, "loss_nan_ranks": 0, "loss_rank_avg": 0.27282047271728516, "step": 520, "valid_targets_mean": 4010.6, "valid_targets_min": 308 }, { "epoch": 0.7754800590841949, "grad_norm": 0.4899434940882494, "learning_rate": 3.998643709901673e-05, "loss": 0.2255, "loss_nan_ranks": 0, "loss_rank_avg": 0.2315795123577118, "step": 525, "valid_targets_mean": 4446.6, "valid_targets_min": 755 }, { "epoch": 0.7828655834564254, "grad_norm": 0.4551383882144779, "learning_rate": 3.998358927937835e-05, "loss": 0.2489, "loss_nan_ranks": 0, "loss_rank_avg": 0.21953409910202026, "step": 530, "valid_targets_mean": 5531.2, "valid_targets_min": 538 }, { "epoch": 0.7902511078286558, "grad_norm": 0.4743224847774692, "learning_rate": 3.9980470393964584e-05, "loss": 0.2604, "loss_nan_ranks": 0, "loss_rank_avg": 0.23994377255439758, "step": 535, "valid_targets_mean": 4992.5, "valid_targets_min": 499 }, { "epoch": 0.7976366322008862, "grad_norm": 0.42125006599133685, "learning_rate": 3.997708048508131e-05, "loss": 0.2232, "loss_nan_ranks": 0, "loss_rank_avg": 0.19587251543998718, "step": 540, "valid_targets_mean": 5289.6, "valid_targets_min": 667 }, { "epoch": 0.8050221565731167, "grad_norm": 0.524726561877271, "learning_rate": 3.997341959871066e-05, "loss": 0.2255, "loss_nan_ranks": 0, "loss_rank_avg": 0.21869216859340668, "step": 545, "valid_targets_mean": 4091.0, "valid_targets_min": 641 }, { "epoch": 0.8124076809453471, "grad_norm": 1.0978518384034786, "learning_rate": 3.996948778451044e-05, "loss": 0.2382, "loss_nan_ranks": 0, "loss_rank_avg": 0.2922288179397583, "step": 550, "valid_targets_mean": 4755.1, "valid_targets_min": 683 }, { "epoch": 0.8197932053175776, "grad_norm": 0.434588106606303, "learning_rate": 3.996528509581343e-05, "loss": 0.2525, "loss_nan_ranks": 0, "loss_rank_avg": 0.2291834056377411, "step": 555, "valid_targets_mean": 6349.8, "valid_targets_min": 911 }, { "epoch": 0.827178729689808, "grad_norm": 0.44781488594353586, "learning_rate": 3.996081158962664e-05, "loss": 0.2481, "loss_nan_ranks": 0, "loss_rank_avg": 0.21667613089084625, "step": 560, "valid_targets_mean": 5273.2, "valid_targets_min": 510 }, { "epoch": 0.8345642540620384, "grad_norm": 0.4232290679425604, "learning_rate": 3.995606732663061e-05, "loss": 0.2432, "loss_nan_ranks": 0, "loss_rank_avg": 0.21859529614448547, "step": 565, "valid_targets_mean": 6958.2, "valid_targets_min": 578 }, { "epoch": 0.8419497784342689, "grad_norm": 0.37603814378739714, "learning_rate": 3.9951052371178484e-05, "loss": 0.2041, "loss_nan_ranks": 0, "loss_rank_avg": 0.20742715895175934, "step": 570, "valid_targets_mean": 6439.2, "valid_targets_min": 948 }, { "epoch": 0.8493353028064993, "grad_norm": 0.5330316503851572, "learning_rate": 3.994576679129523e-05, "loss": 0.2666, "loss_nan_ranks": 0, "loss_rank_avg": 0.27818042039871216, "step": 575, "valid_targets_mean": 4627.2, "valid_targets_min": 603 }, { "epoch": 0.8567208271787297, "grad_norm": 0.48524432401103307, "learning_rate": 3.9940210658676674e-05, "loss": 0.2502, "loss_nan_ranks": 0, "loss_rank_avg": 0.2559252977371216, "step": 580, "valid_targets_mean": 4795.9, "valid_targets_min": 476 }, { "epoch": 0.8641063515509602, "grad_norm": 0.49687821950248273, "learning_rate": 3.993438404868851e-05, "loss": 0.2306, "loss_nan_ranks": 0, "loss_rank_avg": 0.22851648926734924, "step": 585, "valid_targets_mean": 5150.0, "valid_targets_min": 523 }, { "epoch": 0.8714918759231906, "grad_norm": 0.4956097153548755, "learning_rate": 3.9928287040365334e-05, "loss": 0.2521, "loss_nan_ranks": 0, "loss_rank_avg": 0.29340338706970215, "step": 590, "valid_targets_mean": 4955.4, "valid_targets_min": 602 }, { "epoch": 0.8788774002954209, "grad_norm": 0.47621975231571884, "learning_rate": 3.992191971640951e-05, "loss": 0.2342, "loss_nan_ranks": 0, "loss_rank_avg": 0.27463576197624207, "step": 595, "valid_targets_mean": 5440.9, "valid_targets_min": 602 }, { "epoch": 0.8862629246676514, "grad_norm": 0.4864192134736827, "learning_rate": 3.9915282163190084e-05, "loss": 0.2436, "loss_nan_ranks": 0, "loss_rank_avg": 0.202743798494339, "step": 600, "valid_targets_mean": 4574.8, "valid_targets_min": 529 }, { "epoch": 0.8936484490398818, "grad_norm": 0.4436441374970087, "learning_rate": 3.990837447074162e-05, "loss": 0.2602, "loss_nan_ranks": 0, "loss_rank_avg": 0.2884596586227417, "step": 605, "valid_targets_mean": 5406.1, "valid_targets_min": 654 }, { "epoch": 0.9010339734121122, "grad_norm": 0.5091014640879844, "learning_rate": 3.990119673276294e-05, "loss": 0.2381, "loss_nan_ranks": 0, "loss_rank_avg": 0.2561118006706238, "step": 610, "valid_targets_mean": 3856.2, "valid_targets_min": 395 }, { "epoch": 0.9084194977843427, "grad_norm": 0.44293254378519337, "learning_rate": 3.989374904661589e-05, "loss": 0.2338, "loss_nan_ranks": 0, "loss_rank_avg": 0.2175714075565338, "step": 615, "valid_targets_mean": 5307.1, "valid_targets_min": 654 }, { "epoch": 0.9158050221565731, "grad_norm": 0.4969299448859931, "learning_rate": 3.988603151332402e-05, "loss": 0.2485, "loss_nan_ranks": 0, "loss_rank_avg": 0.23327939212322235, "step": 620, "valid_targets_mean": 4357.9, "valid_targets_min": 932 }, { "epoch": 0.9231905465288035, "grad_norm": 0.399043646975211, "learning_rate": 3.987804423757116e-05, "loss": 0.2444, "loss_nan_ranks": 0, "loss_rank_avg": 0.2003873586654663, "step": 625, "valid_targets_mean": 6620.2, "valid_targets_min": 717 }, { "epoch": 0.930576070901034, "grad_norm": 0.5569804334944528, "learning_rate": 3.986978732770008e-05, "loss": 0.2415, "loss_nan_ranks": 0, "loss_rank_avg": 0.25180336833000183, "step": 630, "valid_targets_mean": 5835.9, "valid_targets_min": 632 }, { "epoch": 0.9379615952732644, "grad_norm": 0.65226776693925, "learning_rate": 3.986126089571096e-05, "loss": 0.2397, "loss_nan_ranks": 0, "loss_rank_avg": 0.25059741735458374, "step": 635, "valid_targets_mean": 4920.8, "valid_targets_min": 558 }, { "epoch": 0.9453471196454948, "grad_norm": 0.7108324020329172, "learning_rate": 3.98524650572599e-05, "loss": 0.2417, "loss_nan_ranks": 0, "loss_rank_avg": 0.2292698323726654, "step": 640, "valid_targets_mean": 6018.6, "valid_targets_min": 596 }, { "epoch": 0.9527326440177253, "grad_norm": 0.6100872297295562, "learning_rate": 3.984339993165733e-05, "loss": 0.2483, "loss_nan_ranks": 0, "loss_rank_avg": 0.2530120611190796, "step": 645, "valid_targets_mean": 4852.8, "valid_targets_min": 491 }, { "epoch": 0.9601181683899557, "grad_norm": 0.6894230566439239, "learning_rate": 3.9834065641866405e-05, "loss": 0.2243, "loss_nan_ranks": 0, "loss_rank_avg": 0.2521514594554901, "step": 650, "valid_targets_mean": 4665.9, "valid_targets_min": 651 }, { "epoch": 0.9675036927621861, "grad_norm": 0.6477076251824874, "learning_rate": 3.9824462314501355e-05, "loss": 0.2148, "loss_nan_ranks": 0, "loss_rank_avg": 0.21362358331680298, "step": 655, "valid_targets_mean": 5620.9, "valid_targets_min": 775 }, { "epoch": 0.9748892171344166, "grad_norm": 0.4865282373044303, "learning_rate": 3.981459007982573e-05, "loss": 0.2421, "loss_nan_ranks": 0, "loss_rank_avg": 0.22964204847812653, "step": 660, "valid_targets_mean": 4150.7, "valid_targets_min": 476 }, { "epoch": 0.982274741506647, "grad_norm": 0.4265759209620169, "learning_rate": 3.980444907175065e-05, "loss": 0.2221, "loss_nan_ranks": 0, "loss_rank_avg": 0.23872928321361542, "step": 665, "valid_targets_mean": 4645.1, "valid_targets_min": 490 }, { "epoch": 0.9896602658788775, "grad_norm": 0.4337931141291071, "learning_rate": 3.979403942783301e-05, "loss": 0.2218, "loss_nan_ranks": 0, "loss_rank_avg": 0.21394482254981995, "step": 670, "valid_targets_mean": 5586.5, "valid_targets_min": 583 }, { "epoch": 0.9970457902511078, "grad_norm": 0.44216457771241374, "learning_rate": 3.9783361289273565e-05, "loss": 0.2307, "loss_nan_ranks": 0, "loss_rank_avg": 0.2214493751525879, "step": 675, "valid_targets_mean": 5189.8, "valid_targets_min": 490 }, { "epoch": 1.0044313146233383, "grad_norm": 0.4033533200689087, "learning_rate": 3.977241480091507e-05, "loss": 0.2128, "loss_nan_ranks": 0, "loss_rank_avg": 0.21175044775009155, "step": 680, "valid_targets_mean": 6346.5, "valid_targets_min": 2699 }, { "epoch": 1.0118168389955686, "grad_norm": 0.485561570780159, "learning_rate": 3.976120011124027e-05, "loss": 0.2282, "loss_nan_ranks": 0, "loss_rank_avg": 0.2394808530807495, "step": 685, "valid_targets_mean": 5191.0, "valid_targets_min": 764 }, { "epoch": 1.0192023633677991, "grad_norm": 0.4391190385256597, "learning_rate": 3.974971737236992e-05, "loss": 0.217, "loss_nan_ranks": 0, "loss_rank_avg": 0.23937949538230896, "step": 690, "valid_targets_mean": 5908.1, "valid_targets_min": 742 }, { "epoch": 1.0265878877400296, "grad_norm": 0.44514329511208256, "learning_rate": 3.9737966740060694e-05, "loss": 0.2508, "loss_nan_ranks": 0, "loss_rank_avg": 0.20545028150081635, "step": 695, "valid_targets_mean": 4889.1, "valid_targets_min": 246 }, { "epoch": 1.03397341211226, "grad_norm": 0.5296228485775536, "learning_rate": 3.97259483737031e-05, "loss": 0.2484, "loss_nan_ranks": 0, "loss_rank_avg": 0.25395631790161133, "step": 700, "valid_targets_mean": 5731.1, "valid_targets_min": 556 }, { "epoch": 1.0413589364844904, "grad_norm": 0.4073116341963712, "learning_rate": 3.9713662436319283e-05, "loss": 0.2603, "loss_nan_ranks": 0, "loss_rank_avg": 0.234715536236763, "step": 705, "valid_targets_mean": 5917.2, "valid_targets_min": 781 }, { "epoch": 1.048744460856721, "grad_norm": 0.4815030594150368, "learning_rate": 3.9701109094560844e-05, "loss": 0.2399, "loss_nan_ranks": 0, "loss_rank_avg": 0.2784745395183563, "step": 710, "valid_targets_mean": 4806.1, "valid_targets_min": 559 }, { "epoch": 1.0561299852289512, "grad_norm": 0.49302209706755173, "learning_rate": 3.9688288518706576e-05, "loss": 0.2118, "loss_nan_ranks": 0, "loss_rank_avg": 0.2195298820734024, "step": 715, "valid_targets_mean": 4878.7, "valid_targets_min": 652 }, { "epoch": 1.0635155096011817, "grad_norm": 0.5556432641590098, "learning_rate": 3.967520088266014e-05, "loss": 0.2649, "loss_nan_ranks": 0, "loss_rank_avg": 0.3123176097869873, "step": 720, "valid_targets_mean": 4661.2, "valid_targets_min": 459 }, { "epoch": 1.0709010339734122, "grad_norm": 0.4534308645642078, "learning_rate": 3.96618463639477e-05, "loss": 0.2204, "loss_nan_ranks": 0, "loss_rank_avg": 0.2006494402885437, "step": 725, "valid_targets_mean": 4573.6, "valid_targets_min": 623 }, { "epoch": 1.0782865583456425, "grad_norm": 0.47188855620624076, "learning_rate": 3.9648225143715565e-05, "loss": 0.2215, "loss_nan_ranks": 0, "loss_rank_avg": 0.2375321090221405, "step": 730, "valid_targets_mean": 5050.3, "valid_targets_min": 697 }, { "epoch": 1.085672082717873, "grad_norm": 0.5815500233739369, "learning_rate": 3.9634337406727646e-05, "loss": 0.2268, "loss_nan_ranks": 0, "loss_rank_avg": 0.2476039081811905, "step": 735, "valid_targets_mean": 4952.1, "valid_targets_min": 620 }, { "epoch": 1.0930576070901035, "grad_norm": 0.44455506894558233, "learning_rate": 3.962018334136304e-05, "loss": 0.204, "loss_nan_ranks": 0, "loss_rank_avg": 0.2000984251499176, "step": 740, "valid_targets_mean": 5665.1, "valid_targets_min": 564 }, { "epoch": 1.1004431314623337, "grad_norm": 0.41891782048261406, "learning_rate": 3.960576313961342e-05, "loss": 0.2056, "loss_nan_ranks": 0, "loss_rank_avg": 0.20635861158370972, "step": 745, "valid_targets_mean": 5981.8, "valid_targets_min": 553 }, { "epoch": 1.1078286558345642, "grad_norm": 0.43106390225148533, "learning_rate": 3.9591076997080425e-05, "loss": 0.2206, "loss_nan_ranks": 0, "loss_rank_avg": 0.23344707489013672, "step": 750, "valid_targets_mean": 5677.6, "valid_targets_min": 682 }, { "epoch": 1.1152141802067947, "grad_norm": 0.41866856940372654, "learning_rate": 3.9576125112973064e-05, "loss": 0.2259, "loss_nan_ranks": 0, "loss_rank_avg": 0.2010667622089386, "step": 755, "valid_targets_mean": 5764.6, "valid_targets_min": 755 }, { "epoch": 1.122599704579025, "grad_norm": 0.3898308822960811, "learning_rate": 3.956090769010495e-05, "loss": 0.228, "loss_nan_ranks": 0, "loss_rank_avg": 0.21998938918113708, "step": 760, "valid_targets_mean": 7065.8, "valid_targets_min": 606 }, { "epoch": 1.1299852289512555, "grad_norm": 0.4317215373352644, "learning_rate": 3.954542493489158e-05, "loss": 0.2377, "loss_nan_ranks": 0, "loss_rank_avg": 0.23063355684280396, "step": 765, "valid_targets_mean": 6418.8, "valid_targets_min": 710 }, { "epoch": 1.137370753323486, "grad_norm": 0.4412576392418719, "learning_rate": 3.952967705734752e-05, "loss": 0.2179, "loss_nan_ranks": 0, "loss_rank_avg": 0.20747151970863342, "step": 770, "valid_targets_mean": 5115.1, "valid_targets_min": 600 }, { "epoch": 1.1447562776957163, "grad_norm": 0.5452994774328421, "learning_rate": 3.951366427108359e-05, "loss": 0.2195, "loss_nan_ranks": 0, "loss_rank_avg": 0.2622203826904297, "step": 775, "valid_targets_mean": 3728.9, "valid_targets_min": 762 }, { "epoch": 1.1521418020679468, "grad_norm": 0.4161239474977219, "learning_rate": 3.9497386793303934e-05, "loss": 0.2184, "loss_nan_ranks": 0, "loss_rank_avg": 0.23140665888786316, "step": 780, "valid_targets_mean": 6516.1, "valid_targets_min": 521 }, { "epoch": 1.1595273264401773, "grad_norm": 0.4996982771781497, "learning_rate": 3.9480844844803065e-05, "loss": 0.2289, "loss_nan_ranks": 0, "loss_rank_avg": 0.21708938479423523, "step": 785, "valid_targets_mean": 4092.6, "valid_targets_min": 491 }, { "epoch": 1.1669128508124076, "grad_norm": 0.43107207086038685, "learning_rate": 3.946403864996291e-05, "loss": 0.222, "loss_nan_ranks": 0, "loss_rank_avg": 0.19202640652656555, "step": 790, "valid_targets_mean": 5623.8, "valid_targets_min": 567 }, { "epoch": 1.174298375184638, "grad_norm": 0.6020812405004927, "learning_rate": 3.944696843674973e-05, "loss": 0.2265, "loss_nan_ranks": 0, "loss_rank_avg": 0.267403244972229, "step": 795, "valid_targets_mean": 3391.2, "valid_targets_min": 617 }, { "epoch": 1.1816838995568686, "grad_norm": 0.4663676848971227, "learning_rate": 3.942963443671105e-05, "loss": 0.2218, "loss_nan_ranks": 0, "loss_rank_avg": 0.2613796889781952, "step": 800, "valid_targets_mean": 5378.3, "valid_targets_min": 552 }, { "epoch": 1.1890694239290989, "grad_norm": 0.4485332389236638, "learning_rate": 3.9412036884972515e-05, "loss": 0.2151, "loss_nan_ranks": 0, "loss_rank_avg": 0.2017560601234436, "step": 805, "valid_targets_mean": 4622.5, "valid_targets_min": 531 }, { "epoch": 1.1964549483013294, "grad_norm": 0.47317157878156907, "learning_rate": 3.939417602023467e-05, "loss": 0.2169, "loss_nan_ranks": 0, "loss_rank_avg": 0.2027883231639862, "step": 810, "valid_targets_mean": 4890.3, "valid_targets_min": 638 }, { "epoch": 1.2038404726735599, "grad_norm": 0.5193762458310359, "learning_rate": 3.937605208476979e-05, "loss": 0.2488, "loss_nan_ranks": 0, "loss_rank_avg": 0.23114809393882751, "step": 815, "valid_targets_mean": 4104.7, "valid_targets_min": 659 }, { "epoch": 1.2112259970457901, "grad_norm": 0.5116940935110126, "learning_rate": 3.93576653244185e-05, "loss": 0.24, "loss_nan_ranks": 0, "loss_rank_avg": 0.3086828291416168, "step": 820, "valid_targets_mean": 5347.4, "valid_targets_min": 692 }, { "epoch": 1.2186115214180206, "grad_norm": 0.6948645135111495, "learning_rate": 3.933901598858653e-05, "loss": 0.2134, "loss_nan_ranks": 0, "loss_rank_avg": 0.23770800232887268, "step": 825, "valid_targets_mean": 4581.4, "valid_targets_min": 575 }, { "epoch": 1.2259970457902511, "grad_norm": 0.3666222705529873, "learning_rate": 3.9320104330241294e-05, "loss": 0.22, "loss_nan_ranks": 0, "loss_rank_avg": 0.20173095166683197, "step": 830, "valid_targets_mean": 7597.5, "valid_targets_min": 563 }, { "epoch": 1.2333825701624814, "grad_norm": 0.4553744544104897, "learning_rate": 3.9300930605908434e-05, "loss": 0.2226, "loss_nan_ranks": 0, "loss_rank_avg": 0.2501322031021118, "step": 835, "valid_targets_mean": 5175.3, "valid_targets_min": 477 }, { "epoch": 1.240768094534712, "grad_norm": 0.4074174770824338, "learning_rate": 3.928149507566838e-05, "loss": 0.2287, "loss_nan_ranks": 0, "loss_rank_avg": 0.21756581962108612, "step": 840, "valid_targets_mean": 5838.4, "valid_targets_min": 709 }, { "epoch": 1.2481536189069424, "grad_norm": 0.3903886869594378, "learning_rate": 3.926179800315281e-05, "loss": 0.2103, "loss_nan_ranks": 0, "loss_rank_avg": 0.19205650687217712, "step": 845, "valid_targets_mean": 5413.8, "valid_targets_min": 497 }, { "epoch": 1.2555391432791727, "grad_norm": 0.48872055489952576, "learning_rate": 3.924183965554106e-05, "loss": 0.2295, "loss_nan_ranks": 0, "loss_rank_avg": 0.2304544299840927, "step": 850, "valid_targets_mean": 5223.9, "valid_targets_min": 362 }, { "epoch": 1.2629246676514032, "grad_norm": 0.5971024562814735, "learning_rate": 3.9221620303556515e-05, "loss": 0.2035, "loss_nan_ranks": 0, "loss_rank_avg": 0.1931340992450714, "step": 855, "valid_targets_mean": 6235.6, "valid_targets_min": 698 }, { "epoch": 1.2703101920236337, "grad_norm": 0.441865132454004, "learning_rate": 3.9201140221462947e-05, "loss": 0.2123, "loss_nan_ranks": 0, "loss_rank_avg": 0.19833971560001373, "step": 860, "valid_targets_mean": 4980.0, "valid_targets_min": 229 }, { "epoch": 1.277695716395864, "grad_norm": 0.448378137812601, "learning_rate": 3.918039968706076e-05, "loss": 0.2303, "loss_nan_ranks": 0, "loss_rank_avg": 0.2166500836610794, "step": 865, "valid_targets_mean": 4924.2, "valid_targets_min": 586 }, { "epoch": 1.2850812407680945, "grad_norm": 0.38685678373728877, "learning_rate": 3.9159398981683245e-05, "loss": 0.2115, "loss_nan_ranks": 0, "loss_rank_avg": 0.17539414763450623, "step": 870, "valid_targets_mean": 6035.1, "valid_targets_min": 928 }, { "epoch": 1.292466765140325, "grad_norm": 0.4163449238539416, "learning_rate": 3.9138138390192776e-05, "loss": 0.218, "loss_nan_ranks": 0, "loss_rank_avg": 0.2028162181377411, "step": 875, "valid_targets_mean": 5722.0, "valid_targets_min": 752 }, { "epoch": 1.2998522895125553, "grad_norm": 0.5685979494164379, "learning_rate": 3.911661820097691e-05, "loss": 0.2277, "loss_nan_ranks": 0, "loss_rank_avg": 0.27309101819992065, "step": 880, "valid_targets_mean": 3300.4, "valid_targets_min": 311 }, { "epoch": 1.3072378138847858, "grad_norm": 0.4369045779107333, "learning_rate": 3.909483870594452e-05, "loss": 0.2162, "loss_nan_ranks": 0, "loss_rank_avg": 0.2015451192855835, "step": 885, "valid_targets_mean": 5269.7, "valid_targets_min": 571 }, { "epoch": 1.3146233382570163, "grad_norm": 0.4193133405997814, "learning_rate": 3.9072800200521785e-05, "loss": 0.1985, "loss_nan_ranks": 0, "loss_rank_avg": 0.21048672497272491, "step": 890, "valid_targets_mean": 5464.1, "valid_targets_min": 748 }, { "epoch": 1.3220088626292466, "grad_norm": 0.388531558281405, "learning_rate": 3.905050298364824e-05, "loss": 0.2062, "loss_nan_ranks": 0, "loss_rank_avg": 0.16509976983070374, "step": 895, "valid_targets_mean": 5191.9, "valid_targets_min": 517 }, { "epoch": 1.329394387001477, "grad_norm": 0.47820157235033706, "learning_rate": 3.9027947357772664e-05, "loss": 0.2165, "loss_nan_ranks": 0, "loss_rank_avg": 0.2072378247976303, "step": 900, "valid_targets_mean": 4629.8, "valid_targets_min": 702 }, { "epoch": 1.3367799113737076, "grad_norm": 0.4354737992607275, "learning_rate": 3.900513362884901e-05, "loss": 0.2212, "loss_nan_ranks": 0, "loss_rank_avg": 0.20593631267547607, "step": 905, "valid_targets_mean": 4609.3, "valid_targets_min": 531 }, { "epoch": 1.3441654357459378, "grad_norm": 0.49663576162369527, "learning_rate": 3.8982062106332264e-05, "loss": 0.2397, "loss_nan_ranks": 0, "loss_rank_avg": 0.23853272199630737, "step": 910, "valid_targets_mean": 3835.1, "valid_targets_min": 564 }, { "epoch": 1.3515509601181683, "grad_norm": 0.46267728260164404, "learning_rate": 3.895873310317422e-05, "loss": 0.2136, "loss_nan_ranks": 0, "loss_rank_avg": 0.20141030848026276, "step": 915, "valid_targets_mean": 4257.8, "valid_targets_min": 807 }, { "epoch": 1.3589364844903988, "grad_norm": 0.4318042167691161, "learning_rate": 3.893514693581924e-05, "loss": 0.2379, "loss_nan_ranks": 0, "loss_rank_avg": 0.23438894748687744, "step": 920, "valid_targets_mean": 5685.5, "valid_targets_min": 637 }, { "epoch": 1.3663220088626291, "grad_norm": 0.46703807691935706, "learning_rate": 3.8911303924199976e-05, "loss": 0.2218, "loss_nan_ranks": 0, "loss_rank_avg": 0.22170604765415192, "step": 925, "valid_targets_mean": 4579.6, "valid_targets_min": 648 }, { "epoch": 1.3737075332348596, "grad_norm": 0.49253435998552936, "learning_rate": 3.888720439173304e-05, "loss": 0.2104, "loss_nan_ranks": 0, "loss_rank_avg": 0.18895632028579712, "step": 930, "valid_targets_mean": 5223.1, "valid_targets_min": 874 }, { "epoch": 1.3810930576070901, "grad_norm": 0.37295680843818396, "learning_rate": 3.886284866531457e-05, "loss": 0.2459, "loss_nan_ranks": 0, "loss_rank_avg": 0.23819585144519806, "step": 935, "valid_targets_mean": 7344.1, "valid_targets_min": 516 }, { "epoch": 1.3884785819793206, "grad_norm": 0.45860088434234825, "learning_rate": 3.883823707531585e-05, "loss": 0.2207, "loss_nan_ranks": 0, "loss_rank_avg": 0.20355328917503357, "step": 940, "valid_targets_mean": 4777.0, "valid_targets_min": 822 }, { "epoch": 1.395864106351551, "grad_norm": 0.4813637468871037, "learning_rate": 3.8813369955578795e-05, "loss": 0.2443, "loss_nan_ranks": 0, "loss_rank_avg": 0.24247971177101135, "step": 945, "valid_targets_mean": 4676.9, "valid_targets_min": 461 }, { "epoch": 1.4032496307237814, "grad_norm": 0.44965533755939013, "learning_rate": 3.878824764341143e-05, "loss": 0.2358, "loss_nan_ranks": 0, "loss_rank_avg": 0.2948012351989746, "step": 950, "valid_targets_mean": 6391.8, "valid_targets_min": 665 }, { "epoch": 1.410635155096012, "grad_norm": 0.4957030075557271, "learning_rate": 3.876287047958331e-05, "loss": 0.2266, "loss_nan_ranks": 0, "loss_rank_avg": 0.2564036250114441, "step": 955, "valid_targets_mean": 4930.7, "valid_targets_min": 709 }, { "epoch": 1.4180206794682422, "grad_norm": 0.4689797114164809, "learning_rate": 3.8737238808320936e-05, "loss": 0.2226, "loss_nan_ranks": 0, "loss_rank_avg": 0.23838871717453003, "step": 960, "valid_targets_mean": 4520.2, "valid_targets_min": 581 }, { "epoch": 1.4254062038404727, "grad_norm": 0.45226562564371103, "learning_rate": 3.8711352977303015e-05, "loss": 0.22, "loss_nan_ranks": 0, "loss_rank_avg": 0.19582833349704742, "step": 965, "valid_targets_mean": 4792.9, "valid_targets_min": 336 }, { "epoch": 1.4327917282127032, "grad_norm": 0.4499057955750725, "learning_rate": 3.868521333765581e-05, "loss": 0.2247, "loss_nan_ranks": 0, "loss_rank_avg": 0.21399438381195068, "step": 970, "valid_targets_mean": 5207.8, "valid_targets_min": 535 }, { "epoch": 1.4401772525849335, "grad_norm": 0.3550283452289212, "learning_rate": 3.865882024394834e-05, "loss": 0.2005, "loss_nan_ranks": 0, "loss_rank_avg": 0.17050230503082275, "step": 975, "valid_targets_mean": 6535.8, "valid_targets_min": 578 }, { "epoch": 1.447562776957164, "grad_norm": 0.3851306477864997, "learning_rate": 3.863217405418759e-05, "loss": 0.216, "loss_nan_ranks": 0, "loss_rank_avg": 0.205580934882164, "step": 980, "valid_targets_mean": 5663.9, "valid_targets_min": 868 }, { "epoch": 1.4549483013293945, "grad_norm": 0.5896596645032985, "learning_rate": 3.8605275129813626e-05, "loss": 0.246, "loss_nan_ranks": 0, "loss_rank_avg": 0.21005357801914215, "step": 985, "valid_targets_mean": 4708.6, "valid_targets_min": 768 }, { "epoch": 1.4623338257016247, "grad_norm": 0.48610764474272555, "learning_rate": 3.857812383569473e-05, "loss": 0.2101, "loss_nan_ranks": 0, "loss_rank_avg": 0.22247350215911865, "step": 990, "valid_targets_mean": 5245.6, "valid_targets_min": 643 }, { "epoch": 1.4697193500738552, "grad_norm": 0.4265714039395906, "learning_rate": 3.8550720540122436e-05, "loss": 0.2177, "loss_nan_ranks": 0, "loss_rank_avg": 0.2506152391433716, "step": 995, "valid_targets_mean": 5852.4, "valid_targets_min": 679 }, { "epoch": 1.4771048744460857, "grad_norm": 0.418243711485139, "learning_rate": 3.852306561480652e-05, "loss": 0.2186, "loss_nan_ranks": 0, "loss_rank_avg": 0.25498437881469727, "step": 1000, "valid_targets_mean": 6060.9, "valid_targets_min": 585 }, { "epoch": 1.4844903988183162, "grad_norm": 0.5725357827213264, "learning_rate": 3.8495159434869966e-05, "loss": 0.231, "loss_nan_ranks": 0, "loss_rank_avg": 0.222720205783844, "step": 1005, "valid_targets_mean": 5578.1, "valid_targets_min": 424 }, { "epoch": 1.4918759231905465, "grad_norm": 0.7420773277261102, "learning_rate": 3.846700237884389e-05, "loss": 0.2322, "loss_nan_ranks": 0, "loss_rank_avg": 0.2858394980430603, "step": 1010, "valid_targets_mean": 3759.1, "valid_targets_min": 407 }, { "epoch": 1.499261447562777, "grad_norm": 0.4640644425487349, "learning_rate": 3.84385948286624e-05, "loss": 0.2085, "loss_nan_ranks": 0, "loss_rank_avg": 0.21131858229637146, "step": 1015, "valid_targets_mean": 4703.7, "valid_targets_min": 460 }, { "epoch": 1.5066469719350075, "grad_norm": 0.47403611928498096, "learning_rate": 3.8409937169657393e-05, "loss": 0.2401, "loss_nan_ranks": 0, "loss_rank_avg": 0.2791014313697815, "step": 1020, "valid_targets_mean": 5770.7, "valid_targets_min": 572 }, { "epoch": 1.5140324963072378, "grad_norm": 0.3527301227310117, "learning_rate": 3.8381029790553376e-05, "loss": 0.2216, "loss_nan_ranks": 0, "loss_rank_avg": 0.21376456320285797, "step": 1025, "valid_targets_mean": 7688.9, "valid_targets_min": 1061 }, { "epoch": 1.5214180206794683, "grad_norm": 0.48244790889065403, "learning_rate": 3.8351873083462135e-05, "loss": 0.2246, "loss_nan_ranks": 0, "loss_rank_avg": 0.22939425706863403, "step": 1030, "valid_targets_mean": 3952.4, "valid_targets_min": 614 }, { "epoch": 1.5288035450516988, "grad_norm": 0.4441322237358841, "learning_rate": 3.832246744387746e-05, "loss": 0.2262, "loss_nan_ranks": 0, "loss_rank_avg": 0.19595670700073242, "step": 1035, "valid_targets_mean": 5734.9, "valid_targets_min": 602 }, { "epoch": 1.536189069423929, "grad_norm": 0.42687842371627116, "learning_rate": 3.829281327066977e-05, "loss": 0.2278, "loss_nan_ranks": 0, "loss_rank_avg": 0.2039499282836914, "step": 1040, "valid_targets_mean": 5575.5, "valid_targets_min": 567 }, { "epoch": 1.5435745937961596, "grad_norm": 0.4616898715899763, "learning_rate": 3.826291096608068e-05, "loss": 0.2166, "loss_nan_ranks": 0, "loss_rank_avg": 0.24281984567642212, "step": 1045, "valid_targets_mean": 4569.6, "valid_targets_min": 566 }, { "epoch": 1.55096011816839, "grad_norm": 0.516188071513123, "learning_rate": 3.823276093571758e-05, "loss": 0.2119, "loss_nan_ranks": 0, "loss_rank_avg": 0.23861096799373627, "step": 1050, "valid_targets_mean": 5593.9, "valid_targets_min": 756 }, { "epoch": 1.5583456425406204, "grad_norm": 0.4323810628023057, "learning_rate": 3.820236358854812e-05, "loss": 0.1997, "loss_nan_ranks": 0, "loss_rank_avg": 0.18166664242744446, "step": 1055, "valid_targets_mean": 5191.4, "valid_targets_min": 548 }, { "epoch": 1.5657311669128509, "grad_norm": 0.41249483128752723, "learning_rate": 3.817171933689464e-05, "loss": 0.2096, "loss_nan_ranks": 0, "loss_rank_avg": 0.21327346563339233, "step": 1060, "valid_targets_mean": 6157.4, "valid_targets_min": 587 }, { "epoch": 1.5731166912850814, "grad_norm": 0.4280649794546595, "learning_rate": 3.81408285964286e-05, "loss": 0.2028, "loss_nan_ranks": 0, "loss_rank_avg": 0.2045423984527588, "step": 1065, "valid_targets_mean": 5231.2, "valid_targets_min": 583 }, { "epoch": 1.5805022156573116, "grad_norm": 0.3567235937466317, "learning_rate": 3.810969178616495e-05, "loss": 0.2053, "loss_nan_ranks": 0, "loss_rank_avg": 0.1872180700302124, "step": 1070, "valid_targets_mean": 6435.2, "valid_targets_min": 828 }, { "epoch": 1.5878877400295421, "grad_norm": 0.3967044287073082, "learning_rate": 3.807830932845643e-05, "loss": 0.2183, "loss_nan_ranks": 0, "loss_rank_avg": 0.21867504715919495, "step": 1075, "valid_targets_mean": 5695.5, "valid_targets_min": 370 }, { "epoch": 1.5952732644017726, "grad_norm": 0.4258406051484541, "learning_rate": 3.8046681648987826e-05, "loss": 0.2088, "loss_nan_ranks": 0, "loss_rank_avg": 0.21099427342414856, "step": 1080, "valid_targets_mean": 5131.6, "valid_targets_min": 578 }, { "epoch": 1.602658788774003, "grad_norm": 0.4734317720239788, "learning_rate": 3.801480917677025e-05, "loss": 0.2409, "loss_nan_ranks": 0, "loss_rank_avg": 0.20774179697036743, "step": 1085, "valid_targets_mean": 3967.3, "valid_targets_min": 535 }, { "epoch": 1.6100443131462334, "grad_norm": 0.44845704175379064, "learning_rate": 3.798269234413525e-05, "loss": 0.2214, "loss_nan_ranks": 0, "loss_rank_avg": 0.22882190346717834, "step": 1090, "valid_targets_mean": 4234.2, "valid_targets_min": 453 }, { "epoch": 1.617429837518464, "grad_norm": 0.43870094592908176, "learning_rate": 3.795033158672901e-05, "loss": 0.2071, "loss_nan_ranks": 0, "loss_rank_avg": 0.20205071568489075, "step": 1095, "valid_targets_mean": 4710.2, "valid_targets_min": 390 }, { "epoch": 1.6248153618906942, "grad_norm": 0.46114331054142615, "learning_rate": 3.7917727343506384e-05, "loss": 0.2268, "loss_nan_ranks": 0, "loss_rank_avg": 0.2182081788778305, "step": 1100, "valid_targets_mean": 4210.6, "valid_targets_min": 630 }, { "epoch": 1.6322008862629247, "grad_norm": 0.46898057951501565, "learning_rate": 3.788488005672499e-05, "loss": 0.2218, "loss_nan_ranks": 0, "loss_rank_avg": 0.18588444590568542, "step": 1105, "valid_targets_mean": 5456.4, "valid_targets_min": 697 }, { "epoch": 1.6395864106351552, "grad_norm": 0.46882204005729433, "learning_rate": 3.785179017193918e-05, "loss": 0.2269, "loss_nan_ranks": 0, "loss_rank_avg": 0.2911528944969177, "step": 1110, "valid_targets_mean": 5871.7, "valid_targets_min": 546 }, { "epoch": 1.6469719350073855, "grad_norm": 0.5024285712997323, "learning_rate": 3.781845813799402e-05, "loss": 0.2262, "loss_nan_ranks": 0, "loss_rank_avg": 0.2931421101093292, "step": 1115, "valid_targets_mean": 4670.3, "valid_targets_min": 451 }, { "epoch": 1.654357459379616, "grad_norm": 0.42105185416660457, "learning_rate": 3.778488440701918e-05, "loss": 0.2037, "loss_nan_ranks": 0, "loss_rank_avg": 0.22011511027812958, "step": 1120, "valid_targets_mean": 4687.1, "valid_targets_min": 298 }, { "epoch": 1.6617429837518465, "grad_norm": 0.4534305852538249, "learning_rate": 3.77510694344228e-05, "loss": 0.2097, "loss_nan_ranks": 0, "loss_rank_avg": 0.18383678793907166, "step": 1125, "valid_targets_mean": 5405.8, "valid_targets_min": 726 }, { "epoch": 1.6691285081240768, "grad_norm": 0.3951289835886458, "learning_rate": 3.771701367888534e-05, "loss": 0.2383, "loss_nan_ranks": 0, "loss_rank_avg": 0.17336603999137878, "step": 1130, "valid_targets_mean": 5009.2, "valid_targets_min": 395 }, { "epoch": 1.6765140324963073, "grad_norm": 0.4886944664495892, "learning_rate": 3.7682717602353336e-05, "loss": 0.2271, "loss_nan_ranks": 0, "loss_rank_avg": 0.2188146710395813, "step": 1135, "valid_targets_mean": 3926.0, "valid_targets_min": 310 }, { "epoch": 1.6838995568685378, "grad_norm": 0.39480650462231015, "learning_rate": 3.7648181670033125e-05, "loss": 0.221, "loss_nan_ranks": 0, "loss_rank_avg": 0.20998279750347137, "step": 1140, "valid_targets_mean": 6034.9, "valid_targets_min": 592 }, { "epoch": 1.691285081240768, "grad_norm": 0.39214825097931927, "learning_rate": 3.761340635038456e-05, "loss": 0.2173, "loss_nan_ranks": 0, "loss_rank_avg": 0.1979064792394638, "step": 1145, "valid_targets_mean": 7045.8, "valid_targets_min": 525 }, { "epoch": 1.6986706056129985, "grad_norm": 0.38111774464102766, "learning_rate": 3.7578392115114655e-05, "loss": 0.2119, "loss_nan_ranks": 0, "loss_rank_avg": 0.20325309038162231, "step": 1150, "valid_targets_mean": 6202.9, "valid_targets_min": 630 }, { "epoch": 1.706056129985229, "grad_norm": 0.404770101827888, "learning_rate": 3.754313943917115e-05, "loss": 0.1936, "loss_nan_ranks": 0, "loss_rank_avg": 0.1922975480556488, "step": 1155, "valid_targets_mean": 5763.9, "valid_targets_min": 528 }, { "epoch": 1.7134416543574593, "grad_norm": 0.4064959538938459, "learning_rate": 3.7507648800736116e-05, "loss": 0.2044, "loss_nan_ranks": 0, "loss_rank_avg": 0.2195628136396408, "step": 1160, "valid_targets_mean": 5726.2, "valid_targets_min": 795 }, { "epoch": 1.7208271787296898, "grad_norm": 0.5078776991250893, "learning_rate": 3.747192068121943e-05, "loss": 0.2166, "loss_nan_ranks": 0, "loss_rank_avg": 0.24034610390663147, "step": 1165, "valid_targets_mean": 4283.9, "valid_targets_min": 309 }, { "epoch": 1.7282127031019203, "grad_norm": 0.5067333046365079, "learning_rate": 3.743595556525228e-05, "loss": 0.2192, "loss_nan_ranks": 0, "loss_rank_avg": 0.2246871292591095, "step": 1170, "valid_targets_mean": 3702.9, "valid_targets_min": 529 }, { "epoch": 1.7355982274741506, "grad_norm": 0.5019937895256118, "learning_rate": 3.7399753940680556e-05, "loss": 0.2053, "loss_nan_ranks": 0, "loss_rank_avg": 0.20047210156917572, "step": 1175, "valid_targets_mean": 3960.8, "valid_targets_min": 472 }, { "epoch": 1.742983751846381, "grad_norm": 0.41047915116673045, "learning_rate": 3.736331629855826e-05, "loss": 0.2262, "loss_nan_ranks": 0, "loss_rank_avg": 0.2049740105867386, "step": 1180, "valid_targets_mean": 5736.0, "valid_targets_min": 815 }, { "epoch": 1.7503692762186116, "grad_norm": 0.3945106153005012, "learning_rate": 3.7326643133140833e-05, "loss": 0.2165, "loss_nan_ranks": 0, "loss_rank_avg": 0.20625770092010498, "step": 1185, "valid_targets_mean": 6195.1, "valid_targets_min": 250 }, { "epoch": 1.7577548005908419, "grad_norm": 0.4106742085350737, "learning_rate": 3.7289734941878455e-05, "loss": 0.2029, "loss_nan_ranks": 0, "loss_rank_avg": 0.24206054210662842, "step": 1190, "valid_targets_mean": 6082.2, "valid_targets_min": 568 }, { "epoch": 1.7651403249630724, "grad_norm": 0.5200799032564574, "learning_rate": 3.7252592225409285e-05, "loss": 0.2448, "loss_nan_ranks": 0, "loss_rank_avg": 0.28392231464385986, "step": 1195, "valid_targets_mean": 3605.9, "valid_targets_min": 523 }, { "epoch": 1.7725258493353029, "grad_norm": 0.470687041134897, "learning_rate": 3.721521548755269e-05, "loss": 0.221, "loss_nan_ranks": 0, "loss_rank_avg": 0.21265387535095215, "step": 1200, "valid_targets_mean": 4151.9, "valid_targets_min": 541 }, { "epoch": 1.7799113737075332, "grad_norm": 0.4428156443932358, "learning_rate": 3.71776052353024e-05, "loss": 0.2121, "loss_nan_ranks": 0, "loss_rank_avg": 0.21042832732200623, "step": 1205, "valid_targets_mean": 5545.3, "valid_targets_min": 701 }, { "epoch": 1.7872968980797637, "grad_norm": 0.45448533560080073, "learning_rate": 3.7139761978819625e-05, "loss": 0.2369, "loss_nan_ranks": 0, "loss_rank_avg": 0.27311086654663086, "step": 1210, "valid_targets_mean": 5298.8, "valid_targets_min": 628 }, { "epoch": 1.7946824224519942, "grad_norm": 0.4157213284903144, "learning_rate": 3.7101686231426145e-05, "loss": 0.2111, "loss_nan_ranks": 0, "loss_rank_avg": 0.21213330328464508, "step": 1215, "valid_targets_mean": 5659.4, "valid_targets_min": 830 }, { "epoch": 1.8020679468242244, "grad_norm": 0.3921888627239872, "learning_rate": 3.706337850959736e-05, "loss": 0.2073, "loss_nan_ranks": 0, "loss_rank_avg": 0.20621275901794434, "step": 1220, "valid_targets_mean": 6066.2, "valid_targets_min": 679 }, { "epoch": 1.809453471196455, "grad_norm": 0.393703088132589, "learning_rate": 3.702483933295524e-05, "loss": 0.2038, "loss_nan_ranks": 0, "loss_rank_avg": 0.20170754194259644, "step": 1225, "valid_targets_mean": 5131.7, "valid_targets_min": 594 }, { "epoch": 1.8168389955686854, "grad_norm": 0.429085603448917, "learning_rate": 3.698606922426133e-05, "loss": 0.1961, "loss_nan_ranks": 0, "loss_rank_avg": 0.21911361813545227, "step": 1230, "valid_targets_mean": 6525.8, "valid_targets_min": 673 }, { "epoch": 1.8242245199409157, "grad_norm": 0.41690498546700655, "learning_rate": 3.694706870940961e-05, "loss": 0.2107, "loss_nan_ranks": 0, "loss_rank_avg": 0.20087522268295288, "step": 1235, "valid_targets_mean": 5197.6, "valid_targets_min": 656 }, { "epoch": 1.8316100443131462, "grad_norm": 0.4214260567191511, "learning_rate": 3.690783831741942e-05, "loss": 0.1988, "loss_nan_ranks": 0, "loss_rank_avg": 0.24707287549972534, "step": 1240, "valid_targets_mean": 5131.9, "valid_targets_min": 642 }, { "epoch": 1.8389955686853767, "grad_norm": 0.42497684417714315, "learning_rate": 3.686837858042821e-05, "loss": 0.2155, "loss_nan_ranks": 0, "loss_rank_avg": 0.2418084293603897, "step": 1245, "valid_targets_mean": 6411.4, "valid_targets_min": 726 }, { "epoch": 1.846381093057607, "grad_norm": 0.43456506500215386, "learning_rate": 3.6828690033684394e-05, "loss": 0.205, "loss_nan_ranks": 0, "loss_rank_avg": 0.23421086370944977, "step": 1250, "valid_targets_mean": 4884.8, "valid_targets_min": 637 }, { "epoch": 1.8537666174298375, "grad_norm": 0.3590270619837384, "learning_rate": 3.678877321554003e-05, "loss": 0.2317, "loss_nan_ranks": 0, "loss_rank_avg": 0.19189848005771637, "step": 1255, "valid_targets_mean": 6340.3, "valid_targets_min": 588 }, { "epoch": 1.861152141802068, "grad_norm": 0.4491792252049705, "learning_rate": 3.674862866744358e-05, "loss": 0.2238, "loss_nan_ranks": 0, "loss_rank_avg": 0.23957936465740204, "step": 1260, "valid_targets_mean": 4542.8, "valid_targets_min": 638 }, { "epoch": 1.8685376661742983, "grad_norm": 0.41595374872963425, "learning_rate": 3.6708256933932485e-05, "loss": 0.1888, "loss_nan_ranks": 0, "loss_rank_avg": 0.19980810582637787, "step": 1265, "valid_targets_mean": 5785.6, "valid_targets_min": 379 }, { "epoch": 1.8759231905465288, "grad_norm": 0.47288076543534235, "learning_rate": 3.6667658562625867e-05, "loss": 0.2308, "loss_nan_ranks": 0, "loss_rank_avg": 0.2654092311859131, "step": 1270, "valid_targets_mean": 5471.1, "valid_targets_min": 666 }, { "epoch": 1.8833087149187593, "grad_norm": 0.38192384234870763, "learning_rate": 3.662683410421703e-05, "loss": 0.1889, "loss_nan_ranks": 0, "loss_rank_avg": 0.19015946984291077, "step": 1275, "valid_targets_mean": 5607.4, "valid_targets_min": 810 }, { "epoch": 1.8906942392909896, "grad_norm": 0.4085790502454245, "learning_rate": 3.6585784112466034e-05, "loss": 0.2145, "loss_nan_ranks": 0, "loss_rank_avg": 0.23992851376533508, "step": 1280, "valid_targets_mean": 5566.8, "valid_targets_min": 706 }, { "epoch": 1.89807976366322, "grad_norm": 0.3923685608209056, "learning_rate": 3.6544509144192153e-05, "loss": 0.2186, "loss_nan_ranks": 0, "loss_rank_avg": 0.19036059081554413, "step": 1285, "valid_targets_mean": 5585.4, "valid_targets_min": 766 }, { "epoch": 1.9054652880354506, "grad_norm": 0.460825966848905, "learning_rate": 3.650300975926635e-05, "loss": 0.2309, "loss_nan_ranks": 0, "loss_rank_avg": 0.20123234391212463, "step": 1290, "valid_targets_mean": 4738.8, "valid_targets_min": 476 }, { "epoch": 1.9128508124076808, "grad_norm": 0.46958242857442417, "learning_rate": 3.646128652060367e-05, "loss": 0.2147, "loss_nan_ranks": 0, "loss_rank_avg": 0.20810635387897491, "step": 1295, "valid_targets_mean": 4939.5, "valid_targets_min": 640 }, { "epoch": 1.9202363367799113, "grad_norm": 0.513107015645425, "learning_rate": 3.6419339994155596e-05, "loss": 0.2294, "loss_nan_ranks": 0, "loss_rank_avg": 0.23249667882919312, "step": 1300, "valid_targets_mean": 3900.5, "valid_targets_min": 512 }, { "epoch": 1.9276218611521418, "grad_norm": 0.41491988804017377, "learning_rate": 3.637717074890238e-05, "loss": 0.1856, "loss_nan_ranks": 0, "loss_rank_avg": 0.20350153744220734, "step": 1305, "valid_targets_mean": 5207.5, "valid_targets_min": 687 }, { "epoch": 1.9350073855243721, "grad_norm": 0.3852016695481521, "learning_rate": 3.633477935684532e-05, "loss": 0.1985, "loss_nan_ranks": 0, "loss_rank_avg": 0.16912466287612915, "step": 1310, "valid_targets_mean": 5948.2, "valid_targets_min": 558 }, { "epoch": 1.9423929098966026, "grad_norm": 0.47994385762704583, "learning_rate": 3.629216639299903e-05, "loss": 0.2023, "loss_nan_ranks": 0, "loss_rank_avg": 0.2138756513595581, "step": 1315, "valid_targets_mean": 4660.0, "valid_targets_min": 546 }, { "epoch": 1.9497784342688331, "grad_norm": 0.43044739199814863, "learning_rate": 3.624933243538359e-05, "loss": 0.2237, "loss_nan_ranks": 0, "loss_rank_avg": 0.20759987831115723, "step": 1320, "valid_targets_mean": 4612.2, "valid_targets_min": 586 }, { "epoch": 1.9571639586410634, "grad_norm": 0.44206360398309225, "learning_rate": 3.6206278065016744e-05, "loss": 0.1863, "loss_nan_ranks": 0, "loss_rank_avg": 0.20062926411628723, "step": 1325, "valid_targets_mean": 4257.2, "valid_targets_min": 474 }, { "epoch": 1.964549483013294, "grad_norm": 0.832328393558017, "learning_rate": 3.616300386590601e-05, "loss": 0.2003, "loss_nan_ranks": 0, "loss_rank_avg": 0.2263094186782837, "step": 1330, "valid_targets_mean": 3523.4, "valid_targets_min": 320 }, { "epoch": 1.9719350073855244, "grad_norm": 0.5608605363552897, "learning_rate": 3.6119510425040746e-05, "loss": 0.2153, "loss_nan_ranks": 0, "loss_rank_avg": 0.2241973727941513, "step": 1335, "valid_targets_mean": 3184.9, "valid_targets_min": 400 }, { "epoch": 1.9793205317577547, "grad_norm": 0.42827418469595757, "learning_rate": 3.6075798332384205e-05, "loss": 0.2075, "loss_nan_ranks": 0, "loss_rank_avg": 0.21591341495513916, "step": 1340, "valid_targets_mean": 5014.1, "valid_targets_min": 703 }, { "epoch": 1.9867060561299852, "grad_norm": 0.4376829994779159, "learning_rate": 3.603186818086552e-05, "loss": 0.2229, "loss_nan_ranks": 0, "loss_rank_avg": 0.24252906441688538, "step": 1345, "valid_targets_mean": 5612.9, "valid_targets_min": 843 }, { "epoch": 1.9940915805022157, "grad_norm": 0.48296281574524147, "learning_rate": 3.598772056637166e-05, "loss": 0.2326, "loss_nan_ranks": 0, "loss_rank_avg": 0.2911834716796875, "step": 1350, "valid_targets_mean": 5862.9, "valid_targets_min": 542 }, { "epoch": 2.001477104874446, "grad_norm": 0.4285021994401378, "learning_rate": 3.594335608773937e-05, "loss": 0.2059, "loss_nan_ranks": 0, "loss_rank_avg": 0.17348650097846985, "step": 1355, "valid_targets_mean": 5699.8, "valid_targets_min": 622 }, { "epoch": 2.0088626292466767, "grad_norm": 0.5571499078773812, "learning_rate": 3.589877534674702e-05, "loss": 0.2235, "loss_nan_ranks": 0, "loss_rank_avg": 0.21984922885894775, "step": 1360, "valid_targets_mean": 4844.9, "valid_targets_min": 310 }, { "epoch": 2.016248153618907, "grad_norm": 0.4762775499228357, "learning_rate": 3.585397894810645e-05, "loss": 0.2174, "loss_nan_ranks": 0, "loss_rank_avg": 0.2565491497516632, "step": 1365, "valid_targets_mean": 5172.8, "valid_targets_min": 531 }, { "epoch": 2.0236336779911372, "grad_norm": 0.4890064307141238, "learning_rate": 3.580896749945478e-05, "loss": 0.1871, "loss_nan_ranks": 0, "loss_rank_avg": 0.198519766330719, "step": 1370, "valid_targets_mean": 5031.6, "valid_targets_min": 709 }, { "epoch": 2.031019202363368, "grad_norm": 0.42188127103720335, "learning_rate": 3.576374161134614e-05, "loss": 0.1924, "loss_nan_ranks": 0, "loss_rank_avg": 0.17222025990486145, "step": 1375, "valid_targets_mean": 5100.7, "valid_targets_min": 506 }, { "epoch": 2.0384047267355982, "grad_norm": 0.4032153526008752, "learning_rate": 3.571830189724344e-05, "loss": 0.2007, "loss_nan_ranks": 0, "loss_rank_avg": 0.22092564404010773, "step": 1380, "valid_targets_mean": 6401.4, "valid_targets_min": 733 }, { "epoch": 2.0457902511078285, "grad_norm": 0.4090149314677475, "learning_rate": 3.5672648973509975e-05, "loss": 0.2037, "loss_nan_ranks": 0, "loss_rank_avg": 0.19857646524906158, "step": 1385, "valid_targets_mean": 5839.8, "valid_targets_min": 589 }, { "epoch": 2.0531757754800593, "grad_norm": 0.4666629189772267, "learning_rate": 3.5626783459401136e-05, "loss": 0.1969, "loss_nan_ranks": 0, "loss_rank_avg": 0.22908130288124084, "step": 1390, "valid_targets_mean": 4732.4, "valid_targets_min": 481 }, { "epoch": 2.0605612998522895, "grad_norm": 0.5167728208836535, "learning_rate": 3.558070597705597e-05, "loss": 0.2147, "loss_nan_ranks": 0, "loss_rank_avg": 0.30561476945877075, "step": 1395, "valid_targets_mean": 5980.4, "valid_targets_min": 499 }, { "epoch": 2.06794682422452, "grad_norm": 0.4957521107813994, "learning_rate": 3.553441715148874e-05, "loss": 0.2013, "loss_nan_ranks": 0, "loss_rank_avg": 0.24766743183135986, "step": 1400, "valid_targets_mean": 5423.2, "valid_targets_min": 636 }, { "epoch": 2.0753323485967505, "grad_norm": 0.5065232042372999, "learning_rate": 3.5487917610580464e-05, "loss": 0.1913, "loss_nan_ranks": 0, "loss_rank_avg": 0.19253401458263397, "step": 1405, "valid_targets_mean": 4459.0, "valid_targets_min": 731 }, { "epoch": 2.082717872968981, "grad_norm": 0.4366761703530371, "learning_rate": 3.5441207985070405e-05, "loss": 0.2008, "loss_nan_ranks": 0, "loss_rank_avg": 0.20609664916992188, "step": 1410, "valid_targets_mean": 5449.8, "valid_targets_min": 973 }, { "epoch": 2.090103397341211, "grad_norm": 0.3956592099323369, "learning_rate": 3.5394288908547476e-05, "loss": 0.2039, "loss_nan_ranks": 0, "loss_rank_avg": 0.1563621610403061, "step": 1415, "valid_targets_mean": 5519.1, "valid_targets_min": 520 }, { "epoch": 2.097488921713442, "grad_norm": 0.5353026127089262, "learning_rate": 3.534716101744168e-05, "loss": 0.1847, "loss_nan_ranks": 0, "loss_rank_avg": 0.1830843836069107, "step": 1420, "valid_targets_mean": 3676.1, "valid_targets_min": 541 }, { "epoch": 2.104874446085672, "grad_norm": 0.4240842603893816, "learning_rate": 3.529982495101549e-05, "loss": 0.2007, "loss_nan_ranks": 0, "loss_rank_avg": 0.1899888962507248, "step": 1425, "valid_targets_mean": 5484.6, "valid_targets_min": 573 }, { "epoch": 2.1122599704579024, "grad_norm": 0.4026373876082126, "learning_rate": 3.5252281351355124e-05, "loss": 0.1796, "loss_nan_ranks": 0, "loss_rank_avg": 0.18199166655540466, "step": 1430, "valid_targets_mean": 5762.3, "valid_targets_min": 564 }, { "epoch": 2.119645494830133, "grad_norm": 0.40632759254314066, "learning_rate": 3.520453086336188e-05, "loss": 0.2097, "loss_nan_ranks": 0, "loss_rank_avg": 0.1754504293203354, "step": 1435, "valid_targets_mean": 5398.9, "valid_targets_min": 642 }, { "epoch": 2.1270310192023634, "grad_norm": 0.35808057513210484, "learning_rate": 3.515657413474339e-05, "loss": 0.1778, "loss_nan_ranks": 0, "loss_rank_avg": 0.13614241778850555, "step": 1440, "valid_targets_mean": 6742.3, "valid_targets_min": 736 }, { "epoch": 2.1344165435745936, "grad_norm": 0.4139451850923316, "learning_rate": 3.5108411816004796e-05, "loss": 0.1791, "loss_nan_ranks": 0, "loss_rank_avg": 0.15198799967765808, "step": 1445, "valid_targets_mean": 4605.1, "valid_targets_min": 696 }, { "epoch": 2.1418020679468244, "grad_norm": 0.4487084052336881, "learning_rate": 3.506004456043997e-05, "loss": 0.2004, "loss_nan_ranks": 0, "loss_rank_avg": 0.18390825390815735, "step": 1450, "valid_targets_mean": 4883.0, "valid_targets_min": 631 }, { "epoch": 2.1491875923190547, "grad_norm": 0.4525728518238653, "learning_rate": 3.501147302412263e-05, "loss": 0.2171, "loss_nan_ranks": 0, "loss_rank_avg": 0.22244812548160553, "step": 1455, "valid_targets_mean": 4889.0, "valid_targets_min": 640 }, { "epoch": 2.156573116691285, "grad_norm": 0.4649134318287312, "learning_rate": 3.496269786589743e-05, "loss": 0.2049, "loss_nan_ranks": 0, "loss_rank_avg": 0.19458895921707153, "step": 1460, "valid_targets_mean": 5381.3, "valid_targets_min": 727 }, { "epoch": 2.1639586410635157, "grad_norm": 0.3972438491459193, "learning_rate": 3.491371974737105e-05, "loss": 0.2172, "loss_nan_ranks": 0, "loss_rank_avg": 0.19966194033622742, "step": 1465, "valid_targets_mean": 6120.7, "valid_targets_min": 289 }, { "epoch": 2.171344165435746, "grad_norm": 0.4119929448789575, "learning_rate": 3.486453933290321e-05, "loss": 0.2125, "loss_nan_ranks": 0, "loss_rank_avg": 0.2048000693321228, "step": 1470, "valid_targets_mean": 5923.5, "valid_targets_min": 695 }, { "epoch": 2.178729689807976, "grad_norm": 0.43265541786608985, "learning_rate": 3.481515728959764e-05, "loss": 0.2107, "loss_nan_ranks": 0, "loss_rank_avg": 0.19329239428043365, "step": 1475, "valid_targets_mean": 5209.0, "valid_targets_min": 559 }, { "epoch": 2.186115214180207, "grad_norm": 0.726326713865377, "learning_rate": 3.4765574287293064e-05, "loss": 0.1876, "loss_nan_ranks": 0, "loss_rank_avg": 0.22369539737701416, "step": 1480, "valid_targets_mean": 3706.1, "valid_targets_min": 348 }, { "epoch": 2.193500738552437, "grad_norm": 0.4285241209732484, "learning_rate": 3.47157909985541e-05, "loss": 0.1874, "loss_nan_ranks": 0, "loss_rank_avg": 0.1844395101070404, "step": 1485, "valid_targets_mean": 5193.9, "valid_targets_min": 655 }, { "epoch": 2.2008862629246675, "grad_norm": 0.3568827709297404, "learning_rate": 3.466580809866213e-05, "loss": 0.1898, "loss_nan_ranks": 0, "loss_rank_avg": 0.16118377447128296, "step": 1490, "valid_targets_mean": 5637.3, "valid_targets_min": 616 }, { "epoch": 2.208271787296898, "grad_norm": 0.40674844742126304, "learning_rate": 3.461562626560613e-05, "loss": 0.2318, "loss_nan_ranks": 0, "loss_rank_avg": 0.1650213599205017, "step": 1495, "valid_targets_mean": 5220.6, "valid_targets_min": 578 }, { "epoch": 2.2156573116691285, "grad_norm": 0.40044238504347957, "learning_rate": 3.456524618007352e-05, "loss": 0.179, "loss_nan_ranks": 0, "loss_rank_avg": 0.18922209739685059, "step": 1500, "valid_targets_mean": 5842.4, "valid_targets_min": 680 }, { "epoch": 2.2230428360413588, "grad_norm": 0.46819866949961275, "learning_rate": 3.451466852544087e-05, "loss": 0.2117, "loss_nan_ranks": 0, "loss_rank_avg": 0.22434237599372864, "step": 1505, "valid_targets_mean": 4454.3, "valid_targets_min": 585 }, { "epoch": 2.2304283604135895, "grad_norm": 0.358887635540945, "learning_rate": 3.446389398776468e-05, "loss": 0.1845, "loss_nan_ranks": 0, "loss_rank_avg": 0.16988348960876465, "step": 1510, "valid_targets_mean": 6279.1, "valid_targets_min": 710 }, { "epoch": 2.2378138847858198, "grad_norm": 0.40829806216099035, "learning_rate": 3.441292325577204e-05, "loss": 0.1951, "loss_nan_ranks": 0, "loss_rank_avg": 0.1971379816532135, "step": 1515, "valid_targets_mean": 6296.1, "valid_targets_min": 822 }, { "epoch": 2.24519940915805, "grad_norm": 0.40160684926373197, "learning_rate": 3.436175702085132e-05, "loss": 0.2108, "loss_nan_ranks": 0, "loss_rank_avg": 0.17605721950531006, "step": 1520, "valid_targets_mean": 5582.8, "valid_targets_min": 486 }, { "epoch": 2.2525849335302808, "grad_norm": 0.5229993777219565, "learning_rate": 3.431039597704275e-05, "loss": 0.2142, "loss_nan_ranks": 0, "loss_rank_avg": 0.23692980408668518, "step": 1525, "valid_targets_mean": 4018.5, "valid_targets_min": 479 }, { "epoch": 2.259970457902511, "grad_norm": 0.6849225115875504, "learning_rate": 3.425884082102904e-05, "loss": 0.1937, "loss_nan_ranks": 0, "loss_rank_avg": 0.28416967391967773, "step": 1530, "valid_targets_mean": 2544.4, "valid_targets_min": 400 }, { "epoch": 2.2673559822747413, "grad_norm": 0.4227339555943465, "learning_rate": 3.4207092252125934e-05, "loss": 0.1779, "loss_nan_ranks": 0, "loss_rank_avg": 0.20092085003852844, "step": 1535, "valid_targets_mean": 5492.9, "valid_targets_min": 654 }, { "epoch": 2.274741506646972, "grad_norm": 0.4345429425277249, "learning_rate": 3.415515097227269e-05, "loss": 0.2065, "loss_nan_ranks": 0, "loss_rank_avg": 0.21635641157627106, "step": 1540, "valid_targets_mean": 5030.1, "valid_targets_min": 489 }, { "epoch": 2.2821270310192023, "grad_norm": 0.4693229139379586, "learning_rate": 3.4103017686022584e-05, "loss": 0.2053, "loss_nan_ranks": 0, "loss_rank_avg": 0.2364303320646286, "step": 1545, "valid_targets_mean": 4731.6, "valid_targets_min": 562 }, { "epoch": 2.2895125553914326, "grad_norm": 0.38590061526432556, "learning_rate": 3.4050693100533334e-05, "loss": 0.1837, "loss_nan_ranks": 0, "loss_rank_avg": 0.16934344172477722, "step": 1550, "valid_targets_mean": 6597.2, "valid_targets_min": 590 }, { "epoch": 2.2968980797636633, "grad_norm": 0.3661821378036947, "learning_rate": 3.399817792555756e-05, "loss": 0.1917, "loss_nan_ranks": 0, "loss_rank_avg": 0.15037478506565094, "step": 1555, "valid_targets_mean": 5859.4, "valid_targets_min": 620 }, { "epoch": 2.3042836041358936, "grad_norm": 0.5749118981748869, "learning_rate": 3.394547287343307e-05, "loss": 0.1901, "loss_nan_ranks": 0, "loss_rank_avg": 0.21516035497188568, "step": 1560, "valid_targets_mean": 3785.1, "valid_targets_min": 308 }, { "epoch": 2.311669128508124, "grad_norm": 0.5222981613404089, "learning_rate": 3.389257865907329e-05, "loss": 0.2128, "loss_nan_ranks": 0, "loss_rank_avg": 0.2672545909881592, "step": 1565, "valid_targets_mean": 4263.8, "valid_targets_min": 562 }, { "epoch": 2.3190546528803546, "grad_norm": 0.39866742666796046, "learning_rate": 3.383949599995747e-05, "loss": 0.2183, "loss_nan_ranks": 0, "loss_rank_avg": 0.20826904475688934, "step": 1570, "valid_targets_mean": 6104.1, "valid_targets_min": 490 }, { "epoch": 2.326440177252585, "grad_norm": 0.5020262347414661, "learning_rate": 3.378622561612105e-05, "loss": 0.2017, "loss_nan_ranks": 0, "loss_rank_avg": 0.17644500732421875, "step": 1575, "valid_targets_mean": 4395.3, "valid_targets_min": 535 }, { "epoch": 2.333825701624815, "grad_norm": 0.48126474522159196, "learning_rate": 3.3732768230145834e-05, "loss": 0.1992, "loss_nan_ranks": 0, "loss_rank_avg": 0.2069077491760254, "step": 1580, "valid_targets_mean": 4419.8, "valid_targets_min": 617 }, { "epoch": 2.341211225997046, "grad_norm": 0.35388137699572986, "learning_rate": 3.3679124567150195e-05, "loss": 0.1673, "loss_nan_ranks": 0, "loss_rank_avg": 0.15227368474006653, "step": 1585, "valid_targets_mean": 6494.9, "valid_targets_min": 682 }, { "epoch": 2.348596750369276, "grad_norm": 0.3840750165781411, "learning_rate": 3.362529535477923e-05, "loss": 0.2158, "loss_nan_ranks": 0, "loss_rank_avg": 0.170127272605896, "step": 1590, "valid_targets_mean": 6790.0, "valid_targets_min": 1006 }, { "epoch": 2.3559822747415065, "grad_norm": 0.5434507333346537, "learning_rate": 3.357128132319494e-05, "loss": 0.2114, "loss_nan_ranks": 0, "loss_rank_avg": 0.20456504821777344, "step": 1595, "valid_targets_mean": 3017.6, "valid_targets_min": 320 }, { "epoch": 2.363367799113737, "grad_norm": 0.4069694394082241, "learning_rate": 3.3517083205066275e-05, "loss": 0.2013, "loss_nan_ranks": 0, "loss_rank_avg": 0.19211331009864807, "step": 1600, "valid_targets_mean": 5513.6, "valid_targets_min": 681 }, { "epoch": 2.3707533234859675, "grad_norm": 0.41784163330661017, "learning_rate": 3.34627017355592e-05, "loss": 0.199, "loss_nan_ranks": 0, "loss_rank_avg": 0.18239319324493408, "step": 1605, "valid_targets_mean": 4941.2, "valid_targets_min": 540 }, { "epoch": 2.3781388478581977, "grad_norm": 0.39238043020867075, "learning_rate": 3.340813765232675e-05, "loss": 0.2059, "loss_nan_ranks": 0, "loss_rank_avg": 0.1841011941432953, "step": 1610, "valid_targets_mean": 5700.5, "valid_targets_min": 517 }, { "epoch": 2.3855243722304285, "grad_norm": 0.4201145604723071, "learning_rate": 3.3353391695499e-05, "loss": 0.2, "loss_nan_ranks": 0, "loss_rank_avg": 0.20100927352905273, "step": 1615, "valid_targets_mean": 5057.5, "valid_targets_min": 491 }, { "epoch": 2.3929098966026587, "grad_norm": 0.41846525077178565, "learning_rate": 3.329846460767305e-05, "loss": 0.1919, "loss_nan_ranks": 0, "loss_rank_avg": 0.20187963545322418, "step": 1620, "valid_targets_mean": 4845.5, "valid_targets_min": 523 }, { "epoch": 2.4002954209748895, "grad_norm": 0.40798367807953856, "learning_rate": 3.324335713390292e-05, "loss": 0.1984, "loss_nan_ranks": 0, "loss_rank_avg": 0.15751047432422638, "step": 1625, "valid_targets_mean": 5196.8, "valid_targets_min": 314 }, { "epoch": 2.4076809453471197, "grad_norm": 0.4061768747540575, "learning_rate": 3.3188070021689464e-05, "loss": 0.2019, "loss_nan_ranks": 0, "loss_rank_avg": 0.17988130450248718, "step": 1630, "valid_targets_mean": 5505.8, "valid_targets_min": 605 }, { "epoch": 2.41506646971935, "grad_norm": 0.46242647917420265, "learning_rate": 3.313260402097024e-05, "loss": 0.2236, "loss_nan_ranks": 0, "loss_rank_avg": 0.2638862729072571, "step": 1635, "valid_targets_mean": 5006.3, "valid_targets_min": 510 }, { "epoch": 2.4224519940915803, "grad_norm": 0.49810161190363844, "learning_rate": 3.307695988410931e-05, "loss": 0.2147, "loss_nan_ranks": 0, "loss_rank_avg": 0.2404661476612091, "step": 1640, "valid_targets_mean": 5057.5, "valid_targets_min": 870 }, { "epoch": 2.429837518463811, "grad_norm": 0.49091951535741857, "learning_rate": 3.302113836588705e-05, "loss": 0.1857, "loss_nan_ranks": 0, "loss_rank_avg": 0.21287889778614044, "step": 1645, "valid_targets_mean": 3981.2, "valid_targets_min": 336 }, { "epoch": 2.4372230428360413, "grad_norm": 0.570596929329595, "learning_rate": 3.296514022348991e-05, "loss": 0.2003, "loss_nan_ranks": 0, "loss_rank_avg": 0.22047343850135803, "step": 1650, "valid_targets_mean": 5769.9, "valid_targets_min": 747 }, { "epoch": 2.444608567208272, "grad_norm": 0.45209355569835663, "learning_rate": 3.2908966216500164e-05, "loss": 0.1951, "loss_nan_ranks": 0, "loss_rank_avg": 0.17555588483810425, "step": 1655, "valid_targets_mean": 5262.3, "valid_targets_min": 642 }, { "epoch": 2.4519940915805023, "grad_norm": 0.5750894848392384, "learning_rate": 3.2852617106885554e-05, "loss": 0.1904, "loss_nan_ranks": 0, "loss_rank_avg": 0.24034175276756287, "step": 1660, "valid_targets_mean": 2897.2, "valid_targets_min": 553 }, { "epoch": 2.4593796159527326, "grad_norm": 0.44533416665746417, "learning_rate": 3.279609365898903e-05, "loss": 0.1968, "loss_nan_ranks": 0, "loss_rank_avg": 0.18521445989608765, "step": 1665, "valid_targets_mean": 4074.0, "valid_targets_min": 559 }, { "epoch": 2.466765140324963, "grad_norm": 0.3666396515845462, "learning_rate": 3.273939663951828e-05, "loss": 0.18, "loss_nan_ranks": 0, "loss_rank_avg": 0.1782068908214569, "step": 1670, "valid_targets_mean": 6837.4, "valid_targets_min": 600 }, { "epoch": 2.4741506646971936, "grad_norm": 0.3899278710986994, "learning_rate": 3.268252681753546e-05, "loss": 0.2211, "loss_nan_ranks": 0, "loss_rank_avg": 0.2376466989517212, "step": 1675, "valid_targets_mean": 6254.3, "valid_targets_min": 784 }, { "epoch": 2.481536189069424, "grad_norm": 0.4081436844860877, "learning_rate": 3.262548496444664e-05, "loss": 0.1934, "loss_nan_ranks": 0, "loss_rank_avg": 0.19119364023208618, "step": 1680, "valid_targets_mean": 5165.9, "valid_targets_min": 669 }, { "epoch": 2.4889217134416546, "grad_norm": 0.3782408782114525, "learning_rate": 3.25682718539914e-05, "loss": 0.1849, "loss_nan_ranks": 0, "loss_rank_avg": 0.1731245368719101, "step": 1685, "valid_targets_mean": 6192.8, "valid_targets_min": 844 }, { "epoch": 2.496307237813885, "grad_norm": 0.5214383122274813, "learning_rate": 3.251088826223235e-05, "loss": 0.2174, "loss_nan_ranks": 0, "loss_rank_avg": 0.2473294734954834, "step": 1690, "valid_targets_mean": 3865.7, "valid_targets_min": 553 }, { "epoch": 2.503692762186115, "grad_norm": 0.48463478522919884, "learning_rate": 3.245333496754455e-05, "loss": 0.2039, "loss_nan_ranks": 0, "loss_rank_avg": 0.2620091736316681, "step": 1695, "valid_targets_mean": 4272.6, "valid_targets_min": 713 }, { "epoch": 2.5110782865583454, "grad_norm": 0.48594394962497084, "learning_rate": 3.239561275060501e-05, "loss": 0.2043, "loss_nan_ranks": 0, "loss_rank_avg": 0.23510144650936127, "step": 1700, "valid_targets_mean": 4500.4, "valid_targets_min": 516 }, { "epoch": 2.518463810930576, "grad_norm": 0.36026021621317095, "learning_rate": 3.233772239438206e-05, "loss": 0.198, "loss_nan_ranks": 0, "loss_rank_avg": 0.24801120162010193, "step": 1705, "valid_targets_mean": 7072.2, "valid_targets_min": 775 }, { "epoch": 2.5258493353028064, "grad_norm": 0.5691361574973622, "learning_rate": 3.2279664684124724e-05, "loss": 0.1969, "loss_nan_ranks": 0, "loss_rank_avg": 0.24925799667835236, "step": 1710, "valid_targets_mean": 4504.7, "valid_targets_min": 377 }, { "epoch": 2.533234859675037, "grad_norm": 0.399794469998823, "learning_rate": 3.22214404073521e-05, "loss": 0.1825, "loss_nan_ranks": 0, "loss_rank_avg": 0.16049984097480774, "step": 1715, "valid_targets_mean": 6125.9, "valid_targets_min": 497 }, { "epoch": 2.5406203840472674, "grad_norm": 0.41442596267228626, "learning_rate": 3.216305035384268e-05, "loss": 0.1826, "loss_nan_ranks": 0, "loss_rank_avg": 0.17098268866539001, "step": 1720, "valid_targets_mean": 5603.4, "valid_targets_min": 686 }, { "epoch": 2.5480059084194977, "grad_norm": 0.4162604595759132, "learning_rate": 3.210449531562361e-05, "loss": 0.1942, "loss_nan_ranks": 0, "loss_rank_avg": 0.16771002113819122, "step": 1725, "valid_targets_mean": 4639.4, "valid_targets_min": 552 }, { "epoch": 2.555391432791728, "grad_norm": 0.38874831725964026, "learning_rate": 3.2045776086959945e-05, "loss": 0.2123, "loss_nan_ranks": 0, "loss_rank_avg": 0.17640861868858337, "step": 1730, "valid_targets_mean": 5082.9, "valid_targets_min": 125 }, { "epoch": 2.5627769571639587, "grad_norm": 0.36315151583426797, "learning_rate": 3.1986893464343913e-05, "loss": 0.213, "loss_nan_ranks": 0, "loss_rank_avg": 0.1778927743434906, "step": 1735, "valid_targets_mean": 5937.7, "valid_targets_min": 826 }, { "epoch": 2.570162481536189, "grad_norm": 0.44124180419701514, "learning_rate": 3.192784824648405e-05, "loss": 0.2125, "loss_nan_ranks": 0, "loss_rank_avg": 0.22931697964668274, "step": 1740, "valid_targets_mean": 4890.1, "valid_targets_min": 436 }, { "epoch": 2.5775480059084197, "grad_norm": 0.4646453073195735, "learning_rate": 3.186864123429443e-05, "loss": 0.2027, "loss_nan_ranks": 0, "loss_rank_avg": 0.1924285590648651, "step": 1745, "valid_targets_mean": 4559.1, "valid_targets_min": 626 }, { "epoch": 2.58493353028065, "grad_norm": 0.3769877916171565, "learning_rate": 3.180927323088377e-05, "loss": 0.2004, "loss_nan_ranks": 0, "loss_rank_avg": 0.19486212730407715, "step": 1750, "valid_targets_mean": 7005.6, "valid_targets_min": 873 }, { "epoch": 2.5923190546528803, "grad_norm": 0.4122861646475437, "learning_rate": 3.1749745041544535e-05, "loss": 0.202, "loss_nan_ranks": 0, "loss_rank_avg": 0.1655203104019165, "step": 1755, "valid_targets_mean": 5165.2, "valid_targets_min": 362 }, { "epoch": 2.5997045790251105, "grad_norm": 0.46795037129236655, "learning_rate": 3.169005747374202e-05, "loss": 0.2191, "loss_nan_ranks": 0, "loss_rank_avg": 0.210823655128479, "step": 1760, "valid_targets_mean": 4634.7, "valid_targets_min": 557 }, { "epoch": 2.6070901033973413, "grad_norm": 0.40305455364946613, "learning_rate": 3.163021133710339e-05, "loss": 0.1804, "loss_nan_ranks": 0, "loss_rank_avg": 0.19001798331737518, "step": 1765, "valid_targets_mean": 6316.5, "valid_targets_min": 515 }, { "epoch": 2.6144756277695715, "grad_norm": 0.37687379981581354, "learning_rate": 3.1570207443406715e-05, "loss": 0.185, "loss_nan_ranks": 0, "loss_rank_avg": 0.156022310256958, "step": 1770, "valid_targets_mean": 5602.8, "valid_targets_min": 636 }, { "epoch": 2.6218611521418023, "grad_norm": 0.41470758369539723, "learning_rate": 3.1510046606569944e-05, "loss": 0.1782, "loss_nan_ranks": 0, "loss_rank_avg": 0.1826784908771515, "step": 1775, "valid_targets_mean": 5436.1, "valid_targets_min": 541 }, { "epoch": 2.6292466765140325, "grad_norm": 0.3852868541588975, "learning_rate": 3.1449729642639856e-05, "loss": 0.1918, "loss_nan_ranks": 0, "loss_rank_avg": 0.17214235663414001, "step": 1780, "valid_targets_mean": 5589.0, "valid_targets_min": 475 }, { "epoch": 2.636632200886263, "grad_norm": 0.4088176838039698, "learning_rate": 3.138925736978103e-05, "loss": 0.2212, "loss_nan_ranks": 0, "loss_rank_avg": 0.18025021255016327, "step": 1785, "valid_targets_mean": 4904.5, "valid_targets_min": 833 }, { "epoch": 2.644017725258493, "grad_norm": 0.4491076662753666, "learning_rate": 3.132863060826469e-05, "loss": 0.1961, "loss_nan_ranks": 0, "loss_rank_avg": 0.18313133716583252, "step": 1790, "valid_targets_mean": 4372.4, "valid_targets_min": 504 }, { "epoch": 2.651403249630724, "grad_norm": 0.4132101343175699, "learning_rate": 3.126785018045764e-05, "loss": 0.2117, "loss_nan_ranks": 0, "loss_rank_avg": 0.18020716309547424, "step": 1795, "valid_targets_mean": 5285.4, "valid_targets_min": 324 }, { "epoch": 2.658788774002954, "grad_norm": 0.6224525946031296, "learning_rate": 3.120691691081104e-05, "loss": 0.1933, "loss_nan_ranks": 0, "loss_rank_avg": 0.18289199471473694, "step": 1800, "valid_targets_mean": 5814.2, "valid_targets_min": 712 }, { "epoch": 2.666174298375185, "grad_norm": 0.37344081795259465, "learning_rate": 3.1145831625849315e-05, "loss": 0.2139, "loss_nan_ranks": 0, "loss_rank_avg": 0.18605783581733704, "step": 1805, "valid_targets_mean": 6338.0, "valid_targets_min": 708 }, { "epoch": 2.673559822747415, "grad_norm": 0.45469603573341405, "learning_rate": 3.1084595154158814e-05, "loss": 0.1901, "loss_nan_ranks": 0, "loss_rank_avg": 0.20985165238380432, "step": 1810, "valid_targets_mean": 4686.1, "valid_targets_min": 694 }, { "epoch": 2.6809453471196454, "grad_norm": 0.42143425429690434, "learning_rate": 3.1023208326376716e-05, "loss": 0.2089, "loss_nan_ranks": 0, "loss_rank_avg": 0.1601705253124237, "step": 1815, "valid_targets_mean": 5887.0, "valid_targets_min": 629 }, { "epoch": 2.6883308714918757, "grad_norm": 0.4566218104083272, "learning_rate": 3.0961671975179674e-05, "loss": 0.1909, "loss_nan_ranks": 0, "loss_rank_avg": 0.22524869441986084, "step": 1820, "valid_targets_mean": 5187.4, "valid_targets_min": 425 }, { "epoch": 2.6957163958641064, "grad_norm": 0.45904018086003157, "learning_rate": 3.08999869352725e-05, "loss": 0.1894, "loss_nan_ranks": 0, "loss_rank_avg": 0.2111627757549286, "step": 1825, "valid_targets_mean": 4385.9, "valid_targets_min": 476 }, { "epoch": 2.7031019202363367, "grad_norm": 0.3947587132525764, "learning_rate": 3.0838154043376936e-05, "loss": 0.1834, "loss_nan_ranks": 0, "loss_rank_avg": 0.1816597878932953, "step": 1830, "valid_targets_mean": 5509.4, "valid_targets_min": 311 }, { "epoch": 2.7104874446085674, "grad_norm": 0.44429247184816495, "learning_rate": 3.077617413822022e-05, "loss": 0.1815, "loss_nan_ranks": 0, "loss_rank_avg": 0.16769450902938843, "step": 1835, "valid_targets_mean": 5723.1, "valid_targets_min": 650 }, { "epoch": 2.7178729689807977, "grad_norm": 0.39766345484896237, "learning_rate": 3.0714048060523745e-05, "loss": 0.2043, "loss_nan_ranks": 0, "loss_rank_avg": 0.183930903673172, "step": 1840, "valid_targets_mean": 5270.6, "valid_targets_min": 926 }, { "epoch": 2.725258493353028, "grad_norm": 0.36819777572651946, "learning_rate": 3.065177665299166e-05, "loss": 0.2085, "loss_nan_ranks": 0, "loss_rank_avg": 0.18269002437591553, "step": 1845, "valid_targets_mean": 6104.4, "valid_targets_min": 573 }, { "epoch": 2.7326440177252582, "grad_norm": 0.656642708317576, "learning_rate": 3.0589360760299416e-05, "loss": 0.1874, "loss_nan_ranks": 0, "loss_rank_avg": 0.2284368872642517, "step": 1850, "valid_targets_mean": 4357.9, "valid_targets_min": 457 }, { "epoch": 2.740029542097489, "grad_norm": 0.40389665086925014, "learning_rate": 3.052680122908232e-05, "loss": 0.1944, "loss_nan_ranks": 0, "loss_rank_avg": 0.1856120228767395, "step": 1855, "valid_targets_mean": 4957.6, "valid_targets_min": 529 }, { "epoch": 2.7474150664697192, "grad_norm": 0.34197083654429966, "learning_rate": 3.046409890792406e-05, "loss": 0.2, "loss_nan_ranks": 0, "loss_rank_avg": 0.15076898038387299, "step": 1860, "valid_targets_mean": 5943.9, "valid_targets_min": 490 }, { "epoch": 2.75480059084195, "grad_norm": 0.39694434070650186, "learning_rate": 3.040125464734519e-05, "loss": 0.2186, "loss_nan_ranks": 0, "loss_rank_avg": 0.22727245092391968, "step": 1865, "valid_targets_mean": 6380.9, "valid_targets_min": 611 }, { "epoch": 2.7621861152141802, "grad_norm": 0.48955312172318344, "learning_rate": 3.0338269299791573e-05, "loss": 0.1881, "loss_nan_ranks": 0, "loss_rank_avg": 0.18965637683868408, "step": 1870, "valid_targets_mean": 4740.5, "valid_targets_min": 595 }, { "epoch": 2.7695716395864105, "grad_norm": 0.498553979771601, "learning_rate": 3.0275143719622853e-05, "loss": 0.196, "loss_nan_ranks": 0, "loss_rank_avg": 0.18993785977363586, "step": 1875, "valid_targets_mean": 6250.0, "valid_targets_min": 790 }, { "epoch": 2.7769571639586412, "grad_norm": 0.4680949760689842, "learning_rate": 3.0211878763100836e-05, "loss": 0.1958, "loss_nan_ranks": 0, "loss_rank_avg": 0.19833850860595703, "step": 1880, "valid_targets_mean": 4042.8, "valid_targets_min": 639 }, { "epoch": 2.7843426883308715, "grad_norm": 0.6983614556096809, "learning_rate": 3.0148475288377896e-05, "loss": 0.1929, "loss_nan_ranks": 0, "loss_rank_avg": 0.18655887246131897, "step": 1885, "valid_targets_mean": 5421.7, "valid_targets_min": 761 }, { "epoch": 2.791728212703102, "grad_norm": 0.3993729610123753, "learning_rate": 3.0084934155485315e-05, "loss": 0.1941, "loss_nan_ranks": 0, "loss_rank_avg": 0.17627528309822083, "step": 1890, "valid_targets_mean": 5305.3, "valid_targets_min": 598 }, { "epoch": 2.7991137370753325, "grad_norm": 0.3486684335819875, "learning_rate": 3.0021256226321643e-05, "loss": 0.1731, "loss_nan_ranks": 0, "loss_rank_avg": 0.17181184887886047, "step": 1895, "valid_targets_mean": 6981.1, "valid_targets_min": 461 }, { "epoch": 2.806499261447563, "grad_norm": 0.3996801724597566, "learning_rate": 2.995744236464098e-05, "loss": 0.1824, "loss_nan_ranks": 0, "loss_rank_avg": 0.19423222541809082, "step": 1900, "valid_targets_mean": 5607.2, "valid_targets_min": 658 }, { "epoch": 2.813884785819793, "grad_norm": 0.4684471879315951, "learning_rate": 2.9893493436041274e-05, "loss": 0.2038, "loss_nan_ranks": 0, "loss_rank_avg": 0.2360610067844391, "step": 1905, "valid_targets_mean": 4200.7, "valid_targets_min": 726 }, { "epoch": 2.821270310192024, "grad_norm": 0.5224516946852575, "learning_rate": 2.9829410307952577e-05, "loss": 0.1877, "loss_nan_ranks": 0, "loss_rank_avg": 0.18097460269927979, "step": 1910, "valid_targets_mean": 5226.1, "valid_targets_min": 453 }, { "epoch": 2.828655834564254, "grad_norm": 0.3919890597149292, "learning_rate": 2.9765193849625283e-05, "loss": 0.1958, "loss_nan_ranks": 0, "loss_rank_avg": 0.16534635424613953, "step": 1915, "valid_targets_mean": 5494.3, "valid_targets_min": 459 }, { "epoch": 2.8360413589364843, "grad_norm": 0.3195931232516741, "learning_rate": 2.9700844932118334e-05, "loss": 0.1837, "loss_nan_ranks": 0, "loss_rank_avg": 0.1442551165819168, "step": 1920, "valid_targets_mean": 6732.5, "valid_targets_min": 614 }, { "epoch": 2.843426883308715, "grad_norm": 0.42131927060359514, "learning_rate": 2.9636364428287395e-05, "loss": 0.1854, "loss_nan_ranks": 0, "loss_rank_avg": 0.19797298312187195, "step": 1925, "valid_targets_mean": 4944.9, "valid_targets_min": 456 }, { "epoch": 2.8508124076809453, "grad_norm": 0.3873317542623266, "learning_rate": 2.9571753212773028e-05, "loss": 0.2149, "loss_nan_ranks": 0, "loss_rank_avg": 0.17931729555130005, "step": 1930, "valid_targets_mean": 5626.6, "valid_targets_min": 496 }, { "epoch": 2.8581979320531756, "grad_norm": 0.4030896596505125, "learning_rate": 2.9507012161988827e-05, "loss": 0.1995, "loss_nan_ranks": 0, "loss_rank_avg": 0.17033201456069946, "step": 1935, "valid_targets_mean": 6326.3, "valid_targets_min": 768 }, { "epoch": 2.8655834564254064, "grad_norm": 0.4444109946556492, "learning_rate": 2.9442142154109522e-05, "loss": 0.1995, "loss_nan_ranks": 0, "loss_rank_avg": 0.1885213851928711, "step": 1940, "valid_targets_mean": 5517.4, "valid_targets_min": 802 }, { "epoch": 2.8729689807976366, "grad_norm": 0.46145234382410805, "learning_rate": 2.937714406905906e-05, "loss": 0.1889, "loss_nan_ranks": 0, "loss_rank_avg": 0.20272204279899597, "step": 1945, "valid_targets_mean": 5488.1, "valid_targets_min": 656 }, { "epoch": 2.880354505169867, "grad_norm": 0.42923087358401046, "learning_rate": 2.9312018788498714e-05, "loss": 0.2022, "loss_nan_ranks": 0, "loss_rank_avg": 0.19835910201072693, "step": 1950, "valid_targets_mean": 4609.9, "valid_targets_min": 246 }, { "epoch": 2.8877400295420976, "grad_norm": 0.36880559499022475, "learning_rate": 2.924676719581506e-05, "loss": 0.1928, "loss_nan_ranks": 0, "loss_rank_avg": 0.19959020614624023, "step": 1955, "valid_targets_mean": 7206.6, "valid_targets_min": 337 }, { "epoch": 2.895125553914328, "grad_norm": 0.3694784724494498, "learning_rate": 2.9181390176108024e-05, "loss": 0.1957, "loss_nan_ranks": 0, "loss_rank_avg": 0.16610810160636902, "step": 1960, "valid_targets_mean": 5820.9, "valid_targets_min": 743 }, { "epoch": 2.902511078286558, "grad_norm": 0.3748352447951345, "learning_rate": 2.911588861617889e-05, "loss": 0.2003, "loss_nan_ranks": 0, "loss_rank_avg": 0.1821543574333191, "step": 1965, "valid_targets_mean": 6034.1, "valid_targets_min": 257 }, { "epoch": 2.909896602658789, "grad_norm": 0.46557987222831126, "learning_rate": 2.9050263404518254e-05, "loss": 0.2077, "loss_nan_ranks": 0, "loss_rank_avg": 0.2896730303764343, "step": 1970, "valid_targets_mean": 5670.9, "valid_targets_min": 664 }, { "epoch": 2.917282127031019, "grad_norm": 0.45582660198656316, "learning_rate": 2.8984515431293982e-05, "loss": 0.2213, "loss_nan_ranks": 0, "loss_rank_avg": 0.21186470985412598, "step": 1975, "valid_targets_mean": 5415.5, "valid_targets_min": 511 }, { "epoch": 2.9246676514032495, "grad_norm": 0.39058091819087787, "learning_rate": 2.89186455883391e-05, "loss": 0.2232, "loss_nan_ranks": 0, "loss_rank_avg": 0.18955285847187042, "step": 1980, "valid_targets_mean": 5434.4, "valid_targets_min": 675 }, { "epoch": 2.93205317577548, "grad_norm": 0.38016760545252115, "learning_rate": 2.8852654769139774e-05, "loss": 0.2191, "loss_nan_ranks": 0, "loss_rank_avg": 0.243728905916214, "step": 1985, "valid_targets_mean": 6925.2, "valid_targets_min": 673 }, { "epoch": 2.9394387001477105, "grad_norm": 0.546712089772061, "learning_rate": 2.8786543868823104e-05, "loss": 0.1757, "loss_nan_ranks": 0, "loss_rank_avg": 0.17349129915237427, "step": 1990, "valid_targets_mean": 4468.9, "valid_targets_min": 543 }, { "epoch": 2.9468242245199407, "grad_norm": 0.4515115845526151, "learning_rate": 2.8720313784145036e-05, "loss": 0.1934, "loss_nan_ranks": 0, "loss_rank_avg": 0.20189234614372253, "step": 1995, "valid_targets_mean": 4474.2, "valid_targets_min": 495 }, { "epoch": 2.9542097488921715, "grad_norm": 0.3831876618295643, "learning_rate": 2.865396541347818e-05, "loss": 0.1951, "loss_nan_ranks": 0, "loss_rank_avg": 0.15678755939006805, "step": 2000, "valid_targets_mean": 4760.3, "valid_targets_min": 370 }, { "epoch": 2.9615952732644018, "grad_norm": 0.40740457187470347, "learning_rate": 2.8587499656799624e-05, "loss": 0.1897, "loss_nan_ranks": 0, "loss_rank_avg": 0.17568612098693848, "step": 2005, "valid_targets_mean": 4997.9, "valid_targets_min": 742 }, { "epoch": 2.9689807976366325, "grad_norm": 0.3735878296428736, "learning_rate": 2.852091741567874e-05, "loss": 0.2019, "loss_nan_ranks": 0, "loss_rank_avg": 0.21047380566596985, "step": 2010, "valid_targets_mean": 6746.7, "valid_targets_min": 587 }, { "epoch": 2.9763663220088628, "grad_norm": 0.4064437208033243, "learning_rate": 2.8454219593264924e-05, "loss": 0.1963, "loss_nan_ranks": 0, "loss_rank_avg": 0.168643057346344, "step": 2015, "valid_targets_mean": 5444.5, "valid_targets_min": 282 }, { "epoch": 2.983751846381093, "grad_norm": 0.4221057265749455, "learning_rate": 2.8387407094275378e-05, "loss": 0.1799, "loss_nan_ranks": 0, "loss_rank_avg": 0.20394739508628845, "step": 2020, "valid_targets_mean": 5266.9, "valid_targets_min": 790 }, { "epoch": 2.9911373707533233, "grad_norm": 0.35734323137197604, "learning_rate": 2.8320480824982836e-05, "loss": 0.1776, "loss_nan_ranks": 0, "loss_rank_avg": 0.15881027281284332, "step": 2025, "valid_targets_mean": 5607.5, "valid_targets_min": 572 }, { "epoch": 2.998522895125554, "grad_norm": 0.40362443061193043, "learning_rate": 2.825344169320323e-05, "loss": 0.1877, "loss_nan_ranks": 0, "loss_rank_avg": 0.19752827286720276, "step": 2030, "valid_targets_mean": 5551.8, "valid_targets_min": 636 }, { "epoch": 3.0059084194977843, "grad_norm": 0.3483325395168603, "learning_rate": 2.818629060828344e-05, "loss": 0.1654, "loss_nan_ranks": 0, "loss_rank_avg": 0.15444116294384003, "step": 2035, "valid_targets_mean": 6590.1, "valid_targets_min": 2768 }, { "epoch": 3.0132939438700146, "grad_norm": 0.46266772441200416, "learning_rate": 2.811902848108889e-05, "loss": 0.1764, "loss_nan_ranks": 0, "loss_rank_avg": 0.18906280398368835, "step": 2040, "valid_targets_mean": 4889.4, "valid_targets_min": 873 }, { "epoch": 3.0206794682422453, "grad_norm": 0.41227568999635833, "learning_rate": 2.8051656223991274e-05, "loss": 0.1989, "loss_nan_ranks": 0, "loss_rank_avg": 0.16269494593143463, "step": 2045, "valid_targets_mean": 5567.1, "valid_targets_min": 616 }, { "epoch": 3.0280649926144756, "grad_norm": 0.46419141803047215, "learning_rate": 2.798417475085608e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.1930653154850006, "step": 2050, "valid_targets_mean": 5456.0, "valid_targets_min": 708 }, { "epoch": 3.035450516986706, "grad_norm": 0.4383446251656798, "learning_rate": 2.791658497703029e-05, "loss": 0.1809, "loss_nan_ranks": 0, "loss_rank_avg": 0.18855616450309753, "step": 2055, "valid_targets_mean": 5512.9, "valid_targets_min": 571 }, { "epoch": 3.0428360413589366, "grad_norm": 0.37011575013943987, "learning_rate": 2.7848887819329903e-05, "loss": 0.1869, "loss_nan_ranks": 0, "loss_rank_avg": 0.16166454553604126, "step": 2060, "valid_targets_mean": 6532.8, "valid_targets_min": 1512 }, { "epoch": 3.050221565731167, "grad_norm": 0.40311646790756955, "learning_rate": 2.7781084196027527e-05, "loss": 0.1646, "loss_nan_ranks": 0, "loss_rank_avg": 0.19137972593307495, "step": 2065, "valid_targets_mean": 5962.6, "valid_targets_min": 564 }, { "epoch": 3.057607090103397, "grad_norm": 0.4275359756981932, "learning_rate": 2.7713175026839905e-05, "loss": 0.1744, "loss_nan_ranks": 0, "loss_rank_avg": 0.21499311923980713, "step": 2070, "valid_targets_mean": 5277.0, "valid_targets_min": 709 }, { "epoch": 3.064992614475628, "grad_norm": 0.3752504219955399, "learning_rate": 2.7645161232915444e-05, "loss": 0.1732, "loss_nan_ranks": 0, "loss_rank_avg": 0.16594503819942474, "step": 2075, "valid_targets_mean": 6164.9, "valid_targets_min": 432 }, { "epoch": 3.072378138847858, "grad_norm": 0.4882106097565124, "learning_rate": 2.7577043736821748e-05, "loss": 0.1793, "loss_nan_ranks": 0, "loss_rank_avg": 0.21406424045562744, "step": 2080, "valid_targets_mean": 4252.2, "valid_targets_min": 625 }, { "epoch": 3.0797636632200884, "grad_norm": 0.3525875278030082, "learning_rate": 2.750882346253305e-05, "loss": 0.1792, "loss_nan_ranks": 0, "loss_rank_avg": 0.13793540000915527, "step": 2085, "valid_targets_mean": 6917.0, "valid_targets_min": 778 }, { "epoch": 3.087149187592319, "grad_norm": 0.4320447754658649, "learning_rate": 2.7440501335417748e-05, "loss": 0.1738, "loss_nan_ranks": 0, "loss_rank_avg": 0.1812410056591034, "step": 2090, "valid_targets_mean": 5966.3, "valid_targets_min": 497 }, { "epoch": 3.0945347119645494, "grad_norm": 0.5117110061423488, "learning_rate": 2.7372078282225772e-05, "loss": 0.1876, "loss_nan_ranks": 0, "loss_rank_avg": 0.2231147289276123, "step": 2095, "valid_targets_mean": 4128.2, "valid_targets_min": 540 }, { "epoch": 3.1019202363367797, "grad_norm": 0.4095198035952486, "learning_rate": 2.730355523107608e-05, "loss": 0.1735, "loss_nan_ranks": 0, "loss_rank_avg": 0.16321970522403717, "step": 2100, "valid_targets_mean": 5197.5, "valid_targets_min": 461 }, { "epoch": 3.1093057607090104, "grad_norm": 0.47545224234959904, "learning_rate": 2.7234933111444046e-05, "loss": 0.1716, "loss_nan_ranks": 0, "loss_rank_avg": 0.16089124977588654, "step": 2105, "valid_targets_mean": 3588.7, "valid_targets_min": 322 }, { "epoch": 3.1166912850812407, "grad_norm": 0.3910891142579986, "learning_rate": 2.7166212854148838e-05, "loss": 0.1673, "loss_nan_ranks": 0, "loss_rank_avg": 0.2100703865289688, "step": 2110, "valid_targets_mean": 6335.6, "valid_targets_min": 708 }, { "epoch": 3.124076809453471, "grad_norm": 0.4204297819786424, "learning_rate": 2.709739539134081e-05, "loss": 0.1753, "loss_nan_ranks": 0, "loss_rank_avg": 0.17549830675125122, "step": 2115, "valid_targets_mean": 4854.4, "valid_targets_min": 803 }, { "epoch": 3.1314623338257017, "grad_norm": 0.4084245651713014, "learning_rate": 2.7028481656488856e-05, "loss": 0.1751, "loss_nan_ranks": 0, "loss_rank_avg": 0.15884898602962494, "step": 2120, "valid_targets_mean": 4327.5, "valid_targets_min": 546 }, { "epoch": 3.138847858197932, "grad_norm": 0.5289348550596176, "learning_rate": 2.6959472584367737e-05, "loss": 0.1868, "loss_nan_ranks": 0, "loss_rank_avg": 0.18101103603839874, "step": 2125, "valid_targets_mean": 4410.6, "valid_targets_min": 696 }, { "epoch": 3.1462333825701623, "grad_norm": 0.4419683145308729, "learning_rate": 2.689036911104542e-05, "loss": 0.1873, "loss_nan_ranks": 0, "loss_rank_avg": 0.24032284319400787, "step": 2130, "valid_targets_mean": 5461.6, "valid_targets_min": 730 }, { "epoch": 3.153618906942393, "grad_norm": 0.7124574698928174, "learning_rate": 2.6821172173870355e-05, "loss": 0.1795, "loss_nan_ranks": 0, "loss_rank_avg": 0.15942493081092834, "step": 2135, "valid_targets_mean": 5982.3, "valid_targets_min": 228 }, { "epoch": 3.1610044313146233, "grad_norm": 0.4691946439142087, "learning_rate": 2.6751882711458783e-05, "loss": 0.1754, "loss_nan_ranks": 0, "loss_rank_avg": 0.16036120057106018, "step": 2140, "valid_targets_mean": 4745.8, "valid_targets_min": 652 }, { "epoch": 3.1683899556868536, "grad_norm": 0.3657559670571617, "learning_rate": 2.6682501663682e-05, "loss": 0.1756, "loss_nan_ranks": 0, "loss_rank_avg": 0.16519255936145782, "step": 2145, "valid_targets_mean": 6309.1, "valid_targets_min": 684 }, { "epoch": 3.1757754800590843, "grad_norm": 0.4525601076810765, "learning_rate": 2.661302997165359e-05, "loss": 0.1784, "loss_nan_ranks": 0, "loss_rank_avg": 0.16392679512500763, "step": 2150, "valid_targets_mean": 4315.6, "valid_targets_min": 598 }, { "epoch": 3.1831610044313146, "grad_norm": 0.4756846684204359, "learning_rate": 2.6543468577716694e-05, "loss": 0.2019, "loss_nan_ranks": 0, "loss_rank_avg": 0.2014717161655426, "step": 2155, "valid_targets_mean": 4423.4, "valid_targets_min": 594 }, { "epoch": 3.1905465288035453, "grad_norm": 0.4270410035428385, "learning_rate": 2.6473818425431185e-05, "loss": 0.1831, "loss_nan_ranks": 0, "loss_rank_avg": 0.1542786955833435, "step": 2160, "valid_targets_mean": 5105.6, "valid_targets_min": 348 }, { "epoch": 3.1979320531757756, "grad_norm": 0.4702062705925336, "learning_rate": 2.640408045956091e-05, "loss": 0.1884, "loss_nan_ranks": 0, "loss_rank_avg": 0.19304950535297394, "step": 2165, "valid_targets_mean": 4532.8, "valid_targets_min": 674 }, { "epoch": 3.205317577548006, "grad_norm": 0.45151853190869246, "learning_rate": 2.6334255626060842e-05, "loss": 0.1733, "loss_nan_ranks": 0, "loss_rank_avg": 0.19992440938949585, "step": 2170, "valid_targets_mean": 4673.7, "valid_targets_min": 658 }, { "epoch": 3.212703101920236, "grad_norm": 0.42434196985334355, "learning_rate": 2.626434487206428e-05, "loss": 0.1763, "loss_nan_ranks": 0, "loss_rank_avg": 0.18652237951755524, "step": 2175, "valid_targets_mean": 5400.8, "valid_targets_min": 528 }, { "epoch": 3.220088626292467, "grad_norm": 0.4063121122695259, "learning_rate": 2.6194349145869965e-05, "loss": 0.185, "loss_nan_ranks": 0, "loss_rank_avg": 0.16594845056533813, "step": 2180, "valid_targets_mean": 5230.7, "valid_targets_min": 369 }, { "epoch": 3.227474150664697, "grad_norm": 0.447772859466632, "learning_rate": 2.6124269396929256e-05, "loss": 0.169, "loss_nan_ranks": 0, "loss_rank_avg": 0.17529018223285675, "step": 2185, "valid_targets_mean": 4556.4, "valid_targets_min": 562 }, { "epoch": 3.234859675036928, "grad_norm": 0.40325224428720596, "learning_rate": 2.6054106575833206e-05, "loss": 0.1887, "loss_nan_ranks": 0, "loss_rank_avg": 0.18165422976016998, "step": 2190, "valid_targets_mean": 5751.3, "valid_targets_min": 644 }, { "epoch": 3.242245199409158, "grad_norm": 0.4248179861853043, "learning_rate": 2.5983861634299715e-05, "loss": 0.1938, "loss_nan_ranks": 0, "loss_rank_avg": 0.15987026691436768, "step": 2195, "valid_targets_mean": 5245.4, "valid_targets_min": 605 }, { "epoch": 3.2496307237813884, "grad_norm": 0.43315325209313854, "learning_rate": 2.5913535525160608e-05, "loss": 0.2076, "loss_nan_ranks": 0, "loss_rank_avg": 0.19797955453395844, "step": 2200, "valid_targets_mean": 5092.6, "valid_targets_min": 595 }, { "epoch": 3.2570162481536187, "grad_norm": 0.45899763861106463, "learning_rate": 2.5843129202348666e-05, "loss": 0.1825, "loss_nan_ranks": 0, "loss_rank_avg": 0.1837209016084671, "step": 2205, "valid_targets_mean": 5431.0, "valid_targets_min": 905 }, { "epoch": 3.2644017725258494, "grad_norm": 0.34185089958623904, "learning_rate": 2.577264362088475e-05, "loss": 0.1628, "loss_nan_ranks": 0, "loss_rank_avg": 0.12556633353233337, "step": 2210, "valid_targets_mean": 6299.7, "valid_targets_min": 521 }, { "epoch": 3.2717872968980797, "grad_norm": 0.41205572297039716, "learning_rate": 2.5702079736864815e-05, "loss": 0.1838, "loss_nan_ranks": 0, "loss_rank_avg": 0.16507720947265625, "step": 2215, "valid_targets_mean": 5128.1, "valid_targets_min": 821 }, { "epoch": 3.2791728212703104, "grad_norm": 0.3997869068309829, "learning_rate": 2.5631438507446936e-05, "loss": 0.1922, "loss_nan_ranks": 0, "loss_rank_avg": 0.1773259937763214, "step": 2220, "valid_targets_mean": 5669.0, "valid_targets_min": 665 }, { "epoch": 3.2865583456425407, "grad_norm": 0.4984598466794601, "learning_rate": 2.5560720890838332e-05, "loss": 0.1908, "loss_nan_ranks": 0, "loss_rank_avg": 0.2146761119365692, "step": 2225, "valid_targets_mean": 4352.7, "valid_targets_min": 648 }, { "epoch": 3.293943870014771, "grad_norm": 0.47607510524209484, "learning_rate": 2.5489927846282386e-05, "loss": 0.1822, "loss_nan_ranks": 0, "loss_rank_avg": 0.1854625642299652, "step": 2230, "valid_targets_mean": 4233.4, "valid_targets_min": 504 }, { "epoch": 3.3013293943870012, "grad_norm": 0.4239465864105787, "learning_rate": 2.5419060334045606e-05, "loss": 0.187, "loss_nan_ranks": 0, "loss_rank_avg": 0.17958292365074158, "step": 2235, "valid_targets_mean": 5336.4, "valid_targets_min": 674 }, { "epoch": 3.308714918759232, "grad_norm": 0.4619161542340498, "learning_rate": 2.5348119315404604e-05, "loss": 0.1684, "loss_nan_ranks": 0, "loss_rank_avg": 0.17576739192008972, "step": 2240, "valid_targets_mean": 5028.8, "valid_targets_min": 572 }, { "epoch": 3.3161004431314622, "grad_norm": 0.37782695093104735, "learning_rate": 2.5277105752633083e-05, "loss": 0.1632, "loss_nan_ranks": 0, "loss_rank_avg": 0.1741185039281845, "step": 2245, "valid_targets_mean": 5921.9, "valid_targets_min": 425 }, { "epoch": 3.323485967503693, "grad_norm": 0.46105586751392597, "learning_rate": 2.520602060898874e-05, "loss": 0.1815, "loss_nan_ranks": 0, "loss_rank_avg": 0.2181580513715744, "step": 2250, "valid_targets_mean": 4782.2, "valid_targets_min": 785 }, { "epoch": 3.3308714918759232, "grad_norm": 0.44233045621174916, "learning_rate": 2.5134864848700247e-05, "loss": 0.1926, "loss_nan_ranks": 0, "loss_rank_avg": 0.21820692718029022, "step": 2255, "valid_targets_mean": 5393.2, "valid_targets_min": 628 }, { "epoch": 3.3382570162481535, "grad_norm": 0.4176926479653841, "learning_rate": 2.5063639436954145e-05, "loss": 0.1949, "loss_nan_ranks": 0, "loss_rank_avg": 0.2524767518043518, "step": 2260, "valid_targets_mean": 6778.2, "valid_targets_min": 609 }, { "epoch": 3.345642540620384, "grad_norm": 0.3785623480657544, "learning_rate": 2.499234533988174e-05, "loss": 0.2208, "loss_nan_ranks": 0, "loss_rank_avg": 0.15883594751358032, "step": 2265, "valid_targets_mean": 6011.2, "valid_targets_min": 541 }, { "epoch": 3.3530280649926145, "grad_norm": 0.9489103748663574, "learning_rate": 2.4920983524546035e-05, "loss": 0.1826, "loss_nan_ranks": 0, "loss_rank_avg": 0.19622023403644562, "step": 2270, "valid_targets_mean": 2849.2, "valid_targets_min": 336 }, { "epoch": 3.360413589364845, "grad_norm": 0.4851485979634193, "learning_rate": 2.4849554958928582e-05, "loss": 0.1775, "loss_nan_ranks": 0, "loss_rank_avg": 0.1570294201374054, "step": 2275, "valid_targets_mean": 4828.0, "valid_targets_min": 533 }, { "epoch": 3.3677991137370755, "grad_norm": 0.38871049650595657, "learning_rate": 2.477806061191637e-05, "loss": 0.1867, "loss_nan_ranks": 0, "loss_rank_avg": 0.16449853777885437, "step": 2280, "valid_targets_mean": 6279.4, "valid_targets_min": 623 }, { "epoch": 3.375184638109306, "grad_norm": 0.3846163906395918, "learning_rate": 2.4706501453288656e-05, "loss": 0.1927, "loss_nan_ranks": 0, "loss_rank_avg": 0.17619986832141876, "step": 2285, "valid_targets_mean": 5938.9, "valid_targets_min": 718 }, { "epoch": 3.382570162481536, "grad_norm": 0.4036981390266134, "learning_rate": 2.4634878453703857e-05, "loss": 0.1728, "loss_nan_ranks": 0, "loss_rank_avg": 0.16103024780750275, "step": 2290, "valid_targets_mean": 5504.4, "valid_targets_min": 1317 }, { "epoch": 3.389955686853767, "grad_norm": 0.6582445011580204, "learning_rate": 2.4563192584686325e-05, "loss": 0.1801, "loss_nan_ranks": 0, "loss_rank_avg": 0.192658931016922, "step": 2295, "valid_targets_mean": 3992.2, "valid_targets_min": 602 }, { "epoch": 3.397341211225997, "grad_norm": 0.37316580719925574, "learning_rate": 2.4491444818613218e-05, "loss": 0.1823, "loss_nan_ranks": 0, "loss_rank_avg": 0.1514277458190918, "step": 2300, "valid_targets_mean": 6166.7, "valid_targets_min": 493 }, { "epoch": 3.4047267355982274, "grad_norm": 0.36651337529440386, "learning_rate": 2.441963612870129e-05, "loss": 0.1829, "loss_nan_ranks": 0, "loss_rank_avg": 0.17430251836776733, "step": 2305, "valid_targets_mean": 6701.6, "valid_targets_min": 1299 }, { "epoch": 3.412112259970458, "grad_norm": 0.4562920402638719, "learning_rate": 2.4347767488993697e-05, "loss": 0.1706, "loss_nan_ranks": 0, "loss_rank_avg": 0.17882443964481354, "step": 2310, "valid_targets_mean": 4928.1, "valid_targets_min": 677 }, { "epoch": 3.4194977843426884, "grad_norm": 0.40217427857200977, "learning_rate": 2.4275839874346757e-05, "loss": 0.1803, "loss_nan_ranks": 0, "loss_rank_avg": 0.21625502407550812, "step": 2315, "valid_targets_mean": 5914.1, "valid_targets_min": 642 }, { "epoch": 3.4268833087149186, "grad_norm": 0.4676729858346907, "learning_rate": 2.4203854260416764e-05, "loss": 0.1719, "loss_nan_ranks": 0, "loss_rank_avg": 0.18612849712371826, "step": 2320, "valid_targets_mean": 4202.7, "valid_targets_min": 513 }, { "epoch": 3.4342688330871494, "grad_norm": 0.5053850543812328, "learning_rate": 2.4131811623646745e-05, "loss": 0.1777, "loss_nan_ranks": 0, "loss_rank_avg": 0.20099109411239624, "step": 2325, "valid_targets_mean": 5066.5, "valid_targets_min": 799 }, { "epoch": 3.4416543574593796, "grad_norm": 0.4177536175359703, "learning_rate": 2.4059712941253205e-05, "loss": 0.1731, "loss_nan_ranks": 0, "loss_rank_avg": 0.17040522396564484, "step": 2330, "valid_targets_mean": 6019.4, "valid_targets_min": 622 }, { "epoch": 3.44903988183161, "grad_norm": 0.3896994204855158, "learning_rate": 2.3987559191212855e-05, "loss": 0.1661, "loss_nan_ranks": 0, "loss_rank_avg": 0.17240211367607117, "step": 2335, "valid_targets_mean": 5771.4, "valid_targets_min": 820 }, { "epoch": 3.4564254062038406, "grad_norm": 0.4519987685160109, "learning_rate": 2.3915351352249392e-05, "loss": 0.1619, "loss_nan_ranks": 0, "loss_rank_avg": 0.194617360830307, "step": 2340, "valid_targets_mean": 4527.7, "valid_targets_min": 726 }, { "epoch": 3.463810930576071, "grad_norm": 0.5253399465778659, "learning_rate": 2.3843090403820198e-05, "loss": 0.1768, "loss_nan_ranks": 0, "loss_rank_avg": 0.16879601776599884, "step": 2345, "valid_targets_mean": 6142.8, "valid_targets_min": 451 }, { "epoch": 3.471196454948301, "grad_norm": 0.4277432003720903, "learning_rate": 2.3770777326103033e-05, "loss": 0.1891, "loss_nan_ranks": 0, "loss_rank_avg": 0.18401449918746948, "step": 2350, "valid_targets_mean": 5573.9, "valid_targets_min": 477 }, { "epoch": 3.478581979320532, "grad_norm": 0.4257500742732944, "learning_rate": 2.3698413099982772e-05, "loss": 0.1868, "loss_nan_ranks": 0, "loss_rank_avg": 0.23105338215827942, "step": 2355, "valid_targets_mean": 6022.1, "valid_targets_min": 577 }, { "epoch": 3.485967503692762, "grad_norm": 0.35202882188870804, "learning_rate": 2.3625998707038095e-05, "loss": 0.1754, "loss_nan_ranks": 0, "loss_rank_avg": 0.15384787321090698, "step": 2360, "valid_targets_mean": 6247.2, "valid_targets_min": 743 }, { "epoch": 3.4933530280649925, "grad_norm": 0.5362069711243463, "learning_rate": 2.355353512952816e-05, "loss": 0.1986, "loss_nan_ranks": 0, "loss_rank_avg": 0.2501859962940216, "step": 2365, "valid_targets_mean": 3637.5, "valid_targets_min": 557 }, { "epoch": 3.500738552437223, "grad_norm": 0.627740196350393, "learning_rate": 2.3481023350379282e-05, "loss": 0.1854, "loss_nan_ranks": 0, "loss_rank_avg": 0.1972651183605194, "step": 2370, "valid_targets_mean": 3431.4, "valid_targets_min": 298 }, { "epoch": 3.5081240768094535, "grad_norm": 0.42738807000739665, "learning_rate": 2.3408464353171603e-05, "loss": 0.1675, "loss_nan_ranks": 0, "loss_rank_avg": 0.17980587482452393, "step": 2375, "valid_targets_mean": 4957.2, "valid_targets_min": 606 }, { "epoch": 3.5155096011816838, "grad_norm": 0.4123970309337914, "learning_rate": 2.3335859122125762e-05, "loss": 0.1848, "loss_nan_ranks": 0, "loss_rank_avg": 0.1853245347738266, "step": 2380, "valid_targets_mean": 4892.4, "valid_targets_min": 658 }, { "epoch": 3.5228951255539145, "grad_norm": 0.42163919981185066, "learning_rate": 2.3263208642089517e-05, "loss": 0.1855, "loss_nan_ranks": 0, "loss_rank_avg": 0.15585747361183167, "step": 2385, "valid_targets_mean": 4967.4, "valid_targets_min": 606 }, { "epoch": 3.5302806499261448, "grad_norm": 0.3631774625240425, "learning_rate": 2.319051389852441e-05, "loss": 0.199, "loss_nan_ranks": 0, "loss_rank_avg": 0.15152710676193237, "step": 2390, "valid_targets_mean": 6531.5, "valid_targets_min": 526 }, { "epoch": 3.537666174298375, "grad_norm": 0.4386225168817978, "learning_rate": 2.311777587749239e-05, "loss": 0.187, "loss_nan_ranks": 0, "loss_rank_avg": 0.17836642265319824, "step": 2395, "valid_targets_mean": 5189.2, "valid_targets_min": 400 }, { "epoch": 3.5450516986706058, "grad_norm": 0.37272488284870037, "learning_rate": 2.3044995565642453e-05, "loss": 0.1689, "loss_nan_ranks": 0, "loss_rank_avg": 0.15524575114250183, "step": 2400, "valid_targets_mean": 5844.1, "valid_targets_min": 323 }, { "epoch": 3.552437223042836, "grad_norm": 0.4273954739176906, "learning_rate": 2.2972173950197223e-05, "loss": 0.179, "loss_nan_ranks": 0, "loss_rank_avg": 0.19005119800567627, "step": 2405, "valid_targets_mean": 5287.6, "valid_targets_min": 522 }, { "epoch": 3.5598227474150663, "grad_norm": 0.3809128573118705, "learning_rate": 2.2899312018939598e-05, "loss": 0.1737, "loss_nan_ranks": 0, "loss_rank_avg": 0.16557791829109192, "step": 2410, "valid_targets_mean": 5387.4, "valid_targets_min": 424 }, { "epoch": 3.567208271787297, "grad_norm": 0.445270409658121, "learning_rate": 2.2826410760199327e-05, "loss": 0.1768, "loss_nan_ranks": 0, "loss_rank_avg": 0.16389130055904388, "step": 2415, "valid_targets_mean": 6058.5, "valid_targets_min": 699 }, { "epoch": 3.5745937961595273, "grad_norm": 0.7167965047318506, "learning_rate": 2.2753471162839637e-05, "loss": 0.1758, "loss_nan_ranks": 0, "loss_rank_avg": 0.20100605487823486, "step": 2420, "valid_targets_mean": 6238.5, "valid_targets_min": 567 }, { "epoch": 3.5819793205317576, "grad_norm": 0.44061592794128485, "learning_rate": 2.2680494216243762e-05, "loss": 0.2084, "loss_nan_ranks": 0, "loss_rank_avg": 0.20798034965991974, "step": 2425, "valid_targets_mean": 5419.6, "valid_targets_min": 628 }, { "epoch": 3.5893648449039883, "grad_norm": 0.39676272392212464, "learning_rate": 2.2607480910301564e-05, "loss": 0.1939, "loss_nan_ranks": 0, "loss_rank_avg": 0.18191611766815186, "step": 2430, "valid_targets_mean": 6013.3, "valid_targets_min": 704 }, { "epoch": 3.5967503692762186, "grad_norm": 0.38941782318875595, "learning_rate": 2.253443223539613e-05, "loss": 0.17, "loss_nan_ranks": 0, "loss_rank_avg": 0.17795924842357635, "step": 2435, "valid_targets_mean": 5669.7, "valid_targets_min": 647 }, { "epoch": 3.604135893648449, "grad_norm": 0.3942812475735809, "learning_rate": 2.246134918239028e-05, "loss": 0.1941, "loss_nan_ranks": 0, "loss_rank_avg": 0.1445077508687973, "step": 2440, "valid_targets_mean": 5918.6, "valid_targets_min": 641 }, { "epoch": 3.6115214180206796, "grad_norm": 0.3878199914386221, "learning_rate": 2.2388232742613146e-05, "loss": 0.1951, "loss_nan_ranks": 0, "loss_rank_avg": 0.15950973331928253, "step": 2445, "valid_targets_mean": 5599.8, "valid_targets_min": 462 }, { "epoch": 3.61890694239291, "grad_norm": 0.40119193945091164, "learning_rate": 2.231508390784674e-05, "loss": 0.1777, "loss_nan_ranks": 0, "loss_rank_avg": 0.18693730235099792, "step": 2450, "valid_targets_mean": 5479.7, "valid_targets_min": 683 }, { "epoch": 3.62629246676514, "grad_norm": 0.41270041132362517, "learning_rate": 2.2241903670312516e-05, "loss": 0.1769, "loss_nan_ranks": 0, "loss_rank_avg": 0.1751289963722229, "step": 2455, "valid_targets_mean": 6304.4, "valid_targets_min": 729 }, { "epoch": 3.633677991137371, "grad_norm": 0.37919593321209355, "learning_rate": 2.216869302265785e-05, "loss": 0.1683, "loss_nan_ranks": 0, "loss_rank_avg": 0.180336594581604, "step": 2460, "valid_targets_mean": 6089.2, "valid_targets_min": 683 }, { "epoch": 3.641063515509601, "grad_norm": 0.41713272138692914, "learning_rate": 2.2095452957942643e-05, "loss": 0.1783, "loss_nan_ranks": 0, "loss_rank_avg": 0.17298147082328796, "step": 2465, "valid_targets_mean": 5199.1, "valid_targets_min": 547 }, { "epoch": 3.6484490398818314, "grad_norm": 0.5197567957007619, "learning_rate": 2.2022184469625797e-05, "loss": 0.1859, "loss_nan_ranks": 0, "loss_rank_avg": 0.1868414729833603, "step": 2470, "valid_targets_mean": 4258.9, "valid_targets_min": 620 }, { "epoch": 3.655834564254062, "grad_norm": 0.39404420347224917, "learning_rate": 2.1948888551551795e-05, "loss": 0.175, "loss_nan_ranks": 0, "loss_rank_avg": 0.16973114013671875, "step": 2475, "valid_targets_mean": 5702.5, "valid_targets_min": 528 }, { "epoch": 3.6632200886262924, "grad_norm": 0.49672107594538334, "learning_rate": 2.1875566197937154e-05, "loss": 0.1907, "loss_nan_ranks": 0, "loss_rank_avg": 0.22505685687065125, "step": 2480, "valid_targets_mean": 4229.1, "valid_targets_min": 614 }, { "epoch": 3.670605612998523, "grad_norm": 0.5386862158554978, "learning_rate": 2.1802218403357003e-05, "loss": 0.1815, "loss_nan_ranks": 0, "loss_rank_avg": 0.18474605679512024, "step": 2485, "valid_targets_mean": 3811.4, "valid_targets_min": 608 }, { "epoch": 3.6779911373707534, "grad_norm": 0.4199309274764877, "learning_rate": 2.1728846162731547e-05, "loss": 0.1781, "loss_nan_ranks": 0, "loss_rank_avg": 0.16229534149169922, "step": 2490, "valid_targets_mean": 4422.1, "valid_targets_min": 602 }, { "epoch": 3.6853766617429837, "grad_norm": 0.44213788636825774, "learning_rate": 2.1655450471312587e-05, "loss": 0.1838, "loss_nan_ranks": 0, "loss_rank_avg": 0.16909149289131165, "step": 2495, "valid_targets_mean": 4642.9, "valid_targets_min": 670 }, { "epoch": 3.692762186115214, "grad_norm": 0.47756920378888834, "learning_rate": 2.1582032324670024e-05, "loss": 0.199, "loss_nan_ranks": 0, "loss_rank_avg": 0.21273420751094818, "step": 2500, "valid_targets_mean": 4483.9, "valid_targets_min": 573 }, { "epoch": 3.7001477104874447, "grad_norm": 1.7776796913692625, "learning_rate": 2.150859271867836e-05, "loss": 0.1863, "loss_nan_ranks": 0, "loss_rank_avg": 0.20686309039592743, "step": 2505, "valid_targets_mean": 3814.2, "valid_targets_min": 282 }, { "epoch": 3.707533234859675, "grad_norm": 0.4541222702170866, "learning_rate": 2.143513264950316e-05, "loss": 0.1779, "loss_nan_ranks": 0, "loss_rank_avg": 0.16933034360408783, "step": 2510, "valid_targets_mean": 4283.7, "valid_targets_min": 360 }, { "epoch": 3.7149187592319057, "grad_norm": 0.512488878559065, "learning_rate": 2.1361653113587583e-05, "loss": 0.1981, "loss_nan_ranks": 0, "loss_rank_avg": 0.23736466467380524, "step": 2515, "valid_targets_mean": 4091.1, "valid_targets_min": 553 }, { "epoch": 3.722304283604136, "grad_norm": 0.5026024047876461, "learning_rate": 2.128815510763882e-05, "loss": 0.1718, "loss_nan_ranks": 0, "loss_rank_avg": 0.19661220908164978, "step": 2520, "valid_targets_mean": 3568.8, "valid_targets_min": 479 }, { "epoch": 3.7296898079763663, "grad_norm": 0.4756178800621908, "learning_rate": 2.1214639628614618e-05, "loss": 0.1717, "loss_nan_ranks": 0, "loss_rank_avg": 0.2067551612854004, "step": 2525, "valid_targets_mean": 4420.6, "valid_targets_min": 535 }, { "epoch": 3.7370753323485966, "grad_norm": 0.4481991423508541, "learning_rate": 2.1141107673709727e-05, "loss": 0.1831, "loss_nan_ranks": 0, "loss_rank_avg": 0.2029070109128952, "step": 2530, "valid_targets_mean": 4889.3, "valid_targets_min": 671 }, { "epoch": 3.7444608567208273, "grad_norm": 0.4486218822810619, "learning_rate": 2.1067560240342382e-05, "loss": 0.189, "loss_nan_ranks": 0, "loss_rank_avg": 0.19874705374240875, "step": 2535, "valid_targets_mean": 4725.5, "valid_targets_min": 309 }, { "epoch": 3.7518463810930576, "grad_norm": 0.42580796837346163, "learning_rate": 2.0993998326140774e-05, "loss": 0.1857, "loss_nan_ranks": 0, "loss_rank_avg": 0.17727911472320557, "step": 2540, "valid_targets_mean": 4696.8, "valid_targets_min": 629 }, { "epoch": 3.7592319054652883, "grad_norm": 0.46276463063827256, "learning_rate": 2.0920422928929514e-05, "loss": 0.165, "loss_nan_ranks": 0, "loss_rank_avg": 0.21701931953430176, "step": 2545, "valid_targets_mean": 5121.4, "valid_targets_min": 620 }, { "epoch": 3.7666174298375186, "grad_norm": 0.39520678275058635, "learning_rate": 2.0846835046716124e-05, "loss": 0.1798, "loss_nan_ranks": 0, "loss_rank_avg": 0.2055937796831131, "step": 2550, "valid_targets_mean": 6235.9, "valid_targets_min": 743 }, { "epoch": 3.774002954209749, "grad_norm": 0.3749059071380504, "learning_rate": 2.0773235677677453e-05, "loss": 0.1882, "loss_nan_ranks": 0, "loss_rank_avg": 0.1439509242773056, "step": 2555, "valid_targets_mean": 5177.5, "valid_targets_min": 601 }, { "epoch": 3.781388478581979, "grad_norm": 0.4376582038796636, "learning_rate": 2.0699625820146166e-05, "loss": 0.1804, "loss_nan_ranks": 0, "loss_rank_avg": 0.19691312313079834, "step": 2560, "valid_targets_mean": 4715.4, "valid_targets_min": 388 }, { "epoch": 3.78877400295421, "grad_norm": 0.4555515812161259, "learning_rate": 2.0626006472597203e-05, "loss": 0.1937, "loss_nan_ranks": 0, "loss_rank_avg": 0.2008768618106842, "step": 2565, "valid_targets_mean": 4623.0, "valid_targets_min": 731 }, { "epoch": 3.79615952732644, "grad_norm": 0.459171004943161, "learning_rate": 2.055237863363424e-05, "loss": 0.1948, "loss_nan_ranks": 0, "loss_rank_avg": 0.21966755390167236, "step": 2570, "valid_targets_mean": 4648.9, "valid_targets_min": 615 }, { "epoch": 3.803545051698671, "grad_norm": 0.4284579195415132, "learning_rate": 2.047874330197612e-05, "loss": 0.1984, "loss_nan_ranks": 0, "loss_rank_avg": 0.17750242352485657, "step": 2575, "valid_targets_mean": 5786.1, "valid_targets_min": 697 }, { "epoch": 3.810930576070901, "grad_norm": 0.5052628017425496, "learning_rate": 2.040510147644332e-05, "loss": 0.1835, "loss_nan_ranks": 0, "loss_rank_avg": 0.1922721564769745, "step": 2580, "valid_targets_mean": 4639.9, "valid_targets_min": 664 }, { "epoch": 3.8183161004431314, "grad_norm": 0.5209698856989999, "learning_rate": 2.033145415594441e-05, "loss": 0.1807, "loss_nan_ranks": 0, "loss_rank_avg": 0.1749410480260849, "step": 2585, "valid_targets_mean": 4522.6, "valid_targets_min": 314 }, { "epoch": 3.8257016248153617, "grad_norm": 0.5289497505816443, "learning_rate": 2.0257802339462497e-05, "loss": 0.2188, "loss_nan_ranks": 0, "loss_rank_avg": 0.2323957085609436, "step": 2590, "valid_targets_mean": 3958.1, "valid_targets_min": 257 }, { "epoch": 3.8330871491875924, "grad_norm": 0.4429473903371753, "learning_rate": 2.018414702604167e-05, "loss": 0.1755, "loss_nan_ranks": 0, "loss_rank_avg": 0.17129692435264587, "step": 2595, "valid_targets_mean": 4951.2, "valid_targets_min": 535 }, { "epoch": 3.8404726735598227, "grad_norm": 0.5664110286490077, "learning_rate": 2.011048921477345e-05, "loss": 0.1774, "loss_nan_ranks": 0, "loss_rank_avg": 0.19464537501335144, "step": 2600, "valid_targets_mean": 4107.1, "valid_targets_min": 743 }, { "epoch": 3.8478581979320534, "grad_norm": 0.48372759494178025, "learning_rate": 2.0036829904783234e-05, "loss": 0.1714, "loss_nan_ranks": 0, "loss_rank_avg": 0.15631017088890076, "step": 2605, "valid_targets_mean": 5911.1, "valid_targets_min": 535 }, { "epoch": 3.8552437223042837, "grad_norm": 0.5771058795231779, "learning_rate": 1.996317009521677e-05, "loss": 0.1724, "loss_nan_ranks": 0, "loss_rank_avg": 0.16237816214561462, "step": 2610, "valid_targets_mean": 4347.8, "valid_targets_min": 565 }, { "epoch": 3.862629246676514, "grad_norm": 0.3451442793961211, "learning_rate": 1.9889510785226556e-05, "loss": 0.1684, "loss_nan_ranks": 0, "loss_rank_avg": 0.16310572624206543, "step": 2615, "valid_targets_mean": 6855.8, "valid_targets_min": 537 }, { "epoch": 3.8700147710487443, "grad_norm": 0.47160578182778307, "learning_rate": 1.981585297395833e-05, "loss": 0.1832, "loss_nan_ranks": 0, "loss_rank_avg": 0.18903210759162903, "step": 2620, "valid_targets_mean": 4925.4, "valid_targets_min": 490 }, { "epoch": 3.877400295420975, "grad_norm": 0.4112730275680861, "learning_rate": 1.9742197660537503e-05, "loss": 0.1801, "loss_nan_ranks": 0, "loss_rank_avg": 0.1774231493473053, "step": 2625, "valid_targets_mean": 4865.4, "valid_targets_min": 566 }, { "epoch": 3.8847858197932053, "grad_norm": 0.3852153308078606, "learning_rate": 1.96685458440556e-05, "loss": 0.1918, "loss_nan_ranks": 0, "loss_rank_avg": 0.21487516164779663, "step": 2630, "valid_targets_mean": 6536.1, "valid_targets_min": 666 }, { "epoch": 3.892171344165436, "grad_norm": 0.4266578300389501, "learning_rate": 1.9594898523556688e-05, "loss": 0.2017, "loss_nan_ranks": 0, "loss_rank_avg": 0.1812269687652588, "step": 2635, "valid_targets_mean": 4853.8, "valid_targets_min": 509 }, { "epoch": 3.8995568685376663, "grad_norm": 0.47478356489339524, "learning_rate": 1.952125669802389e-05, "loss": 0.1634, "loss_nan_ranks": 0, "loss_rank_avg": 0.1804153323173523, "step": 2640, "valid_targets_mean": 4120.0, "valid_targets_min": 229 }, { "epoch": 3.9069423929098965, "grad_norm": 0.3984291783021106, "learning_rate": 1.944762136636577e-05, "loss": 0.1684, "loss_nan_ranks": 0, "loss_rank_avg": 0.14626066386699677, "step": 2645, "valid_targets_mean": 5470.4, "valid_targets_min": 482 }, { "epoch": 3.914327917282127, "grad_norm": 0.4145840145456443, "learning_rate": 1.9373993527402803e-05, "loss": 0.1842, "loss_nan_ranks": 0, "loss_rank_avg": 0.17797842621803284, "step": 2650, "valid_targets_mean": 5413.2, "valid_targets_min": 524 }, { "epoch": 3.9217134416543575, "grad_norm": 0.43768905570389377, "learning_rate": 1.930037417985384e-05, "loss": 0.1846, "loss_nan_ranks": 0, "loss_rank_avg": 0.1793164610862732, "step": 2655, "valid_targets_mean": 4557.5, "valid_targets_min": 563 }, { "epoch": 3.929098966026588, "grad_norm": 0.4471133890380236, "learning_rate": 1.9226764322322554e-05, "loss": 0.183, "loss_nan_ranks": 0, "loss_rank_avg": 0.21864616870880127, "step": 2660, "valid_targets_mean": 5254.9, "valid_targets_min": 788 }, { "epoch": 3.9364844903988185, "grad_norm": 0.4345555815624583, "learning_rate": 1.915316495328388e-05, "loss": 0.1746, "loss_nan_ranks": 0, "loss_rank_avg": 0.18304719030857086, "step": 2665, "valid_targets_mean": 4897.6, "valid_targets_min": 530 }, { "epoch": 3.943870014771049, "grad_norm": 0.46340151961537496, "learning_rate": 1.9079577071070486e-05, "loss": 0.1697, "loss_nan_ranks": 0, "loss_rank_avg": 0.1812700629234314, "step": 2670, "valid_targets_mean": 4532.0, "valid_targets_min": 570 }, { "epoch": 3.951255539143279, "grad_norm": 0.46722063462251806, "learning_rate": 1.9006001673859236e-05, "loss": 0.1755, "loss_nan_ranks": 0, "loss_rank_avg": 0.18102481961250305, "step": 2675, "valid_targets_mean": 4135.3, "valid_targets_min": 531 }, { "epoch": 3.9586410635155094, "grad_norm": 0.46809132826813665, "learning_rate": 1.8932439759657628e-05, "loss": 0.179, "loss_nan_ranks": 0, "loss_rank_avg": 0.2036694884300232, "step": 2680, "valid_targets_mean": 4903.4, "valid_targets_min": 455 }, { "epoch": 3.96602658788774, "grad_norm": 0.4224456008680522, "learning_rate": 1.8858892326290283e-05, "loss": 0.1767, "loss_nan_ranks": 0, "loss_rank_avg": 0.20503783226013184, "step": 2685, "valid_targets_mean": 4960.2, "valid_targets_min": 563 }, { "epoch": 3.9734121122599704, "grad_norm": 0.3976755577199375, "learning_rate": 1.878536037138539e-05, "loss": 0.1796, "loss_nan_ranks": 0, "loss_rank_avg": 0.16833657026290894, "step": 2690, "valid_targets_mean": 5052.5, "valid_targets_min": 660 }, { "epoch": 3.980797636632201, "grad_norm": 0.4015922991970415, "learning_rate": 1.8711844892361187e-05, "loss": 0.1908, "loss_nan_ranks": 0, "loss_rank_avg": 0.17497824132442474, "step": 2695, "valid_targets_mean": 6211.0, "valid_targets_min": 703 }, { "epoch": 3.9881831610044314, "grad_norm": 0.46100259598039117, "learning_rate": 1.8638346886412427e-05, "loss": 0.1775, "loss_nan_ranks": 0, "loss_rank_avg": 0.17598775029182434, "step": 2700, "valid_targets_mean": 4511.3, "valid_targets_min": 677 }, { "epoch": 3.9955686853766617, "grad_norm": 0.5263845759468841, "learning_rate": 1.8564867350496845e-05, "loss": 0.1706, "loss_nan_ranks": 0, "loss_rank_avg": 0.1905372142791748, "step": 2705, "valid_targets_mean": 3814.4, "valid_targets_min": 561 }, { "epoch": 4.002954209748892, "grad_norm": 0.34980228182591305, "learning_rate": 1.8491407281321647e-05, "loss": 0.172, "loss_nan_ranks": 0, "loss_rank_avg": 0.14900560677051544, "step": 2710, "valid_targets_mean": 6249.2, "valid_targets_min": 320 }, { "epoch": 4.010339734121122, "grad_norm": 0.5143265300926454, "learning_rate": 1.8417967675329975e-05, "loss": 0.1616, "loss_nan_ranks": 0, "loss_rank_avg": 0.17539595067501068, "step": 2715, "valid_targets_mean": 3539.0, "valid_targets_min": 433 }, { "epoch": 4.017725258493353, "grad_norm": 0.3935516918907612, "learning_rate": 1.8344549528687423e-05, "loss": 0.1737, "loss_nan_ranks": 0, "loss_rank_avg": 0.18661487102508545, "step": 2720, "valid_targets_mean": 6973.4, "valid_targets_min": 441 }, { "epoch": 4.025110782865584, "grad_norm": 0.44755179204475903, "learning_rate": 1.8271153837268464e-05, "loss": 0.1638, "loss_nan_ranks": 0, "loss_rank_avg": 0.15159180760383606, "step": 2725, "valid_targets_mean": 4417.1, "valid_targets_min": 673 }, { "epoch": 4.032496307237814, "grad_norm": 0.42283273517778147, "learning_rate": 1.8197781596643e-05, "loss": 0.1803, "loss_nan_ranks": 0, "loss_rank_avg": 0.18647818267345428, "step": 2730, "valid_targets_mean": 5626.2, "valid_targets_min": 648 }, { "epoch": 4.039881831610044, "grad_norm": 0.39804774495793865, "learning_rate": 1.812443380206285e-05, "loss": 0.1632, "loss_nan_ranks": 0, "loss_rank_avg": 0.13898664712905884, "step": 2735, "valid_targets_mean": 5607.3, "valid_targets_min": 827 }, { "epoch": 4.0472673559822745, "grad_norm": 0.4952592545309753, "learning_rate": 1.805111144844821e-05, "loss": 0.1694, "loss_nan_ranks": 0, "loss_rank_avg": 0.17651236057281494, "step": 2740, "valid_targets_mean": 4273.1, "valid_targets_min": 564 }, { "epoch": 4.054652880354505, "grad_norm": 0.5267789359486101, "learning_rate": 1.7977815530374207e-05, "loss": 0.148, "loss_nan_ranks": 0, "loss_rank_avg": 0.16626033186912537, "step": 2745, "valid_targets_mean": 3623.0, "valid_targets_min": 125 }, { "epoch": 4.062038404726736, "grad_norm": 0.5196745978105738, "learning_rate": 1.7904547042057364e-05, "loss": 0.1622, "loss_nan_ranks": 0, "loss_rank_avg": 0.16587507724761963, "step": 2750, "valid_targets_mean": 4396.9, "valid_targets_min": 466 }, { "epoch": 4.069423929098966, "grad_norm": 0.4220475584040045, "learning_rate": 1.7831306977342152e-05, "loss": 0.1498, "loss_nan_ranks": 0, "loss_rank_avg": 0.14500692486763, "step": 2755, "valid_targets_mean": 4850.2, "valid_targets_min": 524 }, { "epoch": 4.0768094534711965, "grad_norm": 0.42814857370303006, "learning_rate": 1.7758096329687488e-05, "loss": 0.1562, "loss_nan_ranks": 0, "loss_rank_avg": 0.13999520242214203, "step": 2760, "valid_targets_mean": 5521.1, "valid_targets_min": 606 }, { "epoch": 4.084194977843427, "grad_norm": 0.3859057452591373, "learning_rate": 1.7684916092153262e-05, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.14261415600776672, "step": 2765, "valid_targets_mean": 5565.9, "valid_targets_min": 672 }, { "epoch": 4.091580502215657, "grad_norm": 0.42241050834024985, "learning_rate": 1.7611767257386864e-05, "loss": 0.1661, "loss_nan_ranks": 0, "loss_rank_avg": 0.1470344364643097, "step": 2770, "valid_targets_mean": 5220.9, "valid_targets_min": 674 }, { "epoch": 4.098966026587887, "grad_norm": 0.416789874748107, "learning_rate": 1.753865081760973e-05, "loss": 0.1645, "loss_nan_ranks": 0, "loss_rank_avg": 0.17493118345737457, "step": 2775, "valid_targets_mean": 5951.9, "valid_targets_min": 606 }, { "epoch": 4.1063515509601185, "grad_norm": 0.46960220255251917, "learning_rate": 1.7465567764603876e-05, "loss": 0.1671, "loss_nan_ranks": 0, "loss_rank_avg": 0.17590011656284332, "step": 2780, "valid_targets_mean": 4606.5, "valid_targets_min": 605 }, { "epoch": 4.113737075332349, "grad_norm": 0.4907659502885251, "learning_rate": 1.739251908969844e-05, "loss": 0.1695, "loss_nan_ranks": 0, "loss_rank_avg": 0.20186254382133484, "step": 2785, "valid_targets_mean": 4470.1, "valid_targets_min": 718 }, { "epoch": 4.121122599704579, "grad_norm": 0.3933868369919279, "learning_rate": 1.7319505783756248e-05, "loss": 0.1409, "loss_nan_ranks": 0, "loss_rank_avg": 0.12017552554607391, "step": 2790, "valid_targets_mean": 6450.1, "valid_targets_min": 476 }, { "epoch": 4.128508124076809, "grad_norm": 0.4949323916381371, "learning_rate": 1.724652883716037e-05, "loss": 0.1629, "loss_nan_ranks": 0, "loss_rank_avg": 0.15612033009529114, "step": 2795, "valid_targets_mean": 4150.4, "valid_targets_min": 518 }, { "epoch": 4.13589364844904, "grad_norm": 0.40509378331922025, "learning_rate": 1.7173589239800673e-05, "loss": 0.1832, "loss_nan_ranks": 0, "loss_rank_avg": 0.22377564013004303, "step": 2800, "valid_targets_mean": 6398.9, "valid_targets_min": 838 }, { "epoch": 4.14327917282127, "grad_norm": 0.4108689853913775, "learning_rate": 1.7100687981060405e-05, "loss": 0.1789, "loss_nan_ranks": 0, "loss_rank_avg": 0.1769275963306427, "step": 2805, "valid_targets_mean": 6090.0, "valid_targets_min": 1026 }, { "epoch": 4.150664697193501, "grad_norm": 0.5162692493811, "learning_rate": 1.7027826049802787e-05, "loss": 0.1752, "loss_nan_ranks": 0, "loss_rank_avg": 0.1626986861228943, "step": 2810, "valid_targets_mean": 3471.9, "valid_targets_min": 454 }, { "epoch": 4.158050221565731, "grad_norm": 0.5312767885071268, "learning_rate": 1.6955004434357557e-05, "loss": 0.1841, "loss_nan_ranks": 0, "loss_rank_avg": 0.20601385831832886, "step": 2815, "valid_targets_mean": 4762.1, "valid_targets_min": 355 }, { "epoch": 4.165435745937962, "grad_norm": 0.4235145894913193, "learning_rate": 1.6882224122507617e-05, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.1396898776292801, "step": 2820, "valid_targets_mean": 5606.3, "valid_targets_min": 456 }, { "epoch": 4.172821270310192, "grad_norm": 0.416756640748203, "learning_rate": 1.6809486101475595e-05, "loss": 0.1631, "loss_nan_ranks": 0, "loss_rank_avg": 0.21778830885887146, "step": 2825, "valid_targets_mean": 7377.4, "valid_targets_min": 657 }, { "epoch": 4.180206794682422, "grad_norm": 0.5252822718202776, "learning_rate": 1.673679135791049e-05, "loss": 0.177, "loss_nan_ranks": 0, "loss_rank_avg": 0.19100016355514526, "step": 2830, "valid_targets_mean": 4078.6, "valid_targets_min": 584 }, { "epoch": 4.1875923190546525, "grad_norm": 0.529831098741841, "learning_rate": 1.6664140877874245e-05, "loss": 0.1645, "loss_nan_ranks": 0, "loss_rank_avg": 0.18276384472846985, "step": 2835, "valid_targets_mean": 3844.6, "valid_targets_min": 532 }, { "epoch": 4.194977843426884, "grad_norm": 0.3492533131434477, "learning_rate": 1.65915356468284e-05, "loss": 0.1474, "loss_nan_ranks": 0, "loss_rank_avg": 0.11477085202932358, "step": 2840, "valid_targets_mean": 7473.1, "valid_targets_min": 829 }, { "epoch": 4.202363367799114, "grad_norm": 0.46188579373201377, "learning_rate": 1.651897664962072e-05, "loss": 0.1623, "loss_nan_ranks": 0, "loss_rank_avg": 0.15958110988140106, "step": 2845, "valid_targets_mean": 4629.6, "valid_targets_min": 477 }, { "epoch": 4.209748892171344, "grad_norm": 0.36990404396979687, "learning_rate": 1.644646487047184e-05, "loss": 0.1547, "loss_nan_ranks": 0, "loss_rank_avg": 0.1521548181772232, "step": 2850, "valid_targets_mean": 7015.2, "valid_targets_min": 861 }, { "epoch": 4.2171344165435745, "grad_norm": 0.4062689203699344, "learning_rate": 1.6374001292961915e-05, "loss": 0.1548, "loss_nan_ranks": 0, "loss_rank_avg": 0.1495155543088913, "step": 2855, "valid_targets_mean": 5666.6, "valid_targets_min": 760 }, { "epoch": 4.224519940915805, "grad_norm": 0.4252533883734268, "learning_rate": 1.630158690001723e-05, "loss": 0.1794, "loss_nan_ranks": 0, "loss_rank_avg": 0.17348308861255646, "step": 2860, "valid_targets_mean": 5389.8, "valid_targets_min": 461 }, { "epoch": 4.231905465288035, "grad_norm": 0.44977416984855956, "learning_rate": 1.6229222673896977e-05, "loss": 0.1767, "loss_nan_ranks": 0, "loss_rank_avg": 0.19169771671295166, "step": 2865, "valid_targets_mean": 6240.2, "valid_targets_min": 648 }, { "epoch": 4.239290989660266, "grad_norm": 0.517268002202166, "learning_rate": 1.615690959617981e-05, "loss": 0.1882, "loss_nan_ranks": 0, "loss_rank_avg": 0.1724705845117569, "step": 2870, "valid_targets_mean": 4480.9, "valid_targets_min": 546 }, { "epoch": 4.2466765140324965, "grad_norm": 0.5034227859483678, "learning_rate": 1.608464864775061e-05, "loss": 0.1597, "loss_nan_ranks": 0, "loss_rank_avg": 0.15206247568130493, "step": 2875, "valid_targets_mean": 5756.9, "valid_targets_min": 883 }, { "epoch": 4.254062038404727, "grad_norm": 0.3934998046892, "learning_rate": 1.601244080878715e-05, "loss": 0.1657, "loss_nan_ranks": 0, "loss_rank_avg": 0.1561555415391922, "step": 2880, "valid_targets_mean": 7151.8, "valid_targets_min": 637 }, { "epoch": 4.261447562776957, "grad_norm": 0.4021841720607587, "learning_rate": 1.5940287058746805e-05, "loss": 0.1617, "loss_nan_ranks": 0, "loss_rank_avg": 0.14158207178115845, "step": 2885, "valid_targets_mean": 4988.3, "valid_targets_min": 691 }, { "epoch": 4.268833087149187, "grad_norm": 0.6182741776921272, "learning_rate": 1.5868188376353258e-05, "loss": 0.1666, "loss_nan_ranks": 0, "loss_rank_avg": 0.1992129683494568, "step": 2890, "valid_targets_mean": 5678.7, "valid_targets_min": 778 }, { "epoch": 4.2762186115214185, "grad_norm": 0.4614176577748903, "learning_rate": 1.579614573958324e-05, "loss": 0.161, "loss_nan_ranks": 0, "loss_rank_avg": 0.17441459000110626, "step": 2895, "valid_targets_mean": 5331.5, "valid_targets_min": 324 }, { "epoch": 4.283604135893649, "grad_norm": 0.5039839970397774, "learning_rate": 1.5724160125653253e-05, "loss": 0.1745, "loss_nan_ranks": 0, "loss_rank_avg": 0.18613968789577484, "step": 2900, "valid_targets_mean": 4360.8, "valid_targets_min": 575 }, { "epoch": 4.290989660265879, "grad_norm": 0.56591190309574, "learning_rate": 1.5652232511006313e-05, "loss": 0.1898, "loss_nan_ranks": 0, "loss_rank_avg": 0.21027769148349762, "step": 2905, "valid_targets_mean": 3856.9, "valid_targets_min": 362 }, { "epoch": 4.298375184638109, "grad_norm": 0.5045039977125617, "learning_rate": 1.5580363871298713e-05, "loss": 0.1775, "loss_nan_ranks": 0, "loss_rank_avg": 0.15514475107192993, "step": 2910, "valid_targets_mean": 4200.1, "valid_targets_min": 425 }, { "epoch": 4.30576070901034, "grad_norm": 0.5630509270539151, "learning_rate": 1.550855518138679e-05, "loss": 0.1649, "loss_nan_ranks": 0, "loss_rank_avg": 0.2181616574525833, "step": 2915, "valid_targets_mean": 3684.9, "valid_targets_min": 668 }, { "epoch": 4.31314623338257, "grad_norm": 0.50018909523244, "learning_rate": 1.543680741531368e-05, "loss": 0.1833, "loss_nan_ranks": 0, "loss_rank_avg": 0.1719134896993637, "step": 2920, "valid_targets_mean": 4710.3, "valid_targets_min": 575 }, { "epoch": 4.3205317577548, "grad_norm": 0.446233266875378, "learning_rate": 1.536512154629615e-05, "loss": 0.1641, "loss_nan_ranks": 0, "loss_rank_avg": 0.15354609489440918, "step": 2925, "valid_targets_mean": 4676.2, "valid_targets_min": 538 }, { "epoch": 4.327917282127031, "grad_norm": 0.4418361621253541, "learning_rate": 1.5293498546711347e-05, "loss": 0.1814, "loss_nan_ranks": 0, "loss_rank_avg": 0.21994024515151978, "step": 2930, "valid_targets_mean": 5910.9, "valid_targets_min": 541 }, { "epoch": 4.335302806499262, "grad_norm": 0.43246616750276806, "learning_rate": 1.5221939388083638e-05, "loss": 0.1754, "loss_nan_ranks": 0, "loss_rank_avg": 0.14813780784606934, "step": 2935, "valid_targets_mean": 5155.4, "valid_targets_min": 608 }, { "epoch": 4.342688330871492, "grad_norm": 0.5184902584890491, "learning_rate": 1.5150445041071418e-05, "loss": 0.18, "loss_nan_ranks": 0, "loss_rank_avg": 0.18272896111011505, "step": 2940, "valid_targets_mean": 3901.2, "valid_targets_min": 708 }, { "epoch": 4.350073855243722, "grad_norm": 0.46142756709679333, "learning_rate": 1.5079016475453974e-05, "loss": 0.1653, "loss_nan_ranks": 0, "loss_rank_avg": 0.15337729454040527, "step": 2945, "valid_targets_mean": 4455.8, "valid_targets_min": 477 }, { "epoch": 4.357459379615952, "grad_norm": 0.4202013962683297, "learning_rate": 1.500765466011827e-05, "loss": 0.1425, "loss_nan_ranks": 0, "loss_rank_avg": 0.14253225922584534, "step": 2950, "valid_targets_mean": 5328.2, "valid_targets_min": 747 }, { "epoch": 4.364844903988184, "grad_norm": 0.4223795000780752, "learning_rate": 1.4936360563045863e-05, "loss": 0.1582, "loss_nan_ranks": 0, "loss_rank_avg": 0.1546299159526825, "step": 2955, "valid_targets_mean": 4801.2, "valid_targets_min": 228 }, { "epoch": 4.372230428360414, "grad_norm": 0.5947413428907822, "learning_rate": 1.4865135151299756e-05, "loss": 0.1765, "loss_nan_ranks": 0, "loss_rank_avg": 0.18521949648857117, "step": 2960, "valid_targets_mean": 3601.5, "valid_targets_min": 481 }, { "epoch": 4.379615952732644, "grad_norm": 0.4824214614001069, "learning_rate": 1.4793979391011264e-05, "loss": 0.1589, "loss_nan_ranks": 0, "loss_rank_avg": 0.1658276468515396, "step": 2965, "valid_targets_mean": 4537.8, "valid_targets_min": 596 }, { "epoch": 4.387001477104874, "grad_norm": 0.4535168608231596, "learning_rate": 1.4722894247366925e-05, "loss": 0.1679, "loss_nan_ranks": 0, "loss_rank_avg": 0.17292077839374542, "step": 2970, "valid_targets_mean": 4852.9, "valid_targets_min": 215 }, { "epoch": 4.394387001477105, "grad_norm": 0.43921335228854064, "learning_rate": 1.4651880684595394e-05, "loss": 0.1775, "loss_nan_ranks": 0, "loss_rank_avg": 0.18284352123737335, "step": 2975, "valid_targets_mean": 5821.1, "valid_targets_min": 552 }, { "epoch": 4.401772525849335, "grad_norm": 0.47059015487422473, "learning_rate": 1.4580939665954396e-05, "loss": 0.1699, "loss_nan_ranks": 0, "loss_rank_avg": 0.1612253487110138, "step": 2980, "valid_targets_mean": 4167.0, "valid_targets_min": 686 }, { "epoch": 4.409158050221565, "grad_norm": 0.6361271510225736, "learning_rate": 1.4510072153717613e-05, "loss": 0.1566, "loss_nan_ranks": 0, "loss_rank_avg": 0.17631939053535461, "step": 2985, "valid_targets_mean": 3730.2, "valid_targets_min": 626 }, { "epoch": 4.416543574593796, "grad_norm": 0.4847929947491163, "learning_rate": 1.4439279109161673e-05, "loss": 0.1655, "loss_nan_ranks": 0, "loss_rank_avg": 0.16035814583301544, "step": 2990, "valid_targets_mean": 4219.9, "valid_targets_min": 652 }, { "epoch": 4.423929098966027, "grad_norm": 0.4246728217669771, "learning_rate": 1.4368561492553074e-05, "loss": 0.1704, "loss_nan_ranks": 0, "loss_rank_avg": 0.19435647130012512, "step": 2995, "valid_targets_mean": 5936.1, "valid_targets_min": 615 }, { "epoch": 4.431314623338257, "grad_norm": 0.5841115607984504, "learning_rate": 1.4297920263135194e-05, "loss": 0.1726, "loss_nan_ranks": 0, "loss_rank_avg": 0.18300238251686096, "step": 3000, "valid_targets_mean": 3174.0, "valid_targets_min": 355 }, { "epoch": 4.438700147710487, "grad_norm": 0.44672860156890554, "learning_rate": 1.4227356379115256e-05, "loss": 0.1536, "loss_nan_ranks": 0, "loss_rank_avg": 0.18793809413909912, "step": 3005, "valid_targets_mean": 5597.8, "valid_targets_min": 879 }, { "epoch": 4.4460856720827175, "grad_norm": 0.38476310411513204, "learning_rate": 1.4156870797651343e-05, "loss": 0.1649, "loss_nan_ranks": 0, "loss_rank_avg": 0.1833447515964508, "step": 3010, "valid_targets_mean": 6966.1, "valid_targets_min": 506 }, { "epoch": 4.453471196454949, "grad_norm": 0.42279572173644614, "learning_rate": 1.4086464474839399e-05, "loss": 0.1927, "loss_nan_ranks": 0, "loss_rank_avg": 0.1899091899394989, "step": 3015, "valid_targets_mean": 5839.3, "valid_targets_min": 816 }, { "epoch": 4.460856720827179, "grad_norm": 0.44031418366204805, "learning_rate": 1.4016138365700283e-05, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.17797401547431946, "step": 3020, "valid_targets_mean": 6834.4, "valid_targets_min": 628 }, { "epoch": 4.468242245199409, "grad_norm": 0.48920064870797775, "learning_rate": 1.3945893424166799e-05, "loss": 0.1684, "loss_nan_ranks": 0, "loss_rank_avg": 0.18216978013515472, "step": 3025, "valid_targets_mean": 4377.6, "valid_targets_min": 573 }, { "epoch": 4.4756277695716395, "grad_norm": 0.4860440678191081, "learning_rate": 1.3875730603070755e-05, "loss": 0.1687, "loss_nan_ranks": 0, "loss_rank_avg": 0.17842218279838562, "step": 3030, "valid_targets_mean": 4298.3, "valid_targets_min": 519 }, { "epoch": 4.48301329394387, "grad_norm": 0.5122645397551936, "learning_rate": 1.3805650854130042e-05, "loss": 0.1679, "loss_nan_ranks": 0, "loss_rank_avg": 0.16408318281173706, "step": 3035, "valid_targets_mean": 5356.2, "valid_targets_min": 612 }, { "epoch": 4.4903988183161, "grad_norm": 0.5777970599819502, "learning_rate": 1.3735655127935727e-05, "loss": 0.1673, "loss_nan_ranks": 0, "loss_rank_avg": 0.18035376071929932, "step": 3040, "valid_targets_mean": 3534.7, "valid_targets_min": 510 }, { "epoch": 4.497784342688331, "grad_norm": 0.40634258250665284, "learning_rate": 1.3665744373939165e-05, "loss": 0.1568, "loss_nan_ranks": 0, "loss_rank_avg": 0.1392553746700287, "step": 3045, "valid_targets_mean": 6123.2, "valid_targets_min": 768 }, { "epoch": 4.5051698670605616, "grad_norm": 0.4222640132338195, "learning_rate": 1.3595919540439098e-05, "loss": 0.1582, "loss_nan_ranks": 0, "loss_rank_avg": 0.15259933471679688, "step": 3050, "valid_targets_mean": 4889.3, "valid_targets_min": 475 }, { "epoch": 4.512555391432792, "grad_norm": 0.42710032158994776, "learning_rate": 1.352618157456882e-05, "loss": 0.1746, "loss_nan_ranks": 0, "loss_rank_avg": 0.1755707710981369, "step": 3055, "valid_targets_mean": 5323.7, "valid_targets_min": 573 }, { "epoch": 4.519940915805022, "grad_norm": 0.4546554151450125, "learning_rate": 1.3456531422283314e-05, "loss": 0.1814, "loss_nan_ranks": 0, "loss_rank_avg": 0.16564080119132996, "step": 3060, "valid_targets_mean": 5748.6, "valid_targets_min": 635 }, { "epoch": 4.527326440177252, "grad_norm": 0.3920659302495498, "learning_rate": 1.3386970028346414e-05, "loss": 0.158, "loss_nan_ranks": 0, "loss_rank_avg": 0.14143362641334534, "step": 3065, "valid_targets_mean": 6217.1, "valid_targets_min": 637 }, { "epoch": 4.534711964549483, "grad_norm": 0.6631096404799323, "learning_rate": 1.3317498336318001e-05, "loss": 0.1757, "loss_nan_ranks": 0, "loss_rank_avg": 0.14858531951904297, "step": 3070, "valid_targets_mean": 5357.5, "valid_targets_min": 802 }, { "epoch": 4.542097488921714, "grad_norm": 0.36924744404698256, "learning_rate": 1.3248117288541224e-05, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.15762075781822205, "step": 3075, "valid_targets_mean": 6748.7, "valid_targets_min": 1209 }, { "epoch": 4.549483013293944, "grad_norm": 0.4132566623757397, "learning_rate": 1.3178827826129653e-05, "loss": 0.1528, "loss_nan_ranks": 0, "loss_rank_avg": 0.15297694504261017, "step": 3080, "valid_targets_mean": 5218.4, "valid_targets_min": 629 }, { "epoch": 4.556868537666174, "grad_norm": 0.6105683360071116, "learning_rate": 1.3109630888954586e-05, "loss": 0.1953, "loss_nan_ranks": 0, "loss_rank_avg": 0.18115362524986267, "step": 3085, "valid_targets_mean": 2799.2, "valid_targets_min": 518 }, { "epoch": 4.564254062038405, "grad_norm": 0.4312209357104268, "learning_rate": 1.3040527415632264e-05, "loss": 0.1705, "loss_nan_ranks": 0, "loss_rank_avg": 0.13422748446464539, "step": 3090, "valid_targets_mean": 5207.3, "valid_targets_min": 750 }, { "epoch": 4.571639586410635, "grad_norm": 0.5345112264129266, "learning_rate": 1.297151834351115e-05, "loss": 0.1813, "loss_nan_ranks": 0, "loss_rank_avg": 0.2037266194820404, "step": 3095, "valid_targets_mean": 4426.9, "valid_targets_min": 584 }, { "epoch": 4.579025110782865, "grad_norm": 0.48644514959603063, "learning_rate": 1.2902604608659195e-05, "loss": 0.1647, "loss_nan_ranks": 0, "loss_rank_avg": 0.19521738588809967, "step": 3100, "valid_targets_mean": 4656.5, "valid_targets_min": 536 }, { "epoch": 4.586410635155096, "grad_norm": 0.4686584623782236, "learning_rate": 1.2833787145851164e-05, "loss": 0.1638, "loss_nan_ranks": 0, "loss_rank_avg": 0.16689223051071167, "step": 3105, "valid_targets_mean": 4490.6, "valid_targets_min": 675 }, { "epoch": 4.593796159527327, "grad_norm": 0.4343439566599933, "learning_rate": 1.2765066888555957e-05, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.19107720255851746, "step": 3110, "valid_targets_mean": 5998.3, "valid_targets_min": 735 }, { "epoch": 4.601181683899557, "grad_norm": 0.48092468519713316, "learning_rate": 1.2696444768923919e-05, "loss": 0.1721, "loss_nan_ranks": 0, "loss_rank_avg": 0.18640181422233582, "step": 3115, "valid_targets_mean": 4409.0, "valid_targets_min": 492 }, { "epoch": 4.608567208271787, "grad_norm": 0.3949210579717376, "learning_rate": 1.2627921717774236e-05, "loss": 0.189, "loss_nan_ranks": 0, "loss_rank_avg": 0.16668841242790222, "step": 3120, "valid_targets_mean": 6662.4, "valid_targets_min": 375 }, { "epoch": 4.6159527326440175, "grad_norm": 0.3653101251021582, "learning_rate": 1.2559498664582259e-05, "loss": 0.1707, "loss_nan_ranks": 0, "loss_rank_avg": 0.17200833559036255, "step": 3125, "valid_targets_mean": 7024.5, "valid_targets_min": 691 }, { "epoch": 4.623338257016248, "grad_norm": 0.5353189616488072, "learning_rate": 1.2491176537466951e-05, "loss": 0.1665, "loss_nan_ranks": 0, "loss_rank_avg": 0.18706795573234558, "step": 3130, "valid_targets_mean": 3664.9, "valid_targets_min": 553 }, { "epoch": 4.630723781388479, "grad_norm": 0.48483146785334685, "learning_rate": 1.242295626317826e-05, "loss": 0.1757, "loss_nan_ranks": 0, "loss_rank_avg": 0.18977820873260498, "step": 3135, "valid_targets_mean": 4671.8, "valid_targets_min": 541 }, { "epoch": 4.638109305760709, "grad_norm": 0.4576012336580824, "learning_rate": 1.2354838767084563e-05, "loss": 0.1898, "loss_nan_ranks": 0, "loss_rank_avg": 0.1621273159980774, "step": 3140, "valid_targets_mean": 4912.6, "valid_targets_min": 547 }, { "epoch": 4.6454948301329395, "grad_norm": 0.47408165212071834, "learning_rate": 1.2286824973160103e-05, "loss": 0.1641, "loss_nan_ranks": 0, "loss_rank_avg": 0.14935819804668427, "step": 3145, "valid_targets_mean": 4476.2, "valid_targets_min": 654 }, { "epoch": 4.65288035450517, "grad_norm": 0.35823980053826326, "learning_rate": 1.2218915803972478e-05, "loss": 0.1848, "loss_nan_ranks": 0, "loss_rank_avg": 0.15744267404079437, "step": 3150, "valid_targets_mean": 6967.7, "valid_targets_min": 639 }, { "epoch": 4.6602658788774, "grad_norm": 0.3938649437885737, "learning_rate": 1.2151112180670097e-05, "loss": 0.1696, "loss_nan_ranks": 0, "loss_rank_avg": 0.15055982768535614, "step": 3155, "valid_targets_mean": 6357.4, "valid_targets_min": 2129 }, { "epoch": 4.66765140324963, "grad_norm": 0.4159919225396087, "learning_rate": 1.2083415022969712e-05, "loss": 0.1539, "loss_nan_ranks": 0, "loss_rank_avg": 0.1428435891866684, "step": 3160, "valid_targets_mean": 5190.1, "valid_targets_min": 589 }, { "epoch": 4.6750369276218615, "grad_norm": 0.321718436567835, "learning_rate": 1.2015825249143926e-05, "loss": 0.1475, "loss_nan_ranks": 0, "loss_rank_avg": 0.11123082041740417, "step": 3165, "valid_targets_mean": 6443.4, "valid_targets_min": 550 }, { "epoch": 4.682422451994092, "grad_norm": 0.5181376093279889, "learning_rate": 1.1948343776008738e-05, "loss": 0.1658, "loss_nan_ranks": 0, "loss_rank_avg": 0.18044036626815796, "step": 3170, "valid_targets_mean": 5152.0, "valid_targets_min": 476 }, { "epoch": 4.689807976366322, "grad_norm": 0.3835319842919287, "learning_rate": 1.1880971518911112e-05, "loss": 0.1832, "loss_nan_ranks": 0, "loss_rank_avg": 0.1430322527885437, "step": 3175, "valid_targets_mean": 5503.8, "valid_targets_min": 599 }, { "epoch": 4.697193500738552, "grad_norm": 0.38392579284693557, "learning_rate": 1.1813709391716568e-05, "loss": 0.162, "loss_nan_ranks": 0, "loss_rank_avg": 0.14627256989479065, "step": 3180, "valid_targets_mean": 6006.3, "valid_targets_min": 649 }, { "epoch": 4.704579025110783, "grad_norm": 0.4621220677999244, "learning_rate": 1.1746558306796776e-05, "loss": 0.1804, "loss_nan_ranks": 0, "loss_rank_avg": 0.17970584332942963, "step": 3185, "valid_targets_mean": 4955.9, "valid_targets_min": 676 }, { "epoch": 4.711964549483013, "grad_norm": 0.4500367333603124, "learning_rate": 1.1679519175017174e-05, "loss": 0.151, "loss_nan_ranks": 0, "loss_rank_avg": 0.14992380142211914, "step": 3190, "valid_targets_mean": 4324.4, "valid_targets_min": 615 }, { "epoch": 4.719350073855244, "grad_norm": 0.4306455292259303, "learning_rate": 1.161259290572462e-05, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.1760706901550293, "step": 3195, "valid_targets_mean": 5846.6, "valid_targets_min": 714 }, { "epoch": 4.726735598227474, "grad_norm": 0.5361598584911511, "learning_rate": 1.1545780406735081e-05, "loss": 0.1835, "loss_nan_ranks": 0, "loss_rank_avg": 0.16949506103992462, "step": 3200, "valid_targets_mean": 3808.7, "valid_targets_min": 608 }, { "epoch": 4.734121122599705, "grad_norm": 0.4278388705938128, "learning_rate": 1.1479082584321265e-05, "loss": 0.1646, "loss_nan_ranks": 0, "loss_rank_avg": 0.16112419962882996, "step": 3205, "valid_targets_mean": 5402.7, "valid_targets_min": 614 }, { "epoch": 4.741506646971935, "grad_norm": 0.4272816557388593, "learning_rate": 1.1412500343200384e-05, "loss": 0.1457, "loss_nan_ranks": 0, "loss_rank_avg": 0.13227397203445435, "step": 3210, "valid_targets_mean": 5582.8, "valid_targets_min": 229 }, { "epoch": 4.748892171344165, "grad_norm": 0.47634077338014624, "learning_rate": 1.1346034586521828e-05, "loss": 0.1659, "loss_nan_ranks": 0, "loss_rank_avg": 0.17866167426109314, "step": 3215, "valid_targets_mean": 4475.9, "valid_targets_min": 595 }, { "epoch": 4.7562776957163955, "grad_norm": 0.4344869468282722, "learning_rate": 1.127968621585497e-05, "loss": 0.1662, "loss_nan_ranks": 0, "loss_rank_avg": 0.15781113505363464, "step": 3220, "valid_targets_mean": 5149.8, "valid_targets_min": 702 }, { "epoch": 4.763663220088627, "grad_norm": 0.4467123123517859, "learning_rate": 1.1213456131176894e-05, "loss": 0.1815, "loss_nan_ranks": 0, "loss_rank_avg": 0.13696205615997314, "step": 3225, "valid_targets_mean": 4635.4, "valid_targets_min": 355 }, { "epoch": 4.771048744460857, "grad_norm": 0.6578561115499146, "learning_rate": 1.1147345230860225e-05, "loss": 0.1552, "loss_nan_ranks": 0, "loss_rank_avg": 0.1457718312740326, "step": 3230, "valid_targets_mean": 5075.1, "valid_targets_min": 380 }, { "epoch": 4.778434268833087, "grad_norm": 0.47187291081005306, "learning_rate": 1.1081354411660899e-05, "loss": 0.1941, "loss_nan_ranks": 0, "loss_rank_avg": 0.22649861872196198, "step": 3235, "valid_targets_mean": 5602.9, "valid_targets_min": 385 }, { "epoch": 4.7858197932053175, "grad_norm": 0.4585294146600305, "learning_rate": 1.1015484568706025e-05, "loss": 0.1694, "loss_nan_ranks": 0, "loss_rank_avg": 0.15446168184280396, "step": 3240, "valid_targets_mean": 4190.6, "valid_targets_min": 401 }, { "epoch": 4.793205317577548, "grad_norm": 0.4721836321102142, "learning_rate": 1.0949736595481748e-05, "loss": 0.1662, "loss_nan_ranks": 0, "loss_rank_avg": 0.16026848554611206, "step": 3245, "valid_targets_mean": 4162.0, "valid_targets_min": 211 }, { "epoch": 4.800590841949779, "grad_norm": 0.5097924145730403, "learning_rate": 1.0884111383821115e-05, "loss": 0.1841, "loss_nan_ranks": 0, "loss_rank_avg": 0.1608010232448578, "step": 3250, "valid_targets_mean": 4100.3, "valid_targets_min": 559 }, { "epoch": 4.807976366322009, "grad_norm": 0.5121344596400246, "learning_rate": 1.0818609823891988e-05, "loss": 0.1852, "loss_nan_ranks": 0, "loss_rank_avg": 0.18942126631736755, "step": 3255, "valid_targets_mean": 4584.4, "valid_targets_min": 529 }, { "epoch": 4.8153618906942395, "grad_norm": 0.39125128571958845, "learning_rate": 1.0753232804184944e-05, "loss": 0.1711, "loss_nan_ranks": 0, "loss_rank_avg": 0.1385767161846161, "step": 3260, "valid_targets_mean": 5840.9, "valid_targets_min": 696 }, { "epoch": 4.82274741506647, "grad_norm": 0.519147963569654, "learning_rate": 1.0687981211501286e-05, "loss": 0.1902, "loss_nan_ranks": 0, "loss_rank_avg": 0.13257870078086853, "step": 3265, "valid_targets_mean": 5252.2, "valid_targets_min": 832 }, { "epoch": 4.8301329394387, "grad_norm": 0.3882601827065478, "learning_rate": 1.0622855930940935e-05, "loss": 0.1788, "loss_nan_ranks": 0, "loss_rank_avg": 0.16074441373348236, "step": 3270, "valid_targets_mean": 5536.7, "valid_targets_min": 717 }, { "epoch": 4.83751846381093, "grad_norm": 0.5424919781622314, "learning_rate": 1.0557857845890486e-05, "loss": 0.1676, "loss_nan_ranks": 0, "loss_rank_avg": 0.19361868500709534, "step": 3275, "valid_targets_mean": 4543.6, "valid_targets_min": 246 }, { "epoch": 4.844903988183161, "grad_norm": 0.5134917623818339, "learning_rate": 1.049298783801118e-05, "loss": 0.1471, "loss_nan_ranks": 0, "loss_rank_avg": 0.1247122585773468, "step": 3280, "valid_targets_mean": 4817.4, "valid_targets_min": 457 }, { "epoch": 4.852289512555392, "grad_norm": 0.4500612814479838, "learning_rate": 1.0428246787226979e-05, "loss": 0.1748, "loss_nan_ranks": 0, "loss_rank_avg": 0.16459113359451294, "step": 3285, "valid_targets_mean": 4635.2, "valid_targets_min": 531 }, { "epoch": 4.859675036927622, "grad_norm": 0.4535219744538525, "learning_rate": 1.0363635571712614e-05, "loss": 0.1689, "loss_nan_ranks": 0, "loss_rank_avg": 0.16566744446754456, "step": 3290, "valid_targets_mean": 5096.8, "valid_targets_min": 592 }, { "epoch": 4.867060561299852, "grad_norm": 0.46962696061070613, "learning_rate": 1.0299155067881673e-05, "loss": 0.1642, "loss_nan_ranks": 0, "loss_rank_avg": 0.19553884863853455, "step": 3295, "valid_targets_mean": 5114.3, "valid_targets_min": 562 }, { "epoch": 4.874446085672083, "grad_norm": 0.39252568546578387, "learning_rate": 1.023480615037472e-05, "loss": 0.1541, "loss_nan_ranks": 0, "loss_rank_avg": 0.1575905829668045, "step": 3300, "valid_targets_mean": 5711.9, "valid_targets_min": 568 }, { "epoch": 4.881831610044313, "grad_norm": 4.133528284855488, "learning_rate": 1.0170589692047428e-05, "loss": 0.1493, "loss_nan_ranks": 0, "loss_rank_avg": 0.13656756281852722, "step": 3305, "valid_targets_mean": 4539.4, "valid_targets_min": 494 }, { "epoch": 4.889217134416544, "grad_norm": 0.5686494863470835, "learning_rate": 1.0106506563958733e-05, "loss": 0.1665, "loss_nan_ranks": 0, "loss_rank_avg": 0.19371378421783447, "step": 3310, "valid_targets_mean": 3573.2, "valid_targets_min": 430 }, { "epoch": 4.896602658788774, "grad_norm": 0.4402520543361477, "learning_rate": 1.0042557635359028e-05, "loss": 0.1663, "loss_nan_ranks": 0, "loss_rank_avg": 0.1665995717048645, "step": 3315, "valid_targets_mean": 5250.2, "valid_targets_min": 495 }, { "epoch": 4.903988183161005, "grad_norm": 0.41299530585836114, "learning_rate": 9.978743773678362e-06, "loss": 0.1636, "loss_nan_ranks": 0, "loss_rank_avg": 0.173518568277359, "step": 3320, "valid_targets_mean": 5918.4, "valid_targets_min": 583 }, { "epoch": 4.911373707533235, "grad_norm": 0.4208459436047827, "learning_rate": 9.915065844514688e-06, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.12593166530132294, "step": 3325, "valid_targets_mean": 5046.3, "valid_targets_min": 298 }, { "epoch": 4.918759231905465, "grad_norm": 0.5089228253284505, "learning_rate": 9.851524711622111e-06, "loss": 0.1642, "loss_nan_ranks": 0, "loss_rank_avg": 0.19019880890846252, "step": 3330, "valid_targets_mean": 4365.8, "valid_targets_min": 683 }, { "epoch": 4.926144756277695, "grad_norm": 0.3548181182634598, "learning_rate": 9.78812123689917e-06, "loss": 0.1662, "loss_nan_ranks": 0, "loss_rank_avg": 0.16198115050792694, "step": 3335, "valid_targets_mean": 7325.5, "valid_targets_min": 469 }, { "epoch": 4.933530280649926, "grad_norm": 0.4847190504144033, "learning_rate": 9.724856280377155e-06, "loss": 0.1718, "loss_nan_ranks": 0, "loss_rank_avg": 0.19115082919597626, "step": 3340, "valid_targets_mean": 4280.8, "valid_targets_min": 655 }, { "epoch": 4.940915805022157, "grad_norm": 0.45392216834170873, "learning_rate": 9.661730700208434e-06, "loss": 0.1774, "loss_nan_ranks": 0, "loss_rank_avg": 0.21955522894859314, "step": 3345, "valid_targets_mean": 4720.2, "valid_targets_min": 383 }, { "epoch": 4.948301329394387, "grad_norm": 0.38054470770168214, "learning_rate": 9.598745352654819e-06, "loss": 0.1718, "loss_nan_ranks": 0, "loss_rank_avg": 0.16042864322662354, "step": 3350, "valid_targets_mean": 5992.3, "valid_targets_min": 598 }, { "epoch": 4.955686853766617, "grad_norm": 0.4603546661973167, "learning_rate": 9.535901092075945e-06, "loss": 0.1739, "loss_nan_ranks": 0, "loss_rank_avg": 0.17585790157318115, "step": 3355, "valid_targets_mean": 4433.1, "valid_targets_min": 538 }, { "epoch": 4.963072378138848, "grad_norm": 0.4507007240993226, "learning_rate": 9.473198770917686e-06, "loss": 0.1651, "loss_nan_ranks": 0, "loss_rank_avg": 0.13589590787887573, "step": 3360, "valid_targets_mean": 5814.6, "valid_targets_min": 649 }, { "epoch": 4.970457902511078, "grad_norm": 0.42542002909001325, "learning_rate": 9.41063923970059e-06, "loss": 0.1647, "loss_nan_ranks": 0, "loss_rank_avg": 0.16971269249916077, "step": 3365, "valid_targets_mean": 5632.9, "valid_targets_min": 584 }, { "epoch": 4.977843426883309, "grad_norm": 0.6339824403474643, "learning_rate": 9.348223347008342e-06, "loss": 0.1862, "loss_nan_ranks": 0, "loss_rank_avg": 0.1671033501625061, "step": 3370, "valid_targets_mean": 6262.1, "valid_targets_min": 831 }, { "epoch": 4.985228951255539, "grad_norm": 0.4263518906101623, "learning_rate": 9.285951939476256e-06, "loss": 0.1488, "loss_nan_ranks": 0, "loss_rank_avg": 0.1599881947040558, "step": 3375, "valid_targets_mean": 4836.1, "valid_targets_min": 521 }, { "epoch": 4.99261447562777, "grad_norm": 0.4552157775554924, "learning_rate": 9.22382586177978e-06, "loss": 0.1549, "loss_nan_ranks": 0, "loss_rank_avg": 0.17859028279781342, "step": 3380, "valid_targets_mean": 5123.1, "valid_targets_min": 664 }, { "epoch": 5.0, "grad_norm": 0.42182388484726885, "learning_rate": 9.161845956623072e-06, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.125313863158226, "step": 3385, "valid_targets_mean": 5043.0, "valid_targets_min": 661 }, { "epoch": 5.00738552437223, "grad_norm": 0.4371353465408426, "learning_rate": 9.100013064727508e-06, "loss": 0.1752, "loss_nan_ranks": 0, "loss_rank_avg": 0.19350577890872955, "step": 3390, "valid_targets_mean": 6081.2, "valid_targets_min": 591 }, { "epoch": 5.014771048744461, "grad_norm": 0.444555503330858, "learning_rate": 9.038328024820342e-06, "loss": 0.1691, "loss_nan_ranks": 0, "loss_rank_avg": 0.2033313512802124, "step": 3395, "valid_targets_mean": 5863.6, "valid_targets_min": 499 }, { "epoch": 5.022156573116692, "grad_norm": 0.42165983760825365, "learning_rate": 8.976791673623289e-06, "loss": 0.1547, "loss_nan_ranks": 0, "loss_rank_avg": 0.15845409035682678, "step": 3400, "valid_targets_mean": 5640.8, "valid_targets_min": 546 }, { "epoch": 5.029542097488922, "grad_norm": 0.38297498375540073, "learning_rate": 8.915404845841194e-06, "loss": 0.1623, "loss_nan_ranks": 0, "loss_rank_avg": 0.11503148823976517, "step": 3405, "valid_targets_mean": 7132.4, "valid_targets_min": 592 }, { "epoch": 5.036927621861152, "grad_norm": 0.4953749429257958, "learning_rate": 8.8541683741507e-06, "loss": 0.1471, "loss_nan_ranks": 0, "loss_rank_avg": 0.14602802693843842, "step": 3410, "valid_targets_mean": 4715.0, "valid_targets_min": 539 }, { "epoch": 5.044313146233383, "grad_norm": 0.5095609371925762, "learning_rate": 8.793083089188953e-06, "loss": 0.168, "loss_nan_ranks": 0, "loss_rank_avg": 0.1521594226360321, "step": 3415, "valid_targets_mean": 4684.5, "valid_targets_min": 555 }, { "epoch": 5.051698670605613, "grad_norm": 0.4523371860610417, "learning_rate": 8.732149819542362e-06, "loss": 0.1603, "loss_nan_ranks": 0, "loss_rank_avg": 0.15225934982299805, "step": 3420, "valid_targets_mean": 5030.1, "valid_targets_min": 577 }, { "epoch": 5.059084194977843, "grad_norm": 0.5280342375496218, "learning_rate": 8.671369391735304e-06, "loss": 0.1385, "loss_nan_ranks": 0, "loss_rank_avg": 0.14403800666332245, "step": 3425, "valid_targets_mean": 5231.7, "valid_targets_min": 566 }, { "epoch": 5.066469719350074, "grad_norm": 0.40798873184330564, "learning_rate": 8.610742630218978e-06, "loss": 0.156, "loss_nan_ranks": 0, "loss_rank_avg": 0.13136714696884155, "step": 3430, "valid_targets_mean": 6256.9, "valid_targets_min": 613 }, { "epoch": 5.073855243722305, "grad_norm": 0.3861935517496378, "learning_rate": 8.550270357360149e-06, "loss": 0.1548, "loss_nan_ranks": 0, "loss_rank_avg": 0.12466324865818024, "step": 3435, "valid_targets_mean": 5849.4, "valid_targets_min": 642 }, { "epoch": 5.081240768094535, "grad_norm": 0.7401400100882837, "learning_rate": 8.489953393430066e-06, "loss": 0.1589, "loss_nan_ranks": 0, "loss_rank_avg": 0.1705418825149536, "step": 3440, "valid_targets_mean": 3559.2, "valid_targets_min": 490 }, { "epoch": 5.088626292466765, "grad_norm": 0.5193202825498705, "learning_rate": 8.429792556593293e-06, "loss": 0.1629, "loss_nan_ranks": 0, "loss_rank_avg": 0.22426575422286987, "step": 3445, "valid_targets_mean": 5109.2, "valid_targets_min": 496 }, { "epoch": 5.096011816838995, "grad_norm": 0.43168022491540325, "learning_rate": 8.36978866289661e-06, "loss": 0.1526, "loss_nan_ranks": 0, "loss_rank_avg": 0.17360247671604156, "step": 3450, "valid_targets_mean": 5924.7, "valid_targets_min": 690 }, { "epoch": 5.103397341211226, "grad_norm": 0.5111277913511018, "learning_rate": 8.309942526257982e-06, "loss": 0.1451, "loss_nan_ranks": 0, "loss_rank_avg": 0.14671558141708374, "step": 3455, "valid_targets_mean": 4076.2, "valid_targets_min": 552 }, { "epoch": 5.110782865583457, "grad_norm": 0.3745220484810527, "learning_rate": 8.250254958455466e-06, "loss": 0.1571, "loss_nan_ranks": 0, "loss_rank_avg": 0.13649728894233704, "step": 3460, "valid_targets_mean": 6392.8, "valid_targets_min": 953 }, { "epoch": 5.118168389955687, "grad_norm": 0.41895740102958157, "learning_rate": 8.19072676911623e-06, "loss": 0.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.16213387250900269, "step": 3465, "valid_targets_mean": 5501.8, "valid_targets_min": 563 }, { "epoch": 5.125553914327917, "grad_norm": 0.4621969274320497, "learning_rate": 8.13135876570557e-06, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.1634249985218048, "step": 3470, "valid_targets_mean": 5318.6, "valid_targets_min": 739 }, { "epoch": 5.132939438700148, "grad_norm": 0.5101384366926183, "learning_rate": 8.072151753515963e-06, "loss": 0.1665, "loss_nan_ranks": 0, "loss_rank_avg": 0.18241387605667114, "step": 3475, "valid_targets_mean": 4392.2, "valid_targets_min": 589 }, { "epoch": 5.140324963072378, "grad_norm": 0.435494385133351, "learning_rate": 8.013106535656098e-06, "loss": 0.1415, "loss_nan_ranks": 0, "loss_rank_avg": 0.15624777972698212, "step": 3480, "valid_targets_mean": 5854.9, "valid_targets_min": 671 }, { "epoch": 5.147710487444608, "grad_norm": 0.45540841610405663, "learning_rate": 7.954223913040052e-06, "loss": 0.1537, "loss_nan_ranks": 0, "loss_rank_avg": 0.16797244548797607, "step": 3485, "valid_targets_mean": 6307.3, "valid_targets_min": 650 }, { "epoch": 5.155096011816839, "grad_norm": 0.435797126087404, "learning_rate": 7.895504684376387e-06, "loss": 0.1686, "loss_nan_ranks": 0, "loss_rank_avg": 0.20473451912403107, "step": 3490, "valid_targets_mean": 6468.6, "valid_targets_min": 688 }, { "epoch": 5.16248153618907, "grad_norm": 0.4658949563928541, "learning_rate": 7.836949646157317e-06, "loss": 0.1628, "loss_nan_ranks": 0, "loss_rank_avg": 0.23565639555454254, "step": 3495, "valid_targets_mean": 5807.4, "valid_targets_min": 471 }, { "epoch": 5.1698670605613, "grad_norm": 0.6532185606945251, "learning_rate": 7.778559592647903e-06, "loss": 0.1461, "loss_nan_ranks": 0, "loss_rank_avg": 0.15222051739692688, "step": 3500, "valid_targets_mean": 5615.7, "valid_targets_min": 583 }, { "epoch": 5.17725258493353, "grad_norm": 0.37994849707269074, "learning_rate": 7.720335315875286e-06, "loss": 0.1522, "loss_nan_ranks": 0, "loss_rank_avg": 0.11698979139328003, "step": 3505, "valid_targets_mean": 6916.1, "valid_targets_min": 303 }, { "epoch": 5.1846381093057605, "grad_norm": 0.4867862414276969, "learning_rate": 7.662277605617952e-06, "loss": 0.1566, "loss_nan_ranks": 0, "loss_rank_avg": 0.15551450848579407, "step": 3510, "valid_targets_mean": 5208.1, "valid_targets_min": 692 }, { "epoch": 5.192023633677991, "grad_norm": 0.5261180668274233, "learning_rate": 7.604387249394991e-06, "loss": 0.1883, "loss_nan_ranks": 0, "loss_rank_avg": 0.17861658334732056, "step": 3515, "valid_targets_mean": 4572.2, "valid_targets_min": 643 }, { "epoch": 5.199409158050222, "grad_norm": 0.5013761956045906, "learning_rate": 7.546665032455458e-06, "loss": 0.1742, "loss_nan_ranks": 0, "loss_rank_avg": 0.24076738953590393, "step": 3520, "valid_targets_mean": 5969.2, "valid_targets_min": 952 }, { "epoch": 5.206794682422452, "grad_norm": 0.44388940849901665, "learning_rate": 7.4891117377676555e-06, "loss": 0.1746, "loss_nan_ranks": 0, "loss_rank_avg": 0.1808503419160843, "step": 3525, "valid_targets_mean": 5442.9, "valid_targets_min": 831 }, { "epoch": 5.2141802067946825, "grad_norm": 0.3368141280700644, "learning_rate": 7.431728146008603e-06, "loss": 0.1428, "loss_nan_ranks": 0, "loss_rank_avg": 0.12330228835344315, "step": 3530, "valid_targets_mean": 7554.9, "valid_targets_min": 804 }, { "epoch": 5.221565731166913, "grad_norm": 0.47194572305530047, "learning_rate": 7.3745150355533665e-06, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.1410825550556183, "step": 3535, "valid_targets_mean": 4599.2, "valid_targets_min": 521 }, { "epoch": 5.228951255539143, "grad_norm": 0.4589841119409957, "learning_rate": 7.317473182464543e-06, "loss": 0.1592, "loss_nan_ranks": 0, "loss_rank_avg": 0.14487279951572418, "step": 3540, "valid_targets_mean": 5436.2, "valid_targets_min": 472 }, { "epoch": 5.236336779911373, "grad_norm": 0.5079352080568156, "learning_rate": 7.260603360481719e-06, "loss": 0.1661, "loss_nan_ranks": 0, "loss_rank_avg": 0.177564337849617, "step": 3545, "valid_targets_mean": 4225.0, "valid_targets_min": 441 }, { "epoch": 5.2437223042836045, "grad_norm": 0.4124981604846651, "learning_rate": 7.20390634101098e-06, "loss": 0.1628, "loss_nan_ranks": 0, "loss_rank_avg": 0.20939132571220398, "step": 3550, "valid_targets_mean": 7137.3, "valid_targets_min": 425 }, { "epoch": 5.251107828655835, "grad_norm": 0.4748050711224649, "learning_rate": 7.147382893114447e-06, "loss": 0.1561, "loss_nan_ranks": 0, "loss_rank_avg": 0.15160918235778809, "step": 3555, "valid_targets_mean": 5582.1, "valid_targets_min": 508 }, { "epoch": 5.258493353028065, "grad_norm": 0.49570642663047704, "learning_rate": 7.091033783499843e-06, "loss": 0.1547, "loss_nan_ranks": 0, "loss_rank_avg": 0.1662381887435913, "step": 3560, "valid_targets_mean": 4688.8, "valid_targets_min": 412 }, { "epoch": 5.265878877400295, "grad_norm": 0.6444535354021959, "learning_rate": 7.034859776510094e-06, "loss": 0.164, "loss_nan_ranks": 0, "loss_rank_avg": 0.18472233414649963, "step": 3565, "valid_targets_mean": 2869.7, "valid_targets_min": 358 }, { "epoch": 5.273264401772526, "grad_norm": 0.36003282906413414, "learning_rate": 6.978861634112959e-06, "loss": 0.1626, "loss_nan_ranks": 0, "loss_rank_avg": 0.11764170229434967, "step": 3570, "valid_targets_mean": 7215.8, "valid_targets_min": 714 }, { "epoch": 5.280649926144756, "grad_norm": 0.4363348321964383, "learning_rate": 6.923040115890698e-06, "loss": 0.1646, "loss_nan_ranks": 0, "loss_rank_avg": 0.14421112835407257, "step": 3575, "valid_targets_mean": 5132.3, "valid_targets_min": 731 }, { "epoch": 5.288035450516987, "grad_norm": 0.4270407605139215, "learning_rate": 6.867395979029763e-06, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.15610837936401367, "step": 3580, "valid_targets_mean": 5726.0, "valid_targets_min": 524 }, { "epoch": 5.295420974889217, "grad_norm": 0.4372448860288484, "learning_rate": 6.8119299783105384e-06, "loss": 0.1516, "loss_nan_ranks": 0, "loss_rank_avg": 0.1485387682914734, "step": 3585, "valid_targets_mean": 5501.2, "valid_targets_min": 798 }, { "epoch": 5.302806499261448, "grad_norm": 0.49670165229019625, "learning_rate": 6.756642866097087e-06, "loss": 0.1727, "loss_nan_ranks": 0, "loss_rank_avg": 0.21197667717933655, "step": 3590, "valid_targets_mean": 4981.1, "valid_targets_min": 593 }, { "epoch": 5.310192023633678, "grad_norm": 0.4873247420128096, "learning_rate": 6.701535392326959e-06, "loss": 0.1511, "loss_nan_ranks": 0, "loss_rank_avg": 0.14547309279441833, "step": 3595, "valid_targets_mean": 4563.1, "valid_targets_min": 619 }, { "epoch": 5.317577548005908, "grad_norm": 0.4104843544339754, "learning_rate": 6.646608304501008e-06, "loss": 0.149, "loss_nan_ranks": 0, "loss_rank_avg": 0.16900783777236938, "step": 3600, "valid_targets_mean": 6581.2, "valid_targets_min": 764 }, { "epoch": 5.3249630723781385, "grad_norm": 0.47195907463014314, "learning_rate": 6.591862347673257e-06, "loss": 0.1699, "loss_nan_ranks": 0, "loss_rank_avg": 0.1981767863035202, "step": 3605, "valid_targets_mean": 4831.9, "valid_targets_min": 710 }, { "epoch": 5.33234859675037, "grad_norm": 0.542224951252824, "learning_rate": 6.537298264440813e-06, "loss": 0.1658, "loss_nan_ranks": 0, "loss_rank_avg": 0.19629326462745667, "step": 3610, "valid_targets_mean": 3798.4, "valid_targets_min": 432 }, { "epoch": 5.3397341211226, "grad_norm": 0.35804884095064315, "learning_rate": 6.482916794933736e-06, "loss": 0.141, "loss_nan_ranks": 0, "loss_rank_avg": 0.12061704695224762, "step": 3615, "valid_targets_mean": 6460.8, "valid_targets_min": 638 }, { "epoch": 5.34711964549483, "grad_norm": 0.49330966651853386, "learning_rate": 6.428718676805065e-06, "loss": 0.1817, "loss_nan_ranks": 0, "loss_rank_avg": 0.21051400899887085, "step": 3620, "valid_targets_mean": 4860.2, "valid_targets_min": 433 }, { "epoch": 5.3545051698670605, "grad_norm": 0.5321457303177618, "learning_rate": 6.374704645220775e-06, "loss": 0.1639, "loss_nan_ranks": 0, "loss_rank_avg": 0.1549859642982483, "step": 3625, "valid_targets_mean": 3886.5, "valid_targets_min": 466 }, { "epoch": 5.361890694239291, "grad_norm": 0.39489790904559613, "learning_rate": 6.320875432849816e-06, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.1310429573059082, "step": 3630, "valid_targets_mean": 7088.1, "valid_targets_min": 584 }, { "epoch": 5.369276218611521, "grad_norm": 0.45105096964297986, "learning_rate": 6.2672317698541695e-06, "loss": 0.1533, "loss_nan_ranks": 0, "loss_rank_avg": 0.1540766954421997, "step": 3635, "valid_targets_mean": 4639.0, "valid_targets_min": 560 }, { "epoch": 5.376661742983752, "grad_norm": 0.4753836438289837, "learning_rate": 6.213774383878945e-06, "loss": 0.1542, "loss_nan_ranks": 0, "loss_rank_avg": 0.12997017800807953, "step": 3640, "valid_targets_mean": 5125.3, "valid_targets_min": 526 }, { "epoch": 5.3840472673559825, "grad_norm": 0.5042444574219167, "learning_rate": 6.1605040000425285e-06, "loss": 0.1538, "loss_nan_ranks": 0, "loss_rank_avg": 0.13099181652069092, "step": 3645, "valid_targets_mean": 5819.9, "valid_targets_min": 490 }, { "epoch": 5.391432791728213, "grad_norm": 0.3863263579045339, "learning_rate": 6.107421340926716e-06, "loss": 0.1466, "loss_nan_ranks": 0, "loss_rank_avg": 0.16232043504714966, "step": 3650, "valid_targets_mean": 6967.1, "valid_targets_min": 901 }, { "epoch": 5.398818316100443, "grad_norm": 0.5220422627235417, "learning_rate": 6.054527126566933e-06, "loss": 0.1519, "loss_nan_ranks": 0, "loss_rank_avg": 0.16426241397857666, "step": 3655, "valid_targets_mean": 4679.2, "valid_targets_min": 716 }, { "epoch": 5.406203840472673, "grad_norm": 0.4319185540338788, "learning_rate": 6.0018220744424495e-06, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.1663556545972824, "step": 3660, "valid_targets_mean": 6097.4, "valid_targets_min": 602 }, { "epoch": 5.413589364844904, "grad_norm": 0.3956255035616646, "learning_rate": 5.949306899466672e-06, "loss": 0.1511, "loss_nan_ranks": 0, "loss_rank_avg": 0.14825277030467987, "step": 3665, "valid_targets_mean": 6583.9, "valid_targets_min": 691 }, { "epoch": 5.420974889217135, "grad_norm": 0.484584083668749, "learning_rate": 5.8969823139774304e-06, "loss": 0.1629, "loss_nan_ranks": 0, "loss_rank_avg": 0.19931569695472717, "step": 3670, "valid_targets_mean": 4773.4, "valid_targets_min": 597 }, { "epoch": 5.428360413589365, "grad_norm": 0.45434367771112616, "learning_rate": 5.844849027727313e-06, "loss": 0.1773, "loss_nan_ranks": 0, "loss_rank_avg": 0.19150590896606445, "step": 3675, "valid_targets_mean": 5992.9, "valid_targets_min": 505 }, { "epoch": 5.435745937961595, "grad_norm": 0.6026865956309536, "learning_rate": 5.792907747874068e-06, "loss": 0.156, "loss_nan_ranks": 0, "loss_rank_avg": 0.16173362731933594, "step": 3680, "valid_targets_mean": 4554.5, "valid_targets_min": 573 }, { "epoch": 5.443131462333826, "grad_norm": 0.40334097093396654, "learning_rate": 5.741159178970958e-06, "loss": 0.1551, "loss_nan_ranks": 0, "loss_rank_avg": 0.15286067128181458, "step": 3685, "valid_targets_mean": 6434.6, "valid_targets_min": 894 }, { "epoch": 5.450516986706056, "grad_norm": 0.42746203298644087, "learning_rate": 5.689604022957256e-06, "loss": 0.1655, "loss_nan_ranks": 0, "loss_rank_avg": 0.1851692497730255, "step": 3690, "valid_targets_mean": 6208.4, "valid_targets_min": 584 }, { "epoch": 5.457902511078286, "grad_norm": 0.48488271400781807, "learning_rate": 5.638242979148685e-06, "loss": 0.1782, "loss_nan_ranks": 0, "loss_rank_avg": 0.17530173063278198, "step": 3695, "valid_targets_mean": 4681.8, "valid_targets_min": 369 }, { "epoch": 5.465288035450517, "grad_norm": 0.49213245126776284, "learning_rate": 5.587076744227966e-06, "loss": 0.1613, "loss_nan_ranks": 0, "loss_rank_avg": 0.1436440646648407, "step": 3700, "valid_targets_mean": 4852.8, "valid_targets_min": 349 }, { "epoch": 5.472673559822748, "grad_norm": 0.5385593413242621, "learning_rate": 5.536106012235329e-06, "loss": 0.1796, "loss_nan_ranks": 0, "loss_rank_avg": 0.23084211349487305, "step": 3705, "valid_targets_mean": 5293.5, "valid_targets_min": 733 }, { "epoch": 5.480059084194978, "grad_norm": 0.4064012565579344, "learning_rate": 5.485331474559133e-06, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.13796594738960266, "step": 3710, "valid_targets_mean": 6042.2, "valid_targets_min": 491 }, { "epoch": 5.487444608567208, "grad_norm": 0.4466176384591676, "learning_rate": 5.434753819926484e-06, "loss": 0.1624, "loss_nan_ranks": 0, "loss_rank_avg": 0.16316545009613037, "step": 3715, "valid_targets_mean": 4737.5, "valid_targets_min": 662 }, { "epoch": 5.4948301329394384, "grad_norm": 0.48204920306109306, "learning_rate": 5.384373734393871e-06, "loss": 0.1522, "loss_nan_ranks": 0, "loss_rank_avg": 0.12412101030349731, "step": 3720, "valid_targets_mean": 4247.8, "valid_targets_min": 430 }, { "epoch": 5.50221565731167, "grad_norm": 0.4423331415810954, "learning_rate": 5.334191901337875e-06, "loss": 0.1708, "loss_nan_ranks": 0, "loss_rank_avg": 0.16865645349025726, "step": 3725, "valid_targets_mean": 5476.6, "valid_targets_min": 635 }, { "epoch": 5.5096011816839, "grad_norm": 0.4261034310873824, "learning_rate": 5.284209001445901e-06, "loss": 0.1641, "loss_nan_ranks": 0, "loss_rank_avg": 0.1629231870174408, "step": 3730, "valid_targets_mean": 5663.4, "valid_targets_min": 613 }, { "epoch": 5.51698670605613, "grad_norm": 0.5270843670535649, "learning_rate": 5.234425712706938e-06, "loss": 0.1706, "loss_nan_ranks": 0, "loss_rank_avg": 0.1648382544517517, "step": 3735, "valid_targets_mean": 4095.7, "valid_targets_min": 587 }, { "epoch": 5.5243722304283605, "grad_norm": 0.4594394151163437, "learning_rate": 5.184842710402367e-06, "loss": 0.1594, "loss_nan_ranks": 0, "loss_rank_avg": 0.14536496996879578, "step": 3740, "valid_targets_mean": 5437.5, "valid_targets_min": 734 }, { "epoch": 5.531757754800591, "grad_norm": 0.54902978481994, "learning_rate": 5.135460667096806e-06, "loss": 0.1639, "loss_nan_ranks": 0, "loss_rank_avg": 0.20517590641975403, "step": 3745, "valid_targets_mean": 4786.9, "valid_targets_min": 500 }, { "epoch": 5.539143279172821, "grad_norm": 0.45086635799096986, "learning_rate": 5.086280252628955e-06, "loss": 0.1589, "loss_nan_ranks": 0, "loss_rank_avg": 0.15122875571250916, "step": 3750, "valid_targets_mean": 4694.8, "valid_targets_min": 309 }, { "epoch": 5.546528803545051, "grad_norm": 0.4417456541588059, "learning_rate": 5.037302134102575e-06, "loss": 0.1656, "loss_nan_ranks": 0, "loss_rank_avg": 0.16173198819160461, "step": 3755, "valid_targets_mean": 5160.4, "valid_targets_min": 677 }, { "epoch": 5.5539143279172825, "grad_norm": 0.4768321706536616, "learning_rate": 4.988526975877374e-06, "loss": 0.1491, "loss_nan_ranks": 0, "loss_rank_avg": 0.14764034748077393, "step": 3760, "valid_targets_mean": 4331.2, "valid_targets_min": 612 }, { "epoch": 5.561299852289513, "grad_norm": 0.41225383767497426, "learning_rate": 4.939955439560031e-06, "loss": 0.1403, "loss_nan_ranks": 0, "loss_rank_avg": 0.12844733893871307, "step": 3765, "valid_targets_mean": 6010.1, "valid_targets_min": 515 }, { "epoch": 5.568685376661743, "grad_norm": 0.46955403794769657, "learning_rate": 4.891588183995206e-06, "loss": 0.1674, "loss_nan_ranks": 0, "loss_rank_avg": 0.18649445474147797, "step": 3770, "valid_targets_mean": 4942.9, "valid_targets_min": 639 }, { "epoch": 5.576070901033973, "grad_norm": 0.3936059528169128, "learning_rate": 4.8434258652566165e-06, "loss": 0.1544, "loss_nan_ranks": 0, "loss_rank_avg": 0.1388961225748062, "step": 3775, "valid_targets_mean": 5572.7, "valid_targets_min": 635 }, { "epoch": 5.583456425406204, "grad_norm": 0.4122457123845285, "learning_rate": 4.795469136638125e-06, "loss": 0.1508, "loss_nan_ranks": 0, "loss_rank_avg": 0.14227622747421265, "step": 3780, "valid_targets_mean": 6029.8, "valid_targets_min": 535 }, { "epoch": 5.590841949778435, "grad_norm": 0.4412352401816102, "learning_rate": 4.747718648644884e-06, "loss": 0.1757, "loss_nan_ranks": 0, "loss_rank_avg": 0.17034125328063965, "step": 3785, "valid_targets_mean": 5354.1, "valid_targets_min": 652 }, { "epoch": 5.598227474150665, "grad_norm": 0.5432056759362457, "learning_rate": 4.700175048984517e-06, "loss": 0.137, "loss_nan_ranks": 0, "loss_rank_avg": 0.11455181241035461, "step": 3790, "valid_targets_mean": 4452.2, "valid_targets_min": 513 }, { "epoch": 5.605612998522895, "grad_norm": 0.48873939155313356, "learning_rate": 4.652838982558321e-06, "loss": 0.15, "loss_nan_ranks": 0, "loss_rank_avg": 0.17513684928417206, "step": 3795, "valid_targets_mean": 4769.3, "valid_targets_min": 688 }, { "epoch": 5.612998522895126, "grad_norm": 0.4245229968901909, "learning_rate": 4.605711091452529e-06, "loss": 0.1655, "loss_nan_ranks": 0, "loss_rank_avg": 0.1345527321100235, "step": 3800, "valid_targets_mean": 4822.4, "valid_targets_min": 320 }, { "epoch": 5.620384047267356, "grad_norm": 0.4483079582956929, "learning_rate": 4.5587920149296e-06, "loss": 0.1613, "loss_nan_ranks": 0, "loss_rank_avg": 0.19811424612998962, "step": 3805, "valid_targets_mean": 5786.8, "valid_targets_min": 641 }, { "epoch": 5.627769571639586, "grad_norm": 0.3685763809564081, "learning_rate": 4.512082389419536e-06, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.11352822184562683, "step": 3810, "valid_targets_mean": 6317.6, "valid_targets_min": 610 }, { "epoch": 5.635155096011816, "grad_norm": 0.45195450036915635, "learning_rate": 4.465582848511265e-06, "loss": 0.1605, "loss_nan_ranks": 0, "loss_rank_avg": 0.15802201628684998, "step": 3815, "valid_targets_mean": 4964.2, "valid_targets_min": 637 }, { "epoch": 5.642540620384048, "grad_norm": 0.4019080742593427, "learning_rate": 4.419294022944036e-06, "loss": 0.1584, "loss_nan_ranks": 0, "loss_rank_avg": 0.1530536711215973, "step": 3820, "valid_targets_mean": 6357.9, "valid_targets_min": 669 }, { "epoch": 5.649926144756278, "grad_norm": 0.6283549194708017, "learning_rate": 4.373216540598868e-06, "loss": 0.1396, "loss_nan_ranks": 0, "loss_rank_avg": 0.17285491526126862, "step": 3825, "valid_targets_mean": 3964.8, "valid_targets_min": 375 }, { "epoch": 5.657311669128508, "grad_norm": 0.43312904879288805, "learning_rate": 4.32735102649003e-06, "loss": 0.1403, "loss_nan_ranks": 0, "loss_rank_avg": 0.14635983109474182, "step": 3830, "valid_targets_mean": 6200.1, "valid_targets_min": 656 }, { "epoch": 5.664697193500738, "grad_norm": 0.43595340706555863, "learning_rate": 4.281698102756568e-06, "loss": 0.1443, "loss_nan_ranks": 0, "loss_rank_avg": 0.1400405317544937, "step": 3835, "valid_targets_mean": 5565.6, "valid_targets_min": 360 }, { "epoch": 5.672082717872969, "grad_norm": 0.48135722402982084, "learning_rate": 4.236258388653862e-06, "loss": 0.1756, "loss_nan_ranks": 0, "loss_rank_avg": 0.20159319043159485, "step": 3840, "valid_targets_mean": 5819.4, "valid_targets_min": 835 }, { "epoch": 5.6794682422452, "grad_norm": 0.3965676517017414, "learning_rate": 4.1910325005452266e-06, "loss": 0.1632, "loss_nan_ranks": 0, "loss_rank_avg": 0.1373254656791687, "step": 3845, "valid_targets_mean": 6392.2, "valid_targets_min": 668 }, { "epoch": 5.68685376661743, "grad_norm": 0.42777121231754817, "learning_rate": 4.146021051893554e-06, "loss": 0.1506, "loss_nan_ranks": 0, "loss_rank_avg": 0.1447691023349762, "step": 3850, "valid_targets_mean": 5918.9, "valid_targets_min": 606 }, { "epoch": 5.69423929098966, "grad_norm": 0.5369213979278165, "learning_rate": 4.101224653252984e-06, "loss": 0.1605, "loss_nan_ranks": 0, "loss_rank_avg": 0.14309504628181458, "step": 3855, "valid_targets_mean": 4915.6, "valid_targets_min": 710 }, { "epoch": 5.701624815361891, "grad_norm": 0.46685754924383494, "learning_rate": 4.056643912260634e-06, "loss": 0.1442, "loss_nan_ranks": 0, "loss_rank_avg": 0.14844262599945068, "step": 3860, "valid_targets_mean": 4834.6, "valid_targets_min": 535 }, { "epoch": 5.709010339734121, "grad_norm": 0.5069631731010494, "learning_rate": 4.012279433628339e-06, "loss": 0.1887, "loss_nan_ranks": 0, "loss_rank_avg": 0.17662671208381653, "step": 3865, "valid_targets_mean": 4272.2, "valid_targets_min": 427 }, { "epoch": 5.716395864106351, "grad_norm": 0.39028852212572046, "learning_rate": 3.968131819134484e-06, "loss": 0.148, "loss_nan_ranks": 0, "loss_rank_avg": 0.14806535840034485, "step": 3870, "valid_targets_mean": 7409.1, "valid_targets_min": 1271 }, { "epoch": 5.7237813884785815, "grad_norm": 0.42390110263128356, "learning_rate": 3.924201667615804e-06, "loss": 0.1654, "loss_nan_ranks": 0, "loss_rank_avg": 0.1607496738433838, "step": 3875, "valid_targets_mean": 6367.4, "valid_targets_min": 773 }, { "epoch": 5.731166912850813, "grad_norm": 0.48659182537833057, "learning_rate": 3.880489574959261e-06, "loss": 0.1514, "loss_nan_ranks": 0, "loss_rank_avg": 0.17565742135047913, "step": 3880, "valid_targets_mean": 4721.1, "valid_targets_min": 679 }, { "epoch": 5.738552437223043, "grad_norm": 0.4685263238659188, "learning_rate": 3.836996134093997e-06, "loss": 0.1535, "loss_nan_ranks": 0, "loss_rank_avg": 0.20819538831710815, "step": 3885, "valid_targets_mean": 5287.9, "valid_targets_min": 524 }, { "epoch": 5.745937961595273, "grad_norm": 0.5369846316753283, "learning_rate": 3.7937219349832633e-06, "loss": 0.1568, "loss_nan_ranks": 0, "loss_rank_avg": 0.16460327804088593, "step": 3890, "valid_targets_mean": 3801.6, "valid_targets_min": 635 }, { "epoch": 5.7533234859675035, "grad_norm": 0.41623622826233153, "learning_rate": 3.750667564616417e-06, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.19304777681827545, "step": 3895, "valid_targets_mean": 6364.7, "valid_targets_min": 471 }, { "epoch": 5.760709010339734, "grad_norm": 0.43621830231445924, "learning_rate": 3.7078336070009723e-06, "loss": 0.1662, "loss_nan_ranks": 0, "loss_rank_avg": 0.14152905344963074, "step": 3900, "valid_targets_mean": 6270.2, "valid_targets_min": 298 }, { "epoch": 5.768094534711965, "grad_norm": 1.253010108913432, "learning_rate": 3.665220643154681e-06, "loss": 0.1591, "loss_nan_ranks": 0, "loss_rank_avg": 0.16495048999786377, "step": 3905, "valid_targets_mean": 4590.6, "valid_targets_min": 606 }, { "epoch": 5.775480059084195, "grad_norm": 0.46508774999134267, "learning_rate": 3.622829251097626e-06, "loss": 0.1555, "loss_nan_ranks": 0, "loss_rank_avg": 0.14090654253959656, "step": 3910, "valid_targets_mean": 4980.5, "valid_targets_min": 495 }, { "epoch": 5.7828655834564255, "grad_norm": 0.44297068805386, "learning_rate": 3.5806600058444075e-06, "loss": 0.1387, "loss_nan_ranks": 0, "loss_rank_avg": 0.15334025025367737, "step": 3915, "valid_targets_mean": 5535.4, "valid_targets_min": 573 }, { "epoch": 5.790251107828656, "grad_norm": 0.4887477567047723, "learning_rate": 3.538713479396334e-06, "loss": 0.1536, "loss_nan_ranks": 0, "loss_rank_avg": 0.15382501482963562, "step": 3920, "valid_targets_mean": 4043.9, "valid_targets_min": 553 }, { "epoch": 5.797636632200886, "grad_norm": 0.5918387677426872, "learning_rate": 3.4969902407336532e-06, "loss": 0.1857, "loss_nan_ranks": 0, "loss_rank_avg": 0.1690470576286316, "step": 3925, "valid_targets_mean": 3391.9, "valid_targets_min": 606 }, { "epoch": 5.805022156573116, "grad_norm": 0.45735044033920097, "learning_rate": 3.455490855807855e-06, "loss": 0.1633, "loss_nan_ranks": 0, "loss_rank_avg": 0.19501203298568726, "step": 3930, "valid_targets_mean": 5170.4, "valid_targets_min": 686 }, { "epoch": 5.812407680945347, "grad_norm": 0.42972354738525703, "learning_rate": 3.4142158875339717e-06, "loss": 0.1508, "loss_nan_ranks": 0, "loss_rank_avg": 0.16080421209335327, "step": 3935, "valid_targets_mean": 6471.1, "valid_targets_min": 858 }, { "epoch": 5.819793205317578, "grad_norm": 0.4913472734202364, "learning_rate": 3.373165895782973e-06, "loss": 0.1505, "loss_nan_ranks": 0, "loss_rank_avg": 0.15726235508918762, "step": 3940, "valid_targets_mean": 4487.4, "valid_targets_min": 536 }, { "epoch": 5.827178729689808, "grad_norm": 0.3864919394835266, "learning_rate": 3.332341437374138e-06, "loss": 0.1463, "loss_nan_ranks": 0, "loss_rank_avg": 0.1257772147655487, "step": 3945, "valid_targets_mean": 6180.5, "valid_targets_min": 606 }, { "epoch": 5.834564254062038, "grad_norm": 0.4576260726948439, "learning_rate": 3.2917430660675165e-06, "loss": 0.1479, "loss_nan_ranks": 0, "loss_rank_avg": 0.13794982433319092, "step": 3950, "valid_targets_mean": 5125.7, "valid_targets_min": 562 }, { "epoch": 5.841949778434269, "grad_norm": 0.6723128146394246, "learning_rate": 3.251371332556428e-06, "loss": 0.1506, "loss_nan_ranks": 0, "loss_rank_avg": 0.14654061198234558, "step": 3955, "valid_targets_mean": 5167.3, "valid_targets_min": 379 }, { "epoch": 5.849335302806499, "grad_norm": 0.5108031470733075, "learning_rate": 3.2112267844599686e-06, "loss": 0.1594, "loss_nan_ranks": 0, "loss_rank_avg": 0.15340697765350342, "step": 3960, "valid_targets_mean": 4387.8, "valid_targets_min": 654 }, { "epoch": 5.85672082717873, "grad_norm": 0.557035301382823, "learning_rate": 3.171309966315614e-06, "loss": 0.151, "loss_nan_ranks": 0, "loss_rank_avg": 0.16433045268058777, "step": 3965, "valid_targets_mean": 4127.7, "valid_targets_min": 490 }, { "epoch": 5.86410635155096, "grad_norm": 0.4165972177795746, "learning_rate": 3.131621419571795e-06, "loss": 0.163, "loss_nan_ranks": 0, "loss_rank_avg": 0.15628871321678162, "step": 3970, "valid_targets_mean": 5658.2, "valid_targets_min": 563 }, { "epoch": 5.871491875923191, "grad_norm": 0.4450131689820263, "learning_rate": 3.0921616825805834e-06, "loss": 0.1498, "loss_nan_ranks": 0, "loss_rank_avg": 0.15231899917125702, "step": 3975, "valid_targets_mean": 5490.5, "valid_targets_min": 655 }, { "epoch": 5.878877400295421, "grad_norm": 0.46785664172207136, "learning_rate": 3.0529312905903886e-06, "loss": 0.1595, "loss_nan_ranks": 0, "loss_rank_avg": 0.15238377451896667, "step": 3980, "valid_targets_mean": 4522.8, "valid_targets_min": 504 }, { "epoch": 5.886262924667651, "grad_norm": 0.49684861734721625, "learning_rate": 3.013930775738676e-06, "loss": 0.148, "loss_nan_ranks": 0, "loss_rank_avg": 0.1534469872713089, "step": 3985, "valid_targets_mean": 4430.8, "valid_targets_min": 557 }, { "epoch": 5.8936484490398815, "grad_norm": 0.6814697551595089, "learning_rate": 2.975160667044763e-06, "loss": 0.1625, "loss_nan_ranks": 0, "loss_rank_avg": 0.16581161320209503, "step": 3990, "valid_targets_mean": 4855.6, "valid_targets_min": 570 }, { "epoch": 5.901033973412112, "grad_norm": 0.42548375911231223, "learning_rate": 2.9366214904026445e-06, "loss": 0.1507, "loss_nan_ranks": 0, "loss_rank_avg": 0.1445370763540268, "step": 3995, "valid_targets_mean": 5361.6, "valid_targets_min": 679 }, { "epoch": 5.908419497784343, "grad_norm": 0.4413005273888539, "learning_rate": 2.898313768573857e-06, "loss": 0.1613, "loss_nan_ranks": 0, "loss_rank_avg": 0.14729730784893036, "step": 4000, "valid_targets_mean": 5133.8, "valid_targets_min": 491 }, { "epoch": 5.915805022156573, "grad_norm": 0.4985779399517165, "learning_rate": 2.8602380211803815e-06, "loss": 0.1547, "loss_nan_ranks": 0, "loss_rank_avg": 0.15672720968723297, "step": 4005, "valid_targets_mean": 4657.6, "valid_targets_min": 789 }, { "epoch": 5.9231905465288035, "grad_norm": 0.5264213368938573, "learning_rate": 2.822394764697607e-06, "loss": 0.1653, "loss_nan_ranks": 0, "loss_rank_avg": 0.14332908391952515, "step": 4010, "valid_targets_mean": 4761.6, "valid_targets_min": 289 }, { "epoch": 5.930576070901034, "grad_norm": 0.4744288530268933, "learning_rate": 2.784784512447314e-06, "loss": 0.1728, "loss_nan_ranks": 0, "loss_rank_avg": 0.1922370046377182, "step": 4015, "valid_targets_mean": 5348.4, "valid_targets_min": 853 }, { "epoch": 5.937961595273264, "grad_norm": 0.4438269690328926, "learning_rate": 2.747407774590718e-06, "loss": 0.1611, "loss_nan_ranks": 0, "loss_rank_avg": 0.1440523862838745, "step": 4020, "valid_targets_mean": 4801.4, "valid_targets_min": 700 }, { "epoch": 5.945347119645495, "grad_norm": 0.3990012691696163, "learning_rate": 2.7102650581215486e-06, "loss": 0.1591, "loss_nan_ranks": 0, "loss_rank_avg": 0.13657835125923157, "step": 4025, "valid_targets_mean": 6708.6, "valid_targets_min": 648 }, { "epoch": 5.9527326440177255, "grad_norm": 0.41646211715971676, "learning_rate": 2.673356866859167e-06, "loss": 0.1655, "loss_nan_ranks": 0, "loss_rank_avg": 0.15765783190727234, "step": 4030, "valid_targets_mean": 5822.4, "valid_targets_min": 872 }, { "epoch": 5.960118168389956, "grad_norm": 0.4931126540910065, "learning_rate": 2.6366837014417422e-06, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.1812196969985962, "step": 4035, "valid_targets_mean": 5131.9, "valid_targets_min": 714 }, { "epoch": 5.967503692762186, "grad_norm": 0.4482245693010152, "learning_rate": 2.6002460593194466e-06, "loss": 0.1715, "loss_nan_ranks": 0, "loss_rank_avg": 0.14398686587810516, "step": 4040, "valid_targets_mean": 5426.2, "valid_targets_min": 384 }, { "epoch": 5.974889217134416, "grad_norm": 0.4086296843327063, "learning_rate": 2.5640444347477255e-06, "loss": 0.145, "loss_nan_ranks": 0, "loss_rank_avg": 0.1505671888589859, "step": 4045, "valid_targets_mean": 6444.2, "valid_targets_min": 477 }, { "epoch": 5.982274741506647, "grad_norm": 0.5290771022870968, "learning_rate": 2.528079318780574e-06, "loss": 0.1773, "loss_nan_ranks": 0, "loss_rank_avg": 0.17048917710781097, "step": 4050, "valid_targets_mean": 3984.4, "valid_targets_min": 495 }, { "epoch": 5.989660265878878, "grad_norm": 0.4256479196291018, "learning_rate": 2.4923511992638895e-06, "loss": 0.1601, "loss_nan_ranks": 0, "loss_rank_avg": 0.14762143790721893, "step": 4055, "valid_targets_mean": 5162.6, "valid_targets_min": 703 }, { "epoch": 5.997045790251108, "grad_norm": 0.46850279871296086, "learning_rate": 2.4568605608288533e-06, "loss": 0.1622, "loss_nan_ranks": 0, "loss_rank_avg": 0.14865565299987793, "step": 4060, "valid_targets_mean": 4318.1, "valid_targets_min": 486 }, { "epoch": 6.004431314623338, "grad_norm": 0.5249959190204746, "learning_rate": 2.4216078848853506e-06, "loss": 0.1432, "loss_nan_ranks": 0, "loss_rank_avg": 0.17384469509124756, "step": 4065, "valid_targets_mean": 3995.9, "valid_targets_min": 477 }, { "epoch": 6.011816838995569, "grad_norm": 0.5988657789473296, "learning_rate": 2.386593649615441e-06, "loss": 0.1573, "loss_nan_ranks": 0, "loss_rank_avg": 0.151736781001091, "step": 4070, "valid_targets_mean": 2800.8, "valid_targets_min": 451 }, { "epoch": 6.019202363367799, "grad_norm": 0.39840181178979595, "learning_rate": 2.3518183299668796e-06, "loss": 0.138, "loss_nan_ranks": 0, "loss_rank_avg": 0.13792383670806885, "step": 4075, "valid_targets_mean": 5876.8, "valid_targets_min": 645 }, { "epoch": 6.026587887740029, "grad_norm": 0.44045943750338273, "learning_rate": 2.3172823976466697e-06, "loss": 0.1406, "loss_nan_ranks": 0, "loss_rank_avg": 0.15484324097633362, "step": 4080, "valid_targets_mean": 5097.8, "valid_targets_min": 771 }, { "epoch": 6.03397341211226, "grad_norm": 0.4629364970805179, "learning_rate": 2.282986321114662e-06, "loss": 0.1416, "loss_nan_ranks": 0, "loss_rank_avg": 0.14461535215377808, "step": 4085, "valid_targets_mean": 5088.2, "valid_targets_min": 655 }, { "epoch": 6.041358936484491, "grad_norm": 0.40286656062179965, "learning_rate": 2.2489305655771987e-06, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.16793042421340942, "step": 4090, "valid_targets_mean": 6758.6, "valid_targets_min": 832 }, { "epoch": 6.048744460856721, "grad_norm": 0.4182839452913791, "learning_rate": 2.215115592980821e-06, "loss": 0.1484, "loss_nan_ranks": 0, "loss_rank_avg": 0.14046970009803772, "step": 4095, "valid_targets_mean": 5969.9, "valid_targets_min": 640 }, { "epoch": 6.056129985228951, "grad_norm": 0.43593965359653836, "learning_rate": 2.1815418620059824e-06, "loss": 0.1388, "loss_nan_ranks": 0, "loss_rank_avg": 0.1332874596118927, "step": 4100, "valid_targets_mean": 5555.6, "valid_targets_min": 476 }, { "epoch": 6.0635155096011815, "grad_norm": 0.46039610869991315, "learning_rate": 2.1482098280608234e-06, "loss": 0.1619, "loss_nan_ranks": 0, "loss_rank_avg": 0.2060922533273697, "step": 4105, "valid_targets_mean": 5705.4, "valid_targets_min": 614 }, { "epoch": 6.070901033973412, "grad_norm": 0.37373910107719843, "learning_rate": 2.1151199432750192e-06, "loss": 0.1477, "loss_nan_ranks": 0, "loss_rank_avg": 0.1127336174249649, "step": 4110, "valid_targets_mean": 6756.9, "valid_targets_min": 831 }, { "epoch": 6.078286558345643, "grad_norm": 0.44535195342707495, "learning_rate": 2.082272656493625e-06, "loss": 0.146, "loss_nan_ranks": 0, "loss_rank_avg": 0.15034779906272888, "step": 4115, "valid_targets_mean": 5689.1, "valid_targets_min": 349 }, { "epoch": 6.085672082717873, "grad_norm": 0.5195916162622733, "learning_rate": 2.049668413271e-06, "loss": 0.1573, "loss_nan_ranks": 0, "loss_rank_avg": 0.19452224671840668, "step": 4120, "valid_targets_mean": 4656.3, "valid_targets_min": 636 }, { "epoch": 6.0930576070901035, "grad_norm": 0.5560703022649638, "learning_rate": 2.0173076558647487e-06, "loss": 0.1443, "loss_nan_ranks": 0, "loss_rank_avg": 0.14960438013076782, "step": 4125, "valid_targets_mean": 4023.4, "valid_targets_min": 692 }, { "epoch": 6.100443131462334, "grad_norm": 0.4749923373792734, "learning_rate": 1.9851908232297525e-06, "loss": 0.1501, "loss_nan_ranks": 0, "loss_rank_avg": 0.13118794560432434, "step": 4130, "valid_targets_mean": 4465.4, "valid_targets_min": 326 }, { "epoch": 6.107828655834564, "grad_norm": 0.4829535285337888, "learning_rate": 1.9533183510121725e-06, "loss": 0.1508, "loss_nan_ranks": 0, "loss_rank_avg": 0.15433762967586517, "step": 4135, "valid_targets_mean": 5477.0, "valid_targets_min": 621 }, { "epoch": 6.115214180206794, "grad_norm": 0.45301666809919827, "learning_rate": 1.9216906715435744e-06, "loss": 0.1414, "loss_nan_ranks": 0, "loss_rank_avg": 0.1339162439107895, "step": 4140, "valid_targets_mean": 4647.9, "valid_targets_min": 761 }, { "epoch": 6.1225997045790255, "grad_norm": 0.39338422495107067, "learning_rate": 1.8903082138350548e-06, "loss": 0.1489, "loss_nan_ranks": 0, "loss_rank_avg": 0.1282079815864563, "step": 4145, "valid_targets_mean": 5771.3, "valid_targets_min": 425 }, { "epoch": 6.129985228951256, "grad_norm": 0.44371532394815066, "learning_rate": 1.8591714035714049e-06, "loss": 0.1465, "loss_nan_ranks": 0, "loss_rank_avg": 0.16418243944644928, "step": 4150, "valid_targets_mean": 5660.0, "valid_targets_min": 479 }, { "epoch": 6.137370753323486, "grad_norm": 0.48563406133620735, "learning_rate": 1.8282806631053662e-06, "loss": 0.1479, "loss_nan_ranks": 0, "loss_rank_avg": 0.16766785085201263, "step": 4155, "valid_targets_mean": 4655.8, "valid_targets_min": 433 }, { "epoch": 6.144756277695716, "grad_norm": 0.6072416236863333, "learning_rate": 1.7976364114518796e-06, "loss": 0.1463, "loss_nan_ranks": 0, "loss_rank_avg": 0.1494389772415161, "step": 4160, "valid_targets_mean": 3736.5, "valid_targets_min": 491 }, { "epoch": 6.152141802067947, "grad_norm": 0.50481142735507, "learning_rate": 1.7672390642824156e-06, "loss": 0.1537, "loss_nan_ranks": 0, "loss_rank_avg": 0.17777088284492493, "step": 4165, "valid_targets_mean": 4276.0, "valid_targets_min": 666 }, { "epoch": 6.159527326440177, "grad_norm": 0.42071660129307986, "learning_rate": 1.7370890339193191e-06, "loss": 0.1647, "loss_nan_ranks": 0, "loss_rank_avg": 0.1517738252878189, "step": 4170, "valid_targets_mean": 6217.3, "valid_targets_min": 747 }, { "epoch": 6.166912850812408, "grad_norm": 0.4290485201318066, "learning_rate": 1.7071867293302325e-06, "loss": 0.1544, "loss_nan_ranks": 0, "loss_rank_avg": 0.1593089997768402, "step": 4175, "valid_targets_mean": 5545.1, "valid_targets_min": 765 }, { "epoch": 6.174298375184638, "grad_norm": 0.43744895390706484, "learning_rate": 1.6775325561225409e-06, "loss": 0.15, "loss_nan_ranks": 0, "loss_rank_avg": 0.13858440518379211, "step": 4180, "valid_targets_mean": 5377.1, "valid_targets_min": 466 }, { "epoch": 6.181683899556869, "grad_norm": 0.4262626698684947, "learning_rate": 1.648126916537871e-06, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.14648282527923584, "step": 4185, "valid_targets_mean": 5709.4, "valid_targets_min": 654 }, { "epoch": 6.189069423929099, "grad_norm": 0.47051468258097345, "learning_rate": 1.6189702094466309e-06, "loss": 0.1544, "loss_nan_ranks": 0, "loss_rank_avg": 0.1473892331123352, "step": 4190, "valid_targets_mean": 4704.9, "valid_targets_min": 755 }, { "epoch": 6.196454948301329, "grad_norm": 0.49070628134476585, "learning_rate": 1.5900628303426114e-06, "loss": 0.1571, "loss_nan_ranks": 0, "loss_rank_avg": 0.15285709500312805, "step": 4195, "valid_targets_mean": 4618.8, "valid_targets_min": 530 }, { "epoch": 6.203840472673559, "grad_norm": 0.4253518994986448, "learning_rate": 1.5614051713376066e-06, "loss": 0.1421, "loss_nan_ranks": 0, "loss_rank_avg": 0.15116259455680847, "step": 4200, "valid_targets_mean": 5736.6, "valid_targets_min": 412 }, { "epoch": 6.211225997045791, "grad_norm": 0.4641185127939372, "learning_rate": 1.5329976211561138e-06, "loss": 0.1685, "loss_nan_ranks": 0, "loss_rank_avg": 0.20113864541053772, "step": 4205, "valid_targets_mean": 5099.3, "valid_targets_min": 529 }, { "epoch": 6.218611521418021, "grad_norm": 0.39647752417172666, "learning_rate": 1.504840565130039e-06, "loss": 0.1464, "loss_nan_ranks": 0, "loss_rank_avg": 0.13573205471038818, "step": 4210, "valid_targets_mean": 6350.6, "valid_targets_min": 711 }, { "epoch": 6.225997045790251, "grad_norm": 0.48103069316244723, "learning_rate": 1.4769343851934847e-06, "loss": 0.1638, "loss_nan_ranks": 0, "loss_rank_avg": 0.1464741975069046, "step": 4215, "valid_targets_mean": 4600.5, "valid_targets_min": 514 }, { "epoch": 6.233382570162481, "grad_norm": 0.40232624403233436, "learning_rate": 1.4492794598775661e-06, "loss": 0.1431, "loss_nan_ranks": 0, "loss_rank_avg": 0.13256195187568665, "step": 4220, "valid_targets_mean": 6487.2, "valid_targets_min": 679 }, { "epoch": 6.240768094534712, "grad_norm": 0.5055273590949532, "learning_rate": 1.4218761643052692e-06, "loss": 0.1538, "loss_nan_ranks": 0, "loss_rank_avg": 0.15635859966278076, "step": 4225, "valid_targets_mean": 4193.4, "valid_targets_min": 721 }, { "epoch": 6.248153618906942, "grad_norm": 0.43866996029377286, "learning_rate": 1.3947248701863813e-06, "loss": 0.1469, "loss_nan_ranks": 0, "loss_rank_avg": 0.16044774651527405, "step": 4230, "valid_targets_mean": 5434.1, "valid_targets_min": 541 }, { "epoch": 6.255539143279173, "grad_norm": 0.49231511408163975, "learning_rate": 1.3678259458124177e-06, "loss": 0.1694, "loss_nan_ranks": 0, "loss_rank_avg": 0.13283999264240265, "step": 4235, "valid_targets_mean": 4179.0, "valid_targets_min": 800 }, { "epoch": 6.262924667651403, "grad_norm": 0.4230623819145653, "learning_rate": 1.3411797560516627e-06, "loss": 0.1344, "loss_nan_ranks": 0, "loss_rank_avg": 0.1318785846233368, "step": 4240, "valid_targets_mean": 6249.6, "valid_targets_min": 703 }, { "epoch": 6.270310192023634, "grad_norm": 0.46935895443155884, "learning_rate": 1.314786662344194e-06, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.17924916744232178, "step": 4245, "valid_targets_mean": 5661.8, "valid_targets_min": 570 }, { "epoch": 6.277695716395864, "grad_norm": 0.3888317431003321, "learning_rate": 1.2886470226969895e-06, "loss": 0.1519, "loss_nan_ranks": 0, "loss_rank_avg": 0.13889117538928986, "step": 4250, "valid_targets_mean": 6869.9, "valid_targets_min": 990 }, { "epoch": 6.285081240768094, "grad_norm": 0.4352449485035959, "learning_rate": 1.2627611916790715e-06, "loss": 0.1473, "loss_nan_ranks": 0, "loss_rank_avg": 0.14910173416137695, "step": 4255, "valid_targets_mean": 5603.9, "valid_targets_min": 491 }, { "epoch": 6.2924667651403245, "grad_norm": 0.40749937475334613, "learning_rate": 1.237129520416691e-06, "loss": 0.1584, "loss_nan_ranks": 0, "loss_rank_avg": 0.15692628920078278, "step": 4260, "valid_targets_mean": 6081.8, "valid_targets_min": 831 }, { "epoch": 6.299852289512556, "grad_norm": 0.4037894828650866, "learning_rate": 1.211752356588578e-06, "loss": 0.1421, "loss_nan_ranks": 0, "loss_rank_avg": 0.13675357401371002, "step": 4265, "valid_targets_mean": 6421.4, "valid_targets_min": 457 }, { "epoch": 6.307237813884786, "grad_norm": 0.5205689683666549, "learning_rate": 1.1866300444212108e-06, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.15477876365184784, "step": 4270, "valid_targets_mean": 3994.2, "valid_targets_min": 546 }, { "epoch": 6.314623338257016, "grad_norm": 0.5661967143739712, "learning_rate": 1.161762924684151e-06, "loss": 0.1724, "loss_nan_ranks": 0, "loss_rank_avg": 0.15488114953041077, "step": 4275, "valid_targets_mean": 4311.4, "valid_targets_min": 541 }, { "epoch": 6.3220088626292466, "grad_norm": 0.4837147960209401, "learning_rate": 1.1371513346854313e-06, "loss": 0.1432, "loss_nan_ranks": 0, "loss_rank_avg": 0.16949772834777832, "step": 4280, "valid_targets_mean": 4836.6, "valid_targets_min": 493 }, { "epoch": 6.329394387001477, "grad_norm": 0.5432762673776387, "learning_rate": 1.1127956082669633e-06, "loss": 0.1732, "loss_nan_ranks": 0, "loss_rank_avg": 0.18372945487499237, "step": 4285, "valid_targets_mean": 4226.1, "valid_targets_min": 707 }, { "epoch": 6.336779911373707, "grad_norm": 0.5144469478911506, "learning_rate": 1.0886960758000265e-06, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.16694745421409607, "step": 4290, "valid_targets_mean": 3961.9, "valid_targets_min": 400 }, { "epoch": 6.344165435745938, "grad_norm": 0.43923637649600045, "learning_rate": 1.0648530641807686e-06, "loss": 0.1501, "loss_nan_ranks": 0, "loss_rank_avg": 0.1794458031654358, "step": 4295, "valid_targets_mean": 5821.2, "valid_targets_min": 526 }, { "epoch": 6.3515509601181686, "grad_norm": 0.5123527090839185, "learning_rate": 1.0412668968257877e-06, "loss": 0.1445, "loss_nan_ranks": 0, "loss_rank_avg": 0.14006029069423676, "step": 4300, "valid_targets_mean": 4426.3, "valid_targets_min": 781 }, { "epoch": 6.358936484490399, "grad_norm": 0.4115851655709371, "learning_rate": 1.0179378936677397e-06, "loss": 0.1417, "loss_nan_ranks": 0, "loss_rank_avg": 0.1542370468378067, "step": 4305, "valid_targets_mean": 5933.6, "valid_targets_min": 666 }, { "epoch": 6.366322008862629, "grad_norm": 0.5258862879779717, "learning_rate": 9.948663711509954e-07, "loss": 0.1575, "loss_nan_ranks": 0, "loss_rank_avg": 0.15517973899841309, "step": 4310, "valid_targets_mean": 4407.2, "valid_targets_min": 586 }, { "epoch": 6.373707533234859, "grad_norm": 0.44159616792495127, "learning_rate": 9.720526422273412e-07, "loss": 0.1512, "loss_nan_ranks": 0, "loss_rank_avg": 0.1318591982126236, "step": 4315, "valid_targets_mean": 5543.4, "valid_targets_min": 841 }, { "epoch": 6.381093057607091, "grad_norm": 0.49990677130913785, "learning_rate": 9.494970163517681e-07, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.15071862936019897, "step": 4320, "valid_targets_mean": 4528.5, "valid_targets_min": 573 }, { "epoch": 6.388478581979321, "grad_norm": 0.4164585567607767, "learning_rate": 9.2719979947822e-07, "loss": 0.1611, "loss_nan_ranks": 0, "loss_rank_avg": 0.15653051435947418, "step": 4325, "valid_targets_mean": 6323.8, "valid_targets_min": 490 }, { "epoch": 6.395864106351551, "grad_norm": 0.5160481333349497, "learning_rate": 9.051612940554899e-07, "loss": 0.1568, "loss_nan_ranks": 0, "loss_rank_avg": 0.1293860673904419, "step": 4330, "valid_targets_mean": 4956.7, "valid_targets_min": 796 }, { "epoch": 6.403249630723781, "grad_norm": 0.5499032197777276, "learning_rate": 8.833817990230953e-07, "loss": 0.168, "loss_nan_ranks": 0, "loss_rank_avg": 0.15469960868358612, "step": 4335, "valid_targets_mean": 4249.5, "valid_targets_min": 324 }, { "epoch": 6.410635155096012, "grad_norm": 0.40152843519987197, "learning_rate": 8.61861609807233e-07, "loss": 0.1432, "loss_nan_ranks": 0, "loss_rank_avg": 0.11483586579561234, "step": 4340, "valid_targets_mean": 6111.3, "valid_targets_min": 712 }, { "epoch": 6.418020679468242, "grad_norm": 0.42446425379167474, "learning_rate": 8.406010183167601e-07, "loss": 0.1525, "loss_nan_ranks": 0, "loss_rank_avg": 0.1487945318222046, "step": 4345, "valid_targets_mean": 7079.7, "valid_targets_min": 685 }, { "epoch": 6.425406203840472, "grad_norm": 0.7413738678926328, "learning_rate": 8.196003129392438e-07, "loss": 0.1732, "loss_nan_ranks": 0, "loss_rank_avg": 0.16445940732955933, "step": 4350, "valid_targets_mean": 3112.4, "valid_targets_min": 548 }, { "epoch": 6.432791728212703, "grad_norm": 0.44560225337100395, "learning_rate": 7.988597785370533e-07, "loss": 0.1442, "loss_nan_ranks": 0, "loss_rank_avg": 0.12470986694097519, "step": 4355, "valid_targets_mean": 5328.5, "valid_targets_min": 257 }, { "epoch": 6.440177252584934, "grad_norm": 0.4745632975601192, "learning_rate": 7.783796964434831e-07, "loss": 0.1434, "loss_nan_ranks": 0, "loss_rank_avg": 0.16859686374664307, "step": 4360, "valid_targets_mean": 5014.4, "valid_targets_min": 726 }, { "epoch": 6.447562776957164, "grad_norm": 0.4642679768852893, "learning_rate": 7.581603444589447e-07, "loss": 0.1519, "loss_nan_ranks": 0, "loss_rank_avg": 0.13736671209335327, "step": 4365, "valid_targets_mean": 4825.1, "valid_targets_min": 528 }, { "epoch": 6.454948301329394, "grad_norm": 0.4434842107811936, "learning_rate": 7.382019968471943e-07, "loss": 0.1753, "loss_nan_ranks": 0, "loss_rank_avg": 0.14103060960769653, "step": 4370, "valid_targets_mean": 5577.3, "valid_targets_min": 552 }, { "epoch": 6.4623338257016245, "grad_norm": 0.503057563707869, "learning_rate": 7.185049243316222e-07, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.14642839133739471, "step": 4375, "valid_targets_mean": 4761.9, "valid_targets_min": 652 }, { "epoch": 6.469719350073856, "grad_norm": 0.6276381062918326, "learning_rate": 6.990693940915694e-07, "loss": 0.1716, "loss_nan_ranks": 0, "loss_rank_avg": 0.24949908256530762, "step": 4380, "valid_targets_mean": 3993.2, "valid_targets_min": 535 }, { "epoch": 6.477104874446086, "grad_norm": 0.4926903015244238, "learning_rate": 6.798956697587079e-07, "loss": 0.1525, "loss_nan_ranks": 0, "loss_rank_avg": 0.1511232703924179, "step": 4385, "valid_targets_mean": 4615.3, "valid_targets_min": 595 }, { "epoch": 6.484490398818316, "grad_norm": 0.49283910568013917, "learning_rate": 6.60984011413468e-07, "loss": 0.1505, "loss_nan_ranks": 0, "loss_rank_avg": 0.16701708734035492, "step": 4390, "valid_targets_mean": 4338.4, "valid_targets_min": 645 }, { "epoch": 6.4918759231905465, "grad_norm": 0.5002990883414868, "learning_rate": 6.423346755815019e-07, "loss": 0.1552, "loss_nan_ranks": 0, "loss_rank_avg": 0.13407056033611298, "step": 4395, "valid_targets_mean": 4023.8, "valid_targets_min": 658 }, { "epoch": 6.499261447562777, "grad_norm": 0.5338641891206741, "learning_rate": 6.239479152302164e-07, "loss": 0.1465, "loss_nan_ranks": 0, "loss_rank_avg": 0.17522169649600983, "step": 4400, "valid_targets_mean": 4392.1, "valid_targets_min": 670 }, { "epoch": 6.506646971935007, "grad_norm": 0.5484669473808206, "learning_rate": 6.058239797653276e-07, "loss": 0.1678, "loss_nan_ranks": 0, "loss_rank_avg": 0.1687406748533249, "step": 4405, "valid_targets_mean": 4462.4, "valid_targets_min": 482 }, { "epoch": 6.514032496307237, "grad_norm": 0.5639609310377635, "learning_rate": 5.879631150274901e-07, "loss": 0.1489, "loss_nan_ranks": 0, "loss_rank_avg": 0.15761615335941315, "step": 4410, "valid_targets_mean": 4938.3, "valid_targets_min": 271 }, { "epoch": 6.5214180206794685, "grad_norm": 0.4302419740392286, "learning_rate": 5.703655632889505e-07, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.12143665552139282, "step": 4415, "valid_targets_mean": 6462.4, "valid_targets_min": 537 }, { "epoch": 6.528803545051699, "grad_norm": 0.4018145246408569, "learning_rate": 5.530315632502725e-07, "loss": 0.1537, "loss_nan_ranks": 0, "loss_rank_avg": 0.15424439311027527, "step": 4420, "valid_targets_mean": 7003.6, "valid_targets_min": 650 }, { "epoch": 6.536189069423929, "grad_norm": 0.4280985946691859, "learning_rate": 5.359613500370931e-07, "loss": 0.1626, "loss_nan_ranks": 0, "loss_rank_avg": 0.13937228918075562, "step": 4425, "valid_targets_mean": 5996.9, "valid_targets_min": 928 }, { "epoch": 6.543574593796159, "grad_norm": 0.512095968806376, "learning_rate": 5.191551551969376e-07, "loss": 0.1462, "loss_nan_ranks": 0, "loss_rank_avg": 0.1761317402124405, "step": 4430, "valid_targets_mean": 5061.4, "valid_targets_min": 639 }, { "epoch": 6.55096011816839, "grad_norm": 0.42658213407812473, "learning_rate": 5.026132066960699e-07, "loss": 0.1372, "loss_nan_ranks": 0, "loss_rank_avg": 0.12839290499687195, "step": 4435, "valid_targets_mean": 6122.6, "valid_targets_min": 989 }, { "epoch": 6.558345642540621, "grad_norm": 0.43584162901665235, "learning_rate": 4.863357289164094e-07, "loss": 0.1536, "loss_nan_ranks": 0, "loss_rank_avg": 0.13353732228279114, "step": 4440, "valid_targets_mean": 5793.8, "valid_targets_min": 774 }, { "epoch": 6.565731166912851, "grad_norm": 0.5121854270322571, "learning_rate": 4.703229426524836e-07, "loss": 0.1417, "loss_nan_ranks": 0, "loss_rank_avg": 0.140175461769104, "step": 4445, "valid_targets_mean": 6360.8, "valid_targets_min": 825 }, { "epoch": 6.573116691285081, "grad_norm": 0.4891587376138227, "learning_rate": 4.545750651084291e-07, "loss": 0.1466, "loss_nan_ranks": 0, "loss_rank_avg": 0.1598307192325592, "step": 4450, "valid_targets_mean": 5076.1, "valid_targets_min": 641 }, { "epoch": 6.580502215657312, "grad_norm": 0.48474954710037227, "learning_rate": 4.3909230989505724e-07, "loss": 0.1552, "loss_nan_ranks": 0, "loss_rank_avg": 0.15411385893821716, "step": 4455, "valid_targets_mean": 4396.3, "valid_targets_min": 641 }, { "epoch": 6.587887740029542, "grad_norm": 0.48095262700952346, "learning_rate": 4.2387488702693823e-07, "loss": 0.1509, "loss_nan_ranks": 0, "loss_rank_avg": 0.15224063396453857, "step": 4460, "valid_targets_mean": 4503.4, "valid_targets_min": 612 }, { "epoch": 6.595273264401772, "grad_norm": 0.42397246226943786, "learning_rate": 4.0892300291957674e-07, "loss": 0.1786, "loss_nan_ranks": 0, "loss_rank_avg": 0.14690491557121277, "step": 4465, "valid_targets_mean": 5915.6, "valid_targets_min": 495 }, { "epoch": 6.6026587887740025, "grad_norm": 0.43317383963947165, "learning_rate": 3.942368603865898e-07, "loss": 0.1522, "loss_nan_ranks": 0, "loss_rank_avg": 0.13303223252296448, "step": 4470, "valid_targets_mean": 5465.1, "valid_targets_min": 1317 }, { "epoch": 6.610044313146234, "grad_norm": 0.4006775023374142, "learning_rate": 3.798166586369645e-07, "loss": 0.1374, "loss_nan_ranks": 0, "loss_rank_avg": 0.15547743439674377, "step": 4475, "valid_targets_mean": 7271.6, "valid_targets_min": 636 }, { "epoch": 6.617429837518464, "grad_norm": 0.4117824406720461, "learning_rate": 3.656625932723579e-07, "loss": 0.1553, "loss_nan_ranks": 0, "loss_rank_avg": 0.13841594755649567, "step": 4480, "valid_targets_mean": 6281.6, "valid_targets_min": 685 }, { "epoch": 6.624815361890694, "grad_norm": 0.5336042505216406, "learning_rate": 3.5177485628444363e-07, "loss": 0.1579, "loss_nan_ranks": 0, "loss_rank_avg": 0.1793767213821411, "step": 4485, "valid_targets_mean": 4352.6, "valid_targets_min": 603 }, { "epoch": 6.6322008862629245, "grad_norm": 0.44302761320669076, "learning_rate": 3.381536360523008e-07, "loss": 0.1375, "loss_nan_ranks": 0, "loss_rank_avg": 0.14193832874298096, "step": 4490, "valid_targets_mean": 5695.8, "valid_targets_min": 734 }, { "epoch": 6.639586410635155, "grad_norm": 0.4383730918433756, "learning_rate": 3.247991173398668e-07, "loss": 0.1321, "loss_nan_ranks": 0, "loss_rank_avg": 0.1333121955394745, "step": 4495, "valid_targets_mean": 5675.1, "valid_targets_min": 622 }, { "epoch": 6.646971935007386, "grad_norm": 0.5170425717885939, "learning_rate": 3.117114812934263e-07, "loss": 0.1411, "loss_nan_ranks": 0, "loss_rank_avg": 0.1605900526046753, "step": 4500, "valid_targets_mean": 4572.1, "valid_targets_min": 575 }, { "epoch": 6.654357459379616, "grad_norm": 0.48806033544384714, "learning_rate": 2.988909054391598e-07, "loss": 0.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.1332065463066101, "step": 4505, "valid_targets_mean": 4321.8, "valid_targets_min": 573 }, { "epoch": 6.6617429837518465, "grad_norm": 0.37245789606924895, "learning_rate": 2.8633756368072307e-07, "loss": 0.1632, "loss_nan_ranks": 0, "loss_rank_avg": 0.11881101131439209, "step": 4510, "valid_targets_mean": 6310.8, "valid_targets_min": 803 }, { "epoch": 6.669128508124077, "grad_norm": 0.4549884322992929, "learning_rate": 2.740516262969051e-07, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.1540367156267166, "step": 4515, "valid_targets_mean": 5073.8, "valid_targets_min": 637 }, { "epoch": 6.676514032496307, "grad_norm": 0.4944141719547407, "learning_rate": 2.6203325993930717e-07, "loss": 0.1594, "loss_nan_ranks": 0, "loss_rank_avg": 0.11980420351028442, "step": 4520, "valid_targets_mean": 4708.9, "valid_targets_min": 499 }, { "epoch": 6.683899556868537, "grad_norm": 0.5049668775794947, "learning_rate": 2.5028262763008514e-07, "loss": 0.1478, "loss_nan_ranks": 0, "loss_rank_avg": 0.17368857562541962, "step": 4525, "valid_targets_mean": 4323.2, "valid_targets_min": 529 }, { "epoch": 6.691285081240768, "grad_norm": 0.39940995378060945, "learning_rate": 2.3879988875973314e-07, "loss": 0.1536, "loss_nan_ranks": 0, "loss_rank_avg": 0.12155850231647491, "step": 4530, "valid_targets_mean": 6206.7, "valid_targets_min": 552 }, { "epoch": 6.698670605612999, "grad_norm": 0.4013521013669753, "learning_rate": 2.2758519908493648e-07, "loss": 0.1525, "loss_nan_ranks": 0, "loss_rank_avg": 0.15022462606430054, "step": 4535, "valid_targets_mean": 6336.5, "valid_targets_min": 630 }, { "epoch": 6.706056129985229, "grad_norm": 0.5620177209255185, "learning_rate": 2.1663871072643784e-07, "loss": 0.1625, "loss_nan_ranks": 0, "loss_rank_avg": 0.16755668818950653, "step": 4540, "valid_targets_mean": 3727.6, "valid_targets_min": 390 }, { "epoch": 6.713441654357459, "grad_norm": 0.5258801995748262, "learning_rate": 2.059605721669966e-07, "loss": 0.1557, "loss_nan_ranks": 0, "loss_rank_avg": 0.14239409565925598, "step": 4545, "valid_targets_mean": 4034.1, "valid_targets_min": 540 }, { "epoch": 6.72082717872969, "grad_norm": 0.4560448915232561, "learning_rate": 1.9555092824935062e-07, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.1599361002445221, "step": 4550, "valid_targets_mean": 5137.9, "valid_targets_min": 310 }, { "epoch": 6.72821270310192, "grad_norm": 0.46957544677234575, "learning_rate": 1.854099201742754e-07, "loss": 0.1469, "loss_nan_ranks": 0, "loss_rank_avg": 0.13492749631404877, "step": 4555, "valid_targets_mean": 5321.8, "valid_targets_min": 486 }, { "epoch": 6.735598227474151, "grad_norm": 0.4893832374792917, "learning_rate": 1.7553768549864791e-07, "loss": 0.1526, "loss_nan_ranks": 0, "loss_rank_avg": 0.1458035260438919, "step": 4560, "valid_targets_mean": 4632.6, "valid_targets_min": 723 }, { "epoch": 6.742983751846381, "grad_norm": 0.49924643293505594, "learning_rate": 1.6593435813359704e-07, "loss": 0.1421, "loss_nan_ranks": 0, "loss_rank_avg": 0.1429969072341919, "step": 4565, "valid_targets_mean": 5114.1, "valid_targets_min": 573 }, { "epoch": 6.750369276218612, "grad_norm": 0.5588546086896948, "learning_rate": 1.5660006834267826e-07, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.17076215147972107, "step": 4570, "valid_targets_mean": 3644.6, "valid_targets_min": 462 }, { "epoch": 6.757754800590842, "grad_norm": 0.44934370220938186, "learning_rate": 1.4753494274010404e-07, "loss": 0.1557, "loss_nan_ranks": 0, "loss_rank_avg": 0.12686952948570251, "step": 4575, "valid_targets_mean": 4405.2, "valid_targets_min": 532 }, { "epoch": 6.765140324963072, "grad_norm": 0.40287819658097046, "learning_rate": 1.387391042890407e-07, "loss": 0.1563, "loss_nan_ranks": 0, "loss_rank_avg": 0.1626736968755722, "step": 4580, "valid_targets_mean": 6230.9, "valid_targets_min": 471 }, { "epoch": 6.772525849335302, "grad_norm": 0.39016310022420664, "learning_rate": 1.3021267229992307e-07, "loss": 0.1541, "loss_nan_ranks": 0, "loss_rank_avg": 0.13419151306152344, "step": 4585, "valid_targets_mean": 5865.1, "valid_targets_min": 552 }, { "epoch": 6.779911373707534, "grad_norm": 0.48929349503037056, "learning_rate": 1.2195576242884256e-07, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.16033774614334106, "step": 4590, "valid_targets_mean": 4465.0, "valid_targets_min": 462 }, { "epoch": 6.787296898079764, "grad_norm": 0.4099040200611785, "learning_rate": 1.1396848667598826e-07, "loss": 0.1514, "loss_nan_ranks": 0, "loss_rank_avg": 0.13809999823570251, "step": 4595, "valid_targets_mean": 5768.4, "valid_targets_min": 562 }, { "epoch": 6.794682422451994, "grad_norm": 0.47774449623791543, "learning_rate": 1.0625095338411051e-07, "loss": 0.1507, "loss_nan_ranks": 0, "loss_rank_avg": 0.1699640303850174, "step": 4600, "valid_targets_mean": 4953.6, "valid_targets_min": 553 }, { "epoch": 6.802067946824224, "grad_norm": 0.5076200380883104, "learning_rate": 9.880326723706646e-08, "loss": 0.1479, "loss_nan_ranks": 0, "loss_rank_avg": 0.1531982421875, "step": 4605, "valid_targets_mean": 4243.5, "valid_targets_min": 575 }, { "epoch": 6.809453471196455, "grad_norm": 0.5365924598906461, "learning_rate": 9.162552925838564e-08, "loss": 0.1694, "loss_nan_ranks": 0, "loss_rank_avg": 0.19307509064674377, "step": 4610, "valid_targets_mean": 4674.6, "valid_targets_min": 577 }, { "epoch": 6.816838995568685, "grad_norm": 0.4114855170974802, "learning_rate": 8.471783680991774e-08, "loss": 0.1649, "loss_nan_ranks": 0, "loss_rank_avg": 0.11866377294063568, "step": 4615, "valid_targets_mean": 5945.6, "valid_targets_min": 500 }, { "epoch": 6.824224519940916, "grad_norm": 0.4311591899524311, "learning_rate": 7.80802835904959e-08, "loss": 0.137, "loss_nan_ranks": 0, "loss_rank_avg": 0.13947513699531555, "step": 4620, "valid_targets_mean": 5683.1, "valid_targets_min": 634 }, { "epoch": 6.8316100443131464, "grad_norm": 0.5619454499028758, "learning_rate": 7.171295963466884e-08, "loss": 0.1597, "loss_nan_ranks": 0, "loss_rank_avg": 0.1453944444656372, "step": 4625, "valid_targets_mean": 4229.2, "valid_targets_min": 517 }, { "epoch": 6.838995568685377, "grad_norm": 0.43973530083348866, "learning_rate": 6.561595131149068e-08, "loss": 0.1509, "loss_nan_ranks": 0, "loss_rank_avg": 0.15559229254722595, "step": 4630, "valid_targets_mean": 5828.9, "valid_targets_min": 731 }, { "epoch": 6.846381093057607, "grad_norm": 0.46646297249339624, "learning_rate": 5.97893413233308e-08, "loss": 0.1654, "loss_nan_ranks": 0, "loss_rank_avg": 0.13109324872493744, "step": 4635, "valid_targets_mean": 4558.2, "valid_targets_min": 721 }, { "epoch": 6.853766617429837, "grad_norm": 0.5158968571743305, "learning_rate": 5.4233208704770336e-08, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.18643151223659515, "step": 4640, "valid_targets_mean": 4622.7, "valid_targets_min": 529 }, { "epoch": 6.861152141802068, "grad_norm": 0.42120731834961433, "learning_rate": 4.894762882151849e-08, "loss": 0.1488, "loss_nan_ranks": 0, "loss_rank_avg": 0.12933212518692017, "step": 4645, "valid_targets_mean": 5539.8, "valid_targets_min": 516 }, { "epoch": 6.868537666174299, "grad_norm": 0.4701920136133854, "learning_rate": 4.393267336939566e-08, "loss": 0.1547, "loss_nan_ranks": 0, "loss_rank_avg": 0.16911543905735016, "step": 4650, "valid_targets_mean": 5174.4, "valid_targets_min": 494 }, { "epoch": 6.875923190546529, "grad_norm": 0.4483722090071213, "learning_rate": 3.9188410373358635e-08, "loss": 0.1803, "loss_nan_ranks": 0, "loss_rank_avg": 0.23113879561424255, "step": 4655, "valid_targets_mean": 6327.1, "valid_targets_min": 597 }, { "epoch": 6.883308714918759, "grad_norm": 0.4700078471031414, "learning_rate": 3.471490418657686e-08, "loss": 0.1427, "loss_nan_ranks": 0, "loss_rank_avg": 0.15961627662181854, "step": 4660, "valid_targets_mean": 5725.3, "valid_targets_min": 648 }, { "epoch": 6.89069423929099, "grad_norm": 0.4655597595051389, "learning_rate": 3.051221548956207e-08, "loss": 0.1443, "loss_nan_ranks": 0, "loss_rank_avg": 0.12833762168884277, "step": 4665, "valid_targets_mean": 4711.9, "valid_targets_min": 725 }, { "epoch": 6.89807976366322, "grad_norm": 0.6380093111909683, "learning_rate": 2.6580401289344472e-08, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.1340949535369873, "step": 4670, "valid_targets_mean": 3719.6, "valid_targets_min": 521 }, { "epoch": 6.905465288035451, "grad_norm": 0.42232440957412026, "learning_rate": 2.2919514918700038e-08, "loss": 0.1584, "loss_nan_ranks": 0, "loss_rank_avg": 0.13673587143421173, "step": 4675, "valid_targets_mean": 6005.1, "valid_targets_min": 567 }, { "epoch": 6.912850812407681, "grad_norm": 0.4656904084131196, "learning_rate": 1.95296060354222e-08, "loss": 0.1552, "loss_nan_ranks": 0, "loss_rank_avg": 0.1485702097415924, "step": 4680, "valid_targets_mean": 5101.6, "valid_targets_min": 579 }, { "epoch": 6.920236336779912, "grad_norm": 0.4808238353600059, "learning_rate": 1.6410720621655718e-08, "loss": 0.1363, "loss_nan_ranks": 0, "loss_rank_avg": 0.1313798427581787, "step": 4685, "valid_targets_mean": 6804.3, "valid_targets_min": 819 }, { "epoch": 6.927621861152142, "grad_norm": 0.4233348673449903, "learning_rate": 1.356290098327051e-08, "loss": 0.1553, "loss_nan_ranks": 0, "loss_rank_avg": 0.15477396547794342, "step": 4690, "valid_targets_mean": 6435.8, "valid_targets_min": 699 }, { "epoch": 6.935007385524372, "grad_norm": 0.43007196837079203, "learning_rate": 1.0986185749282118e-08, "loss": 0.1486, "loss_nan_ranks": 0, "loss_rank_avg": 0.11044066399335861, "step": 4695, "valid_targets_mean": 5944.6, "valid_targets_min": 229 }, { "epoch": 6.942392909896602, "grad_norm": 0.5232298527072103, "learning_rate": 8.680609871338786e-09, "loss": 0.1708, "loss_nan_ranks": 0, "loss_rank_avg": 0.18600329756736755, "step": 4700, "valid_targets_mean": 4885.4, "valid_targets_min": 799 }, { "epoch": 6.949778434268833, "grad_norm": 0.6339786906635847, "learning_rate": 6.646204623232954e-09, "loss": 0.181, "loss_nan_ranks": 0, "loss_rank_avg": 0.21870045363903046, "step": 4705, "valid_targets_mean": 3441.2, "valid_targets_min": 526 }, { "epoch": 6.957163958641064, "grad_norm": 0.3930755994701203, "learning_rate": 4.882997600494932e-09, "loss": 0.1544, "loss_nan_ranks": 0, "loss_rank_avg": 0.12523368000984192, "step": 4710, "valid_targets_mean": 6379.2, "valid_targets_min": 563 }, { "epoch": 6.964549483013294, "grad_norm": 0.46455499149966306, "learning_rate": 3.3910127199998643e-09, "loss": 0.1625, "loss_nan_ranks": 0, "loss_rank_avg": 0.1395748257637024, "step": 4715, "valid_targets_mean": 5036.2, "valid_targets_min": 476 }, { "epoch": 6.971935007385524, "grad_norm": 0.5569847284562671, "learning_rate": 2.170270219654658e-09, "loss": 0.1417, "loss_nan_ranks": 0, "loss_rank_avg": 0.16902390122413635, "step": 4720, "valid_targets_mean": 4324.9, "valid_targets_min": 542 }, { "epoch": 6.979320531757755, "grad_norm": 0.4994292568305981, "learning_rate": 1.2207866581248617e-09, "loss": 0.1724, "loss_nan_ranks": 0, "loss_rank_avg": 0.15097226202487946, "step": 4725, "valid_targets_mean": 4825.1, "valid_targets_min": 314 }, { "epoch": 6.986706056129985, "grad_norm": 0.4317365485031485, "learning_rate": 5.425749146015235e-10, "loss": 0.1838, "loss_nan_ranks": 0, "loss_rank_avg": 0.14707861840724945, "step": 4730, "valid_targets_mean": 6297.3, "valid_targets_min": 696 }, { "epoch": 6.994091580502216, "grad_norm": 0.43567574617565746, "learning_rate": 1.3564418863465378e-10, "loss": 0.1539, "loss_nan_ranks": 0, "loss_rank_avg": 0.13918901979923248, "step": 4735, "valid_targets_mean": 5156.8, "valid_targets_min": 633 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.13066400587558746, "step": 4739, "total_flos": 1781000233680896.0, "train_loss": 0.19506101114987875, "train_runtime": 33204.2929, "train_samples_per_second": 2.281, "train_steps_per_second": 0.143, "valid_targets_mean": 5264.3, "valid_targets_min": 320 } ], "logging_steps": 5, "max_steps": 4739, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 1500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1781000233680896.0, "train_batch_size": 1, "trial_name": null, "trial_params": null }