diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,29439 @@ +{ + "best_global_step": null, + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 7.0, + "eval_steps": 500, + "global_step": 13363, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0026191723415400735, + "grad_norm": 14.360649611601202, + "learning_rate": 1.1967090501121915e-07, + "loss": 0.8127, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.34690144658088684, + "step": 5, + "valid_targets_mean": 1236.5, + "valid_targets_min": 746 + }, + { + "epoch": 0.005238344683080147, + "grad_norm": 15.365253914310367, + "learning_rate": 2.692595362752431e-07, + "loss": 0.8159, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.4388588070869446, + "step": 10, + "valid_targets_mean": 1550.8, + "valid_targets_min": 612 + }, + { + "epoch": 0.00785751702462022, + "grad_norm": 14.009337806771104, + "learning_rate": 4.1884816753926706e-07, + "loss": 0.7913, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.37569183111190796, + "step": 15, + "valid_targets_mean": 1455.8, + "valid_targets_min": 904 + }, + { + "epoch": 0.010476689366160294, + "grad_norm": 13.648701274661068, + "learning_rate": 5.68436798803291e-07, + "loss": 0.7905, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.4232363700866699, + "step": 20, + "valid_targets_mean": 1514.4, + "valid_targets_min": 967 + }, + { + "epoch": 0.013095861707700367, + "grad_norm": 12.665998950030927, + "learning_rate": 7.18025430067315e-07, + "loss": 0.7813, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.36753425002098083, + "step": 25, + "valid_targets_mean": 1500.2, + "valid_targets_min": 718 + }, + { + "epoch": 0.01571503404924044, + "grad_norm": 10.58346863646541, + "learning_rate": 8.676140613313389e-07, + "loss": 0.7649, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.41818854212760925, + "step": 30, + "valid_targets_mean": 1689.9, + "valid_targets_min": 764 + }, + { + "epoch": 0.018334206390780514, + "grad_norm": 10.066660675934825, + "learning_rate": 1.0172026925953627e-06, + "loss": 0.7398, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.37240898609161377, + "step": 35, + "valid_targets_mean": 1543.9, + "valid_targets_min": 725 + }, + { + "epoch": 0.020953378732320588, + "grad_norm": 8.335114097477899, + "learning_rate": 1.1667913238593869e-06, + "loss": 0.7298, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3356940448284149, + "step": 40, + "valid_targets_mean": 1290.1, + "valid_targets_min": 610 + }, + { + "epoch": 0.02357255107386066, + "grad_norm": 7.3101895788801965, + "learning_rate": 1.3163799551234108e-06, + "loss": 0.6865, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3337023854255676, + "step": 45, + "valid_targets_mean": 1588.6, + "valid_targets_min": 720 + }, + { + "epoch": 0.026191723415400735, + "grad_norm": 6.5252803076428245, + "learning_rate": 1.4659685863874346e-06, + "loss": 0.6516, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.37255507707595825, + "step": 50, + "valid_targets_mean": 1708.5, + "valid_targets_min": 865 + }, + { + "epoch": 0.028810895756940808, + "grad_norm": 4.800098717068578, + "learning_rate": 1.6155572176514587e-06, + "loss": 0.61, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.32511481642723083, + "step": 55, + "valid_targets_mean": 1502.1, + "valid_targets_min": 593 + }, + { + "epoch": 0.03143006809848088, + "grad_norm": 4.157839193676562, + "learning_rate": 1.7651458489154827e-06, + "loss": 0.5816, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.30514219403266907, + "step": 60, + "valid_targets_mean": 1667.9, + "valid_targets_min": 704 + }, + { + "epoch": 0.03404924044002095, + "grad_norm": 4.1100198852951975, + "learning_rate": 1.9147344801795064e-06, + "loss": 0.5512, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22679626941680908, + "step": 65, + "valid_targets_mean": 1233.4, + "valid_targets_min": 722 + }, + { + "epoch": 0.03666841278156103, + "grad_norm": 2.7793207953264036, + "learning_rate": 2.0643231114435305e-06, + "loss": 0.5122, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2324710190296173, + "step": 70, + "valid_targets_mean": 1556.0, + "valid_targets_min": 968 + }, + { + "epoch": 0.0392875851231011, + "grad_norm": 2.1990435383084934, + "learning_rate": 2.2139117427075543e-06, + "loss": 0.4888, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2724093794822693, + "step": 75, + "valid_targets_mean": 1773.1, + "valid_targets_min": 936 + }, + { + "epoch": 0.041906757464641176, + "grad_norm": 1.9295286252565726, + "learning_rate": 2.3635003739715784e-06, + "loss": 0.4829, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21531279385089874, + "step": 80, + "valid_targets_mean": 1383.6, + "valid_targets_min": 728 + }, + { + "epoch": 0.044525929806181246, + "grad_norm": 1.4255276793624676, + "learning_rate": 2.513089005235602e-06, + "loss": 0.4682, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25964421033859253, + "step": 85, + "valid_targets_mean": 2023.5, + "valid_targets_min": 1143 + }, + { + "epoch": 0.04714510214772132, + "grad_norm": 1.4715916655150219, + "learning_rate": 2.6626776364996263e-06, + "loss": 0.4534, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25838708877563477, + "step": 90, + "valid_targets_mean": 1411.9, + "valid_targets_min": 818 + }, + { + "epoch": 0.04976427448926139, + "grad_norm": 1.5444005353673762, + "learning_rate": 2.8122662677636505e-06, + "loss": 0.4287, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21245674788951874, + "step": 95, + "valid_targets_mean": 1393.2, + "valid_targets_min": 625 + }, + { + "epoch": 0.05238344683080147, + "grad_norm": 1.1994420345215826, + "learning_rate": 2.961854899027674e-06, + "loss": 0.4186, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22726021707057953, + "step": 100, + "valid_targets_mean": 1949.8, + "valid_targets_min": 790 + }, + { + "epoch": 0.05500261917234154, + "grad_norm": 1.3912983718478529, + "learning_rate": 3.111443530291698e-06, + "loss": 0.4149, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2639816403388977, + "step": 105, + "valid_targets_mean": 2193.8, + "valid_targets_min": 891 + }, + { + "epoch": 0.057621791513881616, + "grad_norm": 1.1605250886514002, + "learning_rate": 3.261032161555722e-06, + "loss": 0.4063, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1941235363483429, + "step": 110, + "valid_targets_mean": 1569.0, + "valid_targets_min": 850 + }, + { + "epoch": 0.060240963855421686, + "grad_norm": 1.1823905718225025, + "learning_rate": 3.410620792819746e-06, + "loss": 0.3927, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17495793104171753, + "step": 115, + "valid_targets_mean": 1384.2, + "valid_targets_min": 974 + }, + { + "epoch": 0.06286013619696176, + "grad_norm": 1.1442967844329546, + "learning_rate": 3.56020942408377e-06, + "loss": 0.3807, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22913743555545807, + "step": 120, + "valid_targets_mean": 1502.9, + "valid_targets_min": 998 + }, + { + "epoch": 0.06547930853850184, + "grad_norm": 1.068888565570554, + "learning_rate": 3.709798055347794e-06, + "loss": 0.3723, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20114624500274658, + "step": 125, + "valid_targets_mean": 1675.6, + "valid_targets_min": 1047 + }, + { + "epoch": 0.0680984808800419, + "grad_norm": 1.1005607515131652, + "learning_rate": 3.859386686611818e-06, + "loss": 0.3641, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18255731463432312, + "step": 130, + "valid_targets_mean": 1577.6, + "valid_targets_min": 678 + }, + { + "epoch": 0.07071765322158198, + "grad_norm": 0.9822788022537852, + "learning_rate": 4.008975317875842e-06, + "loss": 0.3579, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19359880685806274, + "step": 135, + "valid_targets_mean": 1967.9, + "valid_targets_min": 1075 + }, + { + "epoch": 0.07333682556312206, + "grad_norm": 1.035772431448236, + "learning_rate": 4.158563949139865e-06, + "loss": 0.3573, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20526465773582458, + "step": 140, + "valid_targets_mean": 1872.6, + "valid_targets_min": 1317 + }, + { + "epoch": 0.07595599790466212, + "grad_norm": 1.0001037815145, + "learning_rate": 4.30815258040389e-06, + "loss": 0.3446, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18035730719566345, + "step": 145, + "valid_targets_mean": 1697.6, + "valid_targets_min": 957 + }, + { + "epoch": 0.0785751702462022, + "grad_norm": 0.9891303511553036, + "learning_rate": 4.457741211667914e-06, + "loss": 0.3512, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14854729175567627, + "step": 150, + "valid_targets_mean": 1323.0, + "valid_targets_min": 906 + }, + { + "epoch": 0.08119434258774227, + "grad_norm": 0.9882196378696704, + "learning_rate": 4.607329842931937e-06, + "loss": 0.3444, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14030331373214722, + "step": 155, + "valid_targets_mean": 1488.8, + "valid_targets_min": 1111 + }, + { + "epoch": 0.08381351492928235, + "grad_norm": 1.0048944644271929, + "learning_rate": 4.756918474195962e-06, + "loss": 0.3347, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16978579759597778, + "step": 160, + "valid_targets_mean": 1649.2, + "valid_targets_min": 1147 + }, + { + "epoch": 0.08643268727082241, + "grad_norm": 1.0229637320628204, + "learning_rate": 4.906507105459986e-06, + "loss": 0.3281, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16098302602767944, + "step": 165, + "valid_targets_mean": 1526.2, + "valid_targets_min": 893 + }, + { + "epoch": 0.08905185961236249, + "grad_norm": 1.1203487718427658, + "learning_rate": 5.056095736724009e-06, + "loss": 0.3156, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13853532075881958, + "step": 170, + "valid_targets_mean": 1219.6, + "valid_targets_min": 753 + }, + { + "epoch": 0.09167103195390257, + "grad_norm": 1.0656343831689796, + "learning_rate": 5.205684367988033e-06, + "loss": 0.3199, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14839622378349304, + "step": 175, + "valid_targets_mean": 1574.5, + "valid_targets_min": 1192 + }, + { + "epoch": 0.09429020429544265, + "grad_norm": 1.0462503574281339, + "learning_rate": 5.355272999252057e-06, + "loss": 0.3214, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15112197399139404, + "step": 180, + "valid_targets_mean": 1496.1, + "valid_targets_min": 1039 + }, + { + "epoch": 0.09690937663698271, + "grad_norm": 1.0628653049567738, + "learning_rate": 5.504861630516081e-06, + "loss": 0.3216, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1642725020647049, + "step": 185, + "valid_targets_mean": 1402.0, + "valid_targets_min": 657 + }, + { + "epoch": 0.09952854897852279, + "grad_norm": 1.1546554901174115, + "learning_rate": 5.654450261780105e-06, + "loss": 0.319, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1774584949016571, + "step": 190, + "valid_targets_mean": 1471.2, + "valid_targets_min": 880 + }, + { + "epoch": 0.10214772132006286, + "grad_norm": 1.4304632238319623, + "learning_rate": 5.80403889304413e-06, + "loss": 0.321, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1903408318758011, + "step": 195, + "valid_targets_mean": 1567.6, + "valid_targets_min": 1163 + }, + { + "epoch": 0.10476689366160294, + "grad_norm": 1.1266051731672357, + "learning_rate": 5.9536275243081535e-06, + "loss": 0.3091, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15488669276237488, + "step": 200, + "valid_targets_mean": 1493.1, + "valid_targets_min": 998 + }, + { + "epoch": 0.107386066003143, + "grad_norm": 1.0963428815981444, + "learning_rate": 6.103216155572177e-06, + "loss": 0.3028, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12211956083774567, + "step": 205, + "valid_targets_mean": 1214.1, + "valid_targets_min": 703 + }, + { + "epoch": 0.11000523834468308, + "grad_norm": 1.5598102888973384, + "learning_rate": 6.252804786836201e-06, + "loss": 0.3236, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15281397104263306, + "step": 210, + "valid_targets_mean": 1459.2, + "valid_targets_min": 934 + }, + { + "epoch": 0.11262441068622316, + "grad_norm": 0.9578105634940497, + "learning_rate": 6.402393418100225e-06, + "loss": 0.3268, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20284399390220642, + "step": 215, + "valid_targets_mean": 1754.4, + "valid_targets_min": 734 + }, + { + "epoch": 0.11524358302776323, + "grad_norm": 1.0061815691692737, + "learning_rate": 6.5519820493642484e-06, + "loss": 0.3012, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1887899935245514, + "step": 220, + "valid_targets_mean": 1864.2, + "valid_targets_min": 1270 + }, + { + "epoch": 0.1178627553693033, + "grad_norm": 0.9847642087093494, + "learning_rate": 6.701570680628273e-06, + "loss": 0.3044, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.155894473195076, + "step": 225, + "valid_targets_mean": 1765.5, + "valid_targets_min": 746 + }, + { + "epoch": 0.12048192771084337, + "grad_norm": 1.0572078354661676, + "learning_rate": 6.851159311892297e-06, + "loss": 0.3094, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18833455443382263, + "step": 230, + "valid_targets_mean": 1876.4, + "valid_targets_min": 1172 + }, + { + "epoch": 0.12310110005238345, + "grad_norm": 1.0498469428136838, + "learning_rate": 7.0007479431563205e-06, + "loss": 0.2971, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15638378262519836, + "step": 235, + "valid_targets_mean": 1642.0, + "valid_targets_min": 1033 + }, + { + "epoch": 0.12572027239392353, + "grad_norm": 0.998808766771215, + "learning_rate": 7.150336574420344e-06, + "loss": 0.2892, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16653478145599365, + "step": 240, + "valid_targets_mean": 1689.0, + "valid_targets_min": 1205 + }, + { + "epoch": 0.1283394447354636, + "grad_norm": 1.2353667197688452, + "learning_rate": 7.299925205684369e-06, + "loss": 0.2891, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14583265781402588, + "step": 245, + "valid_targets_mean": 1164.2, + "valid_targets_min": 737 + }, + { + "epoch": 0.13095861707700368, + "grad_norm": 1.062022381972708, + "learning_rate": 7.4495138369483925e-06, + "loss": 0.3065, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16454707086086273, + "step": 250, + "valid_targets_mean": 1427.9, + "valid_targets_min": 791 + }, + { + "epoch": 0.13357778941854373, + "grad_norm": 0.8910358787837693, + "learning_rate": 7.599102468212416e-06, + "loss": 0.295, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.128499835729599, + "step": 255, + "valid_targets_mean": 1559.5, + "valid_targets_min": 786 + }, + { + "epoch": 0.1361969617600838, + "grad_norm": 1.159401017442788, + "learning_rate": 7.748691099476442e-06, + "loss": 0.2876, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12907026708126068, + "step": 260, + "valid_targets_mean": 1411.5, + "valid_targets_min": 944 + }, + { + "epoch": 0.13881613410162388, + "grad_norm": 1.244895408308553, + "learning_rate": 7.898279730740465e-06, + "loss": 0.2934, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1402992308139801, + "step": 265, + "valid_targets_mean": 1454.9, + "valid_targets_min": 1227 + }, + { + "epoch": 0.14143530644316396, + "grad_norm": 1.1306976178593087, + "learning_rate": 8.047868362004489e-06, + "loss": 0.2877, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1254289448261261, + "step": 270, + "valid_targets_mean": 1446.9, + "valid_targets_min": 740 + }, + { + "epoch": 0.14405447878470404, + "grad_norm": 0.921550922645942, + "learning_rate": 8.197456993268512e-06, + "loss": 0.2892, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16916373372077942, + "step": 275, + "valid_targets_mean": 2122.9, + "valid_targets_min": 1227 + }, + { + "epoch": 0.14667365112624411, + "grad_norm": 0.9894093776769832, + "learning_rate": 8.347045624532537e-06, + "loss": 0.2832, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12109673023223877, + "step": 280, + "valid_targets_mean": 1256.0, + "valid_targets_min": 636 + }, + { + "epoch": 0.1492928234677842, + "grad_norm": 1.0629135926381452, + "learning_rate": 8.49663425579656e-06, + "loss": 0.2795, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09688296169042587, + "step": 285, + "valid_targets_mean": 1168.8, + "valid_targets_min": 814 + }, + { + "epoch": 0.15191199580932424, + "grad_norm": 1.0185587649609436, + "learning_rate": 8.646222887060584e-06, + "loss": 0.2695, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13260769844055176, + "step": 290, + "valid_targets_mean": 1275.9, + "valid_targets_min": 911 + }, + { + "epoch": 0.15453116815086432, + "grad_norm": 0.9895587940966053, + "learning_rate": 8.795811518324609e-06, + "loss": 0.2781, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12507134675979614, + "step": 295, + "valid_targets_mean": 1431.9, + "valid_targets_min": 661 + }, + { + "epoch": 0.1571503404924044, + "grad_norm": 1.266883417746457, + "learning_rate": 8.945400149588632e-06, + "loss": 0.2794, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13883736729621887, + "step": 300, + "valid_targets_mean": 1572.1, + "valid_targets_min": 1164 + }, + { + "epoch": 0.15976951283394447, + "grad_norm": 1.1372606163472676, + "learning_rate": 9.094988780852656e-06, + "loss": 0.2734, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12079863250255585, + "step": 305, + "valid_targets_mean": 1396.6, + "valid_targets_min": 692 + }, + { + "epoch": 0.16238868517548455, + "grad_norm": 1.080445548289665, + "learning_rate": 9.244577412116679e-06, + "loss": 0.2777, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12431149184703827, + "step": 310, + "valid_targets_mean": 1405.8, + "valid_targets_min": 923 + }, + { + "epoch": 0.16500785751702463, + "grad_norm": 1.0979789118461285, + "learning_rate": 9.394166043380704e-06, + "loss": 0.2808, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1450071632862091, + "step": 315, + "valid_targets_mean": 1375.1, + "valid_targets_min": 922 + }, + { + "epoch": 0.1676270298585647, + "grad_norm": 0.9732855691376677, + "learning_rate": 9.543754674644728e-06, + "loss": 0.2692, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14313220977783203, + "step": 320, + "valid_targets_mean": 1806.0, + "valid_targets_min": 710 + }, + { + "epoch": 0.17024620220010478, + "grad_norm": 1.0693553307142176, + "learning_rate": 9.693343305908753e-06, + "loss": 0.2795, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1343768686056137, + "step": 325, + "valid_targets_mean": 1342.9, + "valid_targets_min": 836 + }, + { + "epoch": 0.17286537454164483, + "grad_norm": 1.2383461126696775, + "learning_rate": 9.842931937172776e-06, + "loss": 0.2761, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15635260939598083, + "step": 330, + "valid_targets_mean": 1504.5, + "valid_targets_min": 1013 + }, + { + "epoch": 0.1754845468831849, + "grad_norm": 1.0278678326366064, + "learning_rate": 9.9925205684368e-06, + "loss": 0.2889, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1264498382806778, + "step": 335, + "valid_targets_mean": 1351.6, + "valid_targets_min": 978 + }, + { + "epoch": 0.17810371922472498, + "grad_norm": 0.9446943807345949, + "learning_rate": 1.0142109199700823e-05, + "loss": 0.2776, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15977764129638672, + "step": 340, + "valid_targets_mean": 1812.5, + "valid_targets_min": 1205 + }, + { + "epoch": 0.18072289156626506, + "grad_norm": 1.0152657984078985, + "learning_rate": 1.029169783096485e-05, + "loss": 0.2904, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12069070339202881, + "step": 345, + "valid_targets_mean": 1657.9, + "valid_targets_min": 1219 + }, + { + "epoch": 0.18334206390780514, + "grad_norm": 1.1298475109493238, + "learning_rate": 1.0441286462228872e-05, + "loss": 0.2796, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17380760610103607, + "step": 350, + "valid_targets_mean": 1814.4, + "valid_targets_min": 1002 + }, + { + "epoch": 0.1859612362493452, + "grad_norm": 1.0284732532049468, + "learning_rate": 1.0590875093492897e-05, + "loss": 0.2747, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1345786154270172, + "step": 355, + "valid_targets_mean": 1390.4, + "valid_targets_min": 646 + }, + { + "epoch": 0.1885804085908853, + "grad_norm": 1.2878881994741163, + "learning_rate": 1.074046372475692e-05, + "loss": 0.2733, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15683802962303162, + "step": 360, + "valid_targets_mean": 1307.4, + "valid_targets_min": 906 + }, + { + "epoch": 0.19119958093242537, + "grad_norm": 0.9809027495356322, + "learning_rate": 1.0890052356020944e-05, + "loss": 0.2663, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14160452783107758, + "step": 365, + "valid_targets_mean": 1574.8, + "valid_targets_min": 808 + }, + { + "epoch": 0.19381875327396542, + "grad_norm": 1.1326103312750746, + "learning_rate": 1.1039640987284967e-05, + "loss": 0.2802, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1289289891719818, + "step": 370, + "valid_targets_mean": 1173.9, + "valid_targets_min": 913 + }, + { + "epoch": 0.1964379256155055, + "grad_norm": 1.1510183408232784, + "learning_rate": 1.1189229618548992e-05, + "loss": 0.2682, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1337447464466095, + "step": 375, + "valid_targets_mean": 1354.2, + "valid_targets_min": 821 + }, + { + "epoch": 0.19905709795704557, + "grad_norm": 1.0246072291580883, + "learning_rate": 1.1338818249813015e-05, + "loss": 0.2615, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12531915307044983, + "step": 380, + "valid_targets_mean": 1508.4, + "valid_targets_min": 1013 + }, + { + "epoch": 0.20167627029858565, + "grad_norm": 1.0553388175979033, + "learning_rate": 1.148840688107704e-05, + "loss": 0.2544, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12561854720115662, + "step": 385, + "valid_targets_mean": 1517.8, + "valid_targets_min": 781 + }, + { + "epoch": 0.20429544264012572, + "grad_norm": 1.1033328804149476, + "learning_rate": 1.1637995512341062e-05, + "loss": 0.2812, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11696565896272659, + "step": 390, + "valid_targets_mean": 1243.6, + "valid_targets_min": 548 + }, + { + "epoch": 0.2069146149816658, + "grad_norm": 1.4355990728777048, + "learning_rate": 1.1787584143605087e-05, + "loss": 0.2564, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12579873204231262, + "step": 395, + "valid_targets_mean": 1269.0, + "valid_targets_min": 694 + }, + { + "epoch": 0.20953378732320588, + "grad_norm": 0.9410901318700186, + "learning_rate": 1.193717277486911e-05, + "loss": 0.2662, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15521228313446045, + "step": 400, + "valid_targets_mean": 2141.0, + "valid_targets_min": 1030 + }, + { + "epoch": 0.21215295966474593, + "grad_norm": 0.8804587710612956, + "learning_rate": 1.2086761406133134e-05, + "loss": 0.2429, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11668536067008972, + "step": 405, + "valid_targets_mean": 1738.6, + "valid_targets_min": 682 + }, + { + "epoch": 0.214772132006286, + "grad_norm": 1.124066683984815, + "learning_rate": 1.2236350037397157e-05, + "loss": 0.2532, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13496944308280945, + "step": 410, + "valid_targets_mean": 1407.2, + "valid_targets_min": 990 + }, + { + "epoch": 0.21739130434782608, + "grad_norm": 0.9627302938369182, + "learning_rate": 1.2385938668661183e-05, + "loss": 0.2605, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11118908226490021, + "step": 415, + "valid_targets_mean": 1551.6, + "valid_targets_min": 639 + }, + { + "epoch": 0.22001047668936616, + "grad_norm": 1.0027093220955372, + "learning_rate": 1.2535527299925208e-05, + "loss": 0.265, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11878924071788788, + "step": 420, + "valid_targets_mean": 1442.6, + "valid_targets_min": 958 + }, + { + "epoch": 0.22262964903090623, + "grad_norm": 1.093327589386835, + "learning_rate": 1.268511593118923e-05, + "loss": 0.2583, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13007187843322754, + "step": 425, + "valid_targets_mean": 1426.5, + "valid_targets_min": 874 + }, + { + "epoch": 0.2252488213724463, + "grad_norm": 1.056589541047298, + "learning_rate": 1.2834704562453255e-05, + "loss": 0.2627, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12732923030853271, + "step": 430, + "valid_targets_mean": 1298.2, + "valid_targets_min": 557 + }, + { + "epoch": 0.2278679937139864, + "grad_norm": 1.12863022898657, + "learning_rate": 1.2984293193717278e-05, + "loss": 0.2672, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1605558842420578, + "step": 435, + "valid_targets_mean": 1472.2, + "valid_targets_min": 713 + }, + { + "epoch": 0.23048716605552647, + "grad_norm": 0.9272349364850403, + "learning_rate": 1.3133881824981303e-05, + "loss": 0.2744, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20511457324028015, + "step": 440, + "valid_targets_mean": 3139.9, + "valid_targets_min": 760 + }, + { + "epoch": 0.23310633839706651, + "grad_norm": 0.6592303408303113, + "learning_rate": 1.3283470456245326e-05, + "loss": 0.3305, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16108927130699158, + "step": 445, + "valid_targets_mean": 7612.6, + "valid_targets_min": 5111 + }, + { + "epoch": 0.2357255107386066, + "grad_norm": 0.6070904717684076, + "learning_rate": 1.343305908750935e-05, + "loss": 0.309, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15576837956905365, + "step": 450, + "valid_targets_mean": 6669.0, + "valid_targets_min": 4480 + }, + { + "epoch": 0.23834468308014667, + "grad_norm": 0.5605588322150622, + "learning_rate": 1.3582647718773375e-05, + "loss": 0.3049, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14649811387062073, + "step": 455, + "valid_targets_mean": 6538.6, + "valid_targets_min": 4620 + }, + { + "epoch": 0.24096385542168675, + "grad_norm": 0.5393212034322579, + "learning_rate": 1.3732236350037398e-05, + "loss": 0.2975, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15623930096626282, + "step": 460, + "valid_targets_mean": 6802.6, + "valid_targets_min": 4873 + }, + { + "epoch": 0.24358302776322682, + "grad_norm": 0.5656537757646136, + "learning_rate": 1.3881824981301422e-05, + "loss": 0.3118, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.180804044008255, + "step": 465, + "valid_targets_mean": 7563.2, + "valid_targets_min": 4229 + }, + { + "epoch": 0.2462022001047669, + "grad_norm": 0.6043634022436999, + "learning_rate": 1.4031413612565445e-05, + "loss": 0.2989, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16554348170757294, + "step": 470, + "valid_targets_mean": 6109.0, + "valid_targets_min": 4279 + }, + { + "epoch": 0.24882137244630698, + "grad_norm": 0.5674853412227062, + "learning_rate": 1.418100224382947e-05, + "loss": 0.2798, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11345628648996353, + "step": 475, + "valid_targets_mean": 5549.6, + "valid_targets_min": 4542 + }, + { + "epoch": 0.25144054478784705, + "grad_norm": 0.7434256656586965, + "learning_rate": 1.4330590875093493e-05, + "loss": 0.3047, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12726938724517822, + "step": 480, + "valid_targets_mean": 2525.8, + "valid_targets_min": 1497 + }, + { + "epoch": 0.25405971712938713, + "grad_norm": 0.5220549071443945, + "learning_rate": 1.4480179506357519e-05, + "loss": 0.2726, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14162325859069824, + "step": 485, + "valid_targets_mean": 6166.2, + "valid_targets_min": 5332 + }, + { + "epoch": 0.2566788894709272, + "grad_norm": 0.5352536558586826, + "learning_rate": 1.4629768137621543e-05, + "loss": 0.2711, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1418171525001526, + "step": 490, + "valid_targets_mean": 5823.5, + "valid_targets_min": 4612 + }, + { + "epoch": 0.2592980618124673, + "grad_norm": 0.49634651905061267, + "learning_rate": 1.4779356768885566e-05, + "loss": 0.2801, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1447383463382721, + "step": 495, + "valid_targets_mean": 6896.5, + "valid_targets_min": 4491 + }, + { + "epoch": 0.26191723415400736, + "grad_norm": 0.595603945724847, + "learning_rate": 1.4928945400149591e-05, + "loss": 0.2682, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13166537880897522, + "step": 500, + "valid_targets_mean": 6611.1, + "valid_targets_min": 4754 + }, + { + "epoch": 0.2645364064955474, + "grad_norm": 0.5393190418295071, + "learning_rate": 1.5078534031413614e-05, + "loss": 0.2597, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12661321461200714, + "step": 505, + "valid_targets_mean": 5907.1, + "valid_targets_min": 4787 + }, + { + "epoch": 0.26715557883708746, + "grad_norm": 0.4805967233196434, + "learning_rate": 1.5228122662677638e-05, + "loss": 0.2501, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12104909867048264, + "step": 510, + "valid_targets_mean": 6055.5, + "valid_targets_min": 5052 + }, + { + "epoch": 0.26977475117862754, + "grad_norm": 0.523906305492081, + "learning_rate": 1.5377711293941663e-05, + "loss": 0.2486, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11703436076641083, + "step": 515, + "valid_targets_mean": 6365.0, + "valid_targets_min": 4664 + }, + { + "epoch": 0.2723939235201676, + "grad_norm": 0.5224516826211744, + "learning_rate": 1.5527299925205686e-05, + "loss": 0.2656, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12053846567869186, + "step": 520, + "valid_targets_mean": 5928.2, + "valid_targets_min": 4211 + }, + { + "epoch": 0.2750130958617077, + "grad_norm": 0.48612267922315106, + "learning_rate": 1.567688855646971e-05, + "loss": 0.2612, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13059380650520325, + "step": 525, + "valid_targets_mean": 6415.9, + "valid_targets_min": 4582 + }, + { + "epoch": 0.27763226820324777, + "grad_norm": 0.5147679122113759, + "learning_rate": 1.582647718773373e-05, + "loss": 0.241, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10836943238973618, + "step": 530, + "valid_targets_mean": 6044.8, + "valid_targets_min": 4800 + }, + { + "epoch": 0.28025144054478784, + "grad_norm": 0.4734791716055116, + "learning_rate": 1.5976065818997758e-05, + "loss": 0.2353, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11990270763635635, + "step": 535, + "valid_targets_mean": 8009.0, + "valid_targets_min": 6651 + }, + { + "epoch": 0.2828706128863279, + "grad_norm": 1.140668751349671, + "learning_rate": 1.612565445026178e-05, + "loss": 0.2596, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1416817456483841, + "step": 540, + "valid_targets_mean": 5887.5, + "valid_targets_min": 3477 + }, + { + "epoch": 0.285489785227868, + "grad_norm": 0.5997001161199454, + "learning_rate": 1.6275243081525804e-05, + "loss": 0.2832, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1452217996120453, + "step": 545, + "valid_targets_mean": 5471.1, + "valid_targets_min": 965 + }, + { + "epoch": 0.2881089575694081, + "grad_norm": 0.5265818655921063, + "learning_rate": 1.6424831712789827e-05, + "loss": 0.2413, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1338367462158203, + "step": 550, + "valid_targets_mean": 6654.1, + "valid_targets_min": 5226 + }, + { + "epoch": 0.29072812991094815, + "grad_norm": 0.5748870112445678, + "learning_rate": 1.6574420344053853e-05, + "loss": 0.2518, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10587285459041595, + "step": 555, + "valid_targets_mean": 6363.4, + "valid_targets_min": 4213 + }, + { + "epoch": 0.29334730225248823, + "grad_norm": 0.5572025930451594, + "learning_rate": 1.672400897531788e-05, + "loss": 0.27, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13715760409832, + "step": 560, + "valid_targets_mean": 5469.9, + "valid_targets_min": 3761 + }, + { + "epoch": 0.2959664745940283, + "grad_norm": 0.4978200163320225, + "learning_rate": 1.6873597606581902e-05, + "loss": 0.2871, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16060104966163635, + "step": 565, + "valid_targets_mean": 7206.2, + "valid_targets_min": 4993 + }, + { + "epoch": 0.2985856469355684, + "grad_norm": 0.5876389734069661, + "learning_rate": 1.7023186237845925e-05, + "loss": 0.2815, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1361798644065857, + "step": 570, + "valid_targets_mean": 6402.2, + "valid_targets_min": 5199 + }, + { + "epoch": 0.30120481927710846, + "grad_norm": 0.49390495353916386, + "learning_rate": 1.7172774869109948e-05, + "loss": 0.257, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1463567018508911, + "step": 575, + "valid_targets_mean": 7578.1, + "valid_targets_min": 4534 + }, + { + "epoch": 0.3038239916186485, + "grad_norm": 0.8190322032239803, + "learning_rate": 1.7322363500373974e-05, + "loss": 0.2559, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11292055994272232, + "step": 580, + "valid_targets_mean": 6264.4, + "valid_targets_min": 4751 + }, + { + "epoch": 0.30644316396018856, + "grad_norm": 0.5825495479534828, + "learning_rate": 1.7471952131637997e-05, + "loss": 0.2546, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11191920191049576, + "step": 585, + "valid_targets_mean": 5604.1, + "valid_targets_min": 3888 + }, + { + "epoch": 0.30906233630172864, + "grad_norm": 0.6079995425568043, + "learning_rate": 1.762154076290202e-05, + "loss": 0.2632, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14392173290252686, + "step": 590, + "valid_targets_mean": 7001.6, + "valid_targets_min": 4455 + }, + { + "epoch": 0.3116815086432687, + "grad_norm": 0.5099427304498049, + "learning_rate": 1.7771129394166046e-05, + "loss": 0.252, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14200888574123383, + "step": 595, + "valid_targets_mean": 6955.5, + "valid_targets_min": 5230 + }, + { + "epoch": 0.3143006809848088, + "grad_norm": 0.5221532590692329, + "learning_rate": 1.792071802543007e-05, + "loss": 0.2576, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11283424496650696, + "step": 600, + "valid_targets_mean": 7295.8, + "valid_targets_min": 5668 + }, + { + "epoch": 0.31691985332634887, + "grad_norm": 0.6000692376731359, + "learning_rate": 1.8070306656694092e-05, + "loss": 0.2546, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13104653358459473, + "step": 605, + "valid_targets_mean": 6350.4, + "valid_targets_min": 4871 + }, + { + "epoch": 0.31953902566788894, + "grad_norm": 0.5108942792231622, + "learning_rate": 1.8219895287958115e-05, + "loss": 0.2418, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1462014615535736, + "step": 610, + "valid_targets_mean": 8015.2, + "valid_targets_min": 6018 + }, + { + "epoch": 0.322158198009429, + "grad_norm": 0.4384117592659271, + "learning_rate": 1.836948391922214e-05, + "loss": 0.2207, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11725406348705292, + "step": 615, + "valid_targets_mean": 7110.1, + "valid_targets_min": 3533 + }, + { + "epoch": 0.3247773703509691, + "grad_norm": 0.5213116308490782, + "learning_rate": 1.8519072550486164e-05, + "loss": 0.2543, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13383880257606506, + "step": 620, + "valid_targets_mean": 6875.0, + "valid_targets_min": 5199 + }, + { + "epoch": 0.3273965426925092, + "grad_norm": 0.5834532687839684, + "learning_rate": 1.866866118175019e-05, + "loss": 0.2551, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12733125686645508, + "step": 625, + "valid_targets_mean": 5568.4, + "valid_targets_min": 4923 + }, + { + "epoch": 0.33001571503404925, + "grad_norm": 0.519113028355725, + "learning_rate": 1.8818249813014213e-05, + "loss": 0.2494, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0986289530992508, + "step": 630, + "valid_targets_mean": 6421.9, + "valid_targets_min": 4527 + }, + { + "epoch": 0.3326348873755893, + "grad_norm": 0.8163787743694745, + "learning_rate": 1.8967838444278236e-05, + "loss": 0.2461, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1518421769142151, + "step": 635, + "valid_targets_mean": 7147.9, + "valid_targets_min": 3082 + }, + { + "epoch": 0.3352540597171294, + "grad_norm": 0.5104174282267507, + "learning_rate": 1.9117427075542262e-05, + "loss": 0.2262, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11866091936826706, + "step": 640, + "valid_targets_mean": 6880.6, + "valid_targets_min": 4685 + }, + { + "epoch": 0.3378732320586695, + "grad_norm": 0.570898453985933, + "learning_rate": 1.9267015706806285e-05, + "loss": 0.2479, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11430183053016663, + "step": 645, + "valid_targets_mean": 5915.5, + "valid_targets_min": 4875 + }, + { + "epoch": 0.34049240440020956, + "grad_norm": 0.5480651974305227, + "learning_rate": 1.9416604338070308e-05, + "loss": 0.247, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1123688668012619, + "step": 650, + "valid_targets_mean": 6234.5, + "valid_targets_min": 4433 + }, + { + "epoch": 0.3431115767417496, + "grad_norm": 0.5442230880157303, + "learning_rate": 1.956619296933433e-05, + "loss": 0.2364, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10760192573070526, + "step": 655, + "valid_targets_mean": 5684.0, + "valid_targets_min": 4540 + }, + { + "epoch": 0.34573074908328966, + "grad_norm": 0.5346676203693183, + "learning_rate": 1.9715781600598357e-05, + "loss": 0.2514, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15074855089187622, + "step": 660, + "valid_targets_mean": 7353.4, + "valid_targets_min": 5101 + }, + { + "epoch": 0.34834992142482973, + "grad_norm": 0.5824277658679824, + "learning_rate": 1.986537023186238e-05, + "loss": 0.2413, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10114076733589172, + "step": 665, + "valid_targets_mean": 5300.5, + "valid_targets_min": 4442 + }, + { + "epoch": 0.3509690937663698, + "grad_norm": 0.4835835842335859, + "learning_rate": 2.0014958863126406e-05, + "loss": 0.2111, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09848757833242416, + "step": 670, + "valid_targets_mean": 6084.1, + "valid_targets_min": 5268 + }, + { + "epoch": 0.3535882661079099, + "grad_norm": 0.48641986127969844, + "learning_rate": 2.016454749439043e-05, + "loss": 0.2142, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11454112082719803, + "step": 675, + "valid_targets_mean": 6446.6, + "valid_targets_min": 5074 + }, + { + "epoch": 0.35620743844944996, + "grad_norm": 0.4862581142799685, + "learning_rate": 2.0314136125654452e-05, + "loss": 0.2243, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10703176259994507, + "step": 680, + "valid_targets_mean": 6195.0, + "valid_targets_min": 5221 + }, + { + "epoch": 0.35882661079099004, + "grad_norm": 0.5438834169467284, + "learning_rate": 2.046372475691848e-05, + "loss": 0.2368, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11888057738542557, + "step": 685, + "valid_targets_mean": 5689.1, + "valid_targets_min": 4642 + }, + { + "epoch": 0.3614457831325301, + "grad_norm": 0.6833967212154707, + "learning_rate": 2.06133133881825e-05, + "loss": 0.2662, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13145872950553894, + "step": 690, + "valid_targets_mean": 4461.4, + "valid_targets_min": 3222 + }, + { + "epoch": 0.3640649554740702, + "grad_norm": 0.4757801544127953, + "learning_rate": 2.0762902019446524e-05, + "loss": 0.2772, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12056447565555573, + "step": 695, + "valid_targets_mean": 6822.2, + "valid_targets_min": 4371 + }, + { + "epoch": 0.3666841278156103, + "grad_norm": 0.6379502088686836, + "learning_rate": 2.0912490650710547e-05, + "loss": 0.2297, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12404558807611465, + "step": 700, + "valid_targets_mean": 5632.6, + "valid_targets_min": 3689 + }, + { + "epoch": 0.36930330015715035, + "grad_norm": 0.5476812114299602, + "learning_rate": 2.1062079281974573e-05, + "loss": 0.2392, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12419216334819794, + "step": 705, + "valid_targets_mean": 6364.1, + "valid_targets_min": 4281 + }, + { + "epoch": 0.3719224724986904, + "grad_norm": 0.5104513503681111, + "learning_rate": 2.1211667913238596e-05, + "loss": 0.2406, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1376412808895111, + "step": 710, + "valid_targets_mean": 6337.8, + "valid_targets_min": 4844 + }, + { + "epoch": 0.3745416448402305, + "grad_norm": 0.5204775395935077, + "learning_rate": 2.136125654450262e-05, + "loss": 0.2567, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10598008334636688, + "step": 715, + "valid_targets_mean": 5507.5, + "valid_targets_min": 4549 + }, + { + "epoch": 0.3771608171817706, + "grad_norm": 0.47648945431326273, + "learning_rate": 2.1510845175766645e-05, + "loss": 0.235, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1064852625131607, + "step": 720, + "valid_targets_mean": 5274.8, + "valid_targets_min": 2461 + }, + { + "epoch": 0.37977998952331066, + "grad_norm": 0.6232540892767168, + "learning_rate": 2.1660433807030668e-05, + "loss": 0.245, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13343873620033264, + "step": 725, + "valid_targets_mean": 6465.2, + "valid_targets_min": 2815 + }, + { + "epoch": 0.38239916186485073, + "grad_norm": 0.4884239403527553, + "learning_rate": 2.181002243829469e-05, + "loss": 0.2363, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10519768297672272, + "step": 730, + "valid_targets_mean": 6715.5, + "valid_targets_min": 5192 + }, + { + "epoch": 0.38501833420639076, + "grad_norm": 0.48078334521709176, + "learning_rate": 2.1959611069558714e-05, + "loss": 0.2158, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10113941133022308, + "step": 735, + "valid_targets_mean": 5737.2, + "valid_targets_min": 5186 + }, + { + "epoch": 0.38763750654793083, + "grad_norm": 0.4914084122068677, + "learning_rate": 2.210919970082274e-05, + "loss": 0.2324, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09212394058704376, + "step": 740, + "valid_targets_mean": 5329.5, + "valid_targets_min": 3786 + }, + { + "epoch": 0.3902566788894709, + "grad_norm": 0.556681897033246, + "learning_rate": 2.2258788332086763e-05, + "loss": 0.2831, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13327279686927795, + "step": 745, + "valid_targets_mean": 6233.8, + "valid_targets_min": 5147 + }, + { + "epoch": 0.392875851231011, + "grad_norm": 0.518177762534259, + "learning_rate": 2.2408376963350786e-05, + "loss": 0.2248, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13125228881835938, + "step": 750, + "valid_targets_mean": 5807.6, + "valid_targets_min": 3952 + }, + { + "epoch": 0.39549502357255106, + "grad_norm": 0.5591532007746006, + "learning_rate": 2.255796559461481e-05, + "loss": 0.2392, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13699626922607422, + "step": 755, + "valid_targets_mean": 6452.8, + "valid_targets_min": 5079 + }, + { + "epoch": 0.39811419591409114, + "grad_norm": 0.5270316309713508, + "learning_rate": 2.2707554225878835e-05, + "loss": 0.2452, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12873396277427673, + "step": 760, + "valid_targets_mean": 6432.9, + "valid_targets_min": 3762 + }, + { + "epoch": 0.4007333682556312, + "grad_norm": 0.46395489991397554, + "learning_rate": 2.2857142857142858e-05, + "loss": 0.2165, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1013445183634758, + "step": 765, + "valid_targets_mean": 5954.1, + "valid_targets_min": 4726 + }, + { + "epoch": 0.4033525405971713, + "grad_norm": 0.5726114581033401, + "learning_rate": 2.300673148840688e-05, + "loss": 0.2236, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12622445821762085, + "step": 770, + "valid_targets_mean": 5874.6, + "valid_targets_min": 3724 + }, + { + "epoch": 0.40597171293871137, + "grad_norm": 0.539701890419442, + "learning_rate": 2.3156320119670904e-05, + "loss": 0.2083, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10788456350564957, + "step": 775, + "valid_targets_mean": 6436.9, + "valid_targets_min": 5578 + }, + { + "epoch": 0.40859088528025145, + "grad_norm": 0.50097922607963, + "learning_rate": 2.330590875093493e-05, + "loss": 0.2296, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10845942050218582, + "step": 780, + "valid_targets_mean": 6727.8, + "valid_targets_min": 5795 + }, + { + "epoch": 0.4112100576217915, + "grad_norm": 0.4773488140437983, + "learning_rate": 2.3455497382198953e-05, + "loss": 0.2207, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09601639211177826, + "step": 785, + "valid_targets_mean": 6116.2, + "valid_targets_min": 5268 + }, + { + "epoch": 0.4138292299633316, + "grad_norm": 0.4195165425204695, + "learning_rate": 2.3605086013462976e-05, + "loss": 0.2224, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10880352556705475, + "step": 790, + "valid_targets_mean": 7379.5, + "valid_targets_min": 4920 + }, + { + "epoch": 0.4164484023048717, + "grad_norm": 0.4306956855558924, + "learning_rate": 2.3754674644727006e-05, + "loss": 0.2288, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08985568583011627, + "step": 795, + "valid_targets_mean": 7048.4, + "valid_targets_min": 5243 + }, + { + "epoch": 0.41906757464641176, + "grad_norm": 0.5369718687993797, + "learning_rate": 2.390426327599103e-05, + "loss": 0.2172, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12296460568904877, + "step": 800, + "valid_targets_mean": 6385.8, + "valid_targets_min": 4794 + }, + { + "epoch": 0.42168674698795183, + "grad_norm": 0.4941586673987478, + "learning_rate": 2.405385190725505e-05, + "loss": 0.2392, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10740514099597931, + "step": 805, + "valid_targets_mean": 6215.4, + "valid_targets_min": 5168 + }, + { + "epoch": 0.42430591932949185, + "grad_norm": 0.582899412841253, + "learning_rate": 2.4203440538519078e-05, + "loss": 0.2465, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.138446643948555, + "step": 810, + "valid_targets_mean": 5333.2, + "valid_targets_min": 3130 + }, + { + "epoch": 0.42692509167103193, + "grad_norm": 0.7098374759246038, + "learning_rate": 2.43530291697831e-05, + "loss": 0.3222, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17193308472633362, + "step": 815, + "valid_targets_mean": 5546.2, + "valid_targets_min": 1971 + }, + { + "epoch": 0.429544264012572, + "grad_norm": 0.7132928007433752, + "learning_rate": 2.4502617801047123e-05, + "loss": 0.3978, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2480137199163437, + "step": 820, + "valid_targets_mean": 5648.9, + "valid_targets_min": 1631 + }, + { + "epoch": 0.4321634363541121, + "grad_norm": 0.6728986690741761, + "learning_rate": 2.4652206432311146e-05, + "loss": 0.3876, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22709880769252777, + "step": 825, + "valid_targets_mean": 5411.4, + "valid_targets_min": 1509 + }, + { + "epoch": 0.43478260869565216, + "grad_norm": 0.644504704154439, + "learning_rate": 2.4801795063575172e-05, + "loss": 0.3675, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1710299700498581, + "step": 830, + "valid_targets_mean": 4960.2, + "valid_targets_min": 2736 + }, + { + "epoch": 0.43740178103719224, + "grad_norm": 0.603144229645836, + "learning_rate": 2.4951383694839195e-05, + "loss": 0.3715, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15948154032230377, + "step": 835, + "valid_targets_mean": 3726.8, + "valid_targets_min": 1439 + }, + { + "epoch": 0.4400209533787323, + "grad_norm": 0.6048927321251332, + "learning_rate": 2.5100972326103218e-05, + "loss": 0.3826, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16860568523406982, + "step": 840, + "valid_targets_mean": 4269.4, + "valid_targets_min": 1838 + }, + { + "epoch": 0.4426401257202724, + "grad_norm": 0.5645343149320301, + "learning_rate": 2.525056095736724e-05, + "loss": 0.3535, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22065946459770203, + "step": 845, + "valid_targets_mean": 5973.6, + "valid_targets_min": 2762 + }, + { + "epoch": 0.44525929806181247, + "grad_norm": 0.5696632258416167, + "learning_rate": 2.5400149588631267e-05, + "loss": 0.3636, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16765108704566956, + "step": 850, + "valid_targets_mean": 3987.1, + "valid_targets_min": 1654 + }, + { + "epoch": 0.44787847040335255, + "grad_norm": 0.5461627337763696, + "learning_rate": 2.554973821989529e-05, + "loss": 0.3634, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1650678813457489, + "step": 855, + "valid_targets_mean": 5043.6, + "valid_targets_min": 2493 + }, + { + "epoch": 0.4504976427448926, + "grad_norm": 0.6356464309990801, + "learning_rate": 2.5699326851159313e-05, + "loss": 0.3755, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17353945970535278, + "step": 860, + "valid_targets_mean": 4468.9, + "valid_targets_min": 874 + }, + { + "epoch": 0.4531168150864327, + "grad_norm": 0.5446940060410611, + "learning_rate": 2.584891548242334e-05, + "loss": 0.3598, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16391149163246155, + "step": 865, + "valid_targets_mean": 5241.0, + "valid_targets_min": 953 + }, + { + "epoch": 0.4557359874279728, + "grad_norm": 0.6074855741100244, + "learning_rate": 2.5998504113687362e-05, + "loss": 0.3662, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22667014598846436, + "step": 870, + "valid_targets_mean": 5277.0, + "valid_targets_min": 1265 + }, + { + "epoch": 0.45835515976951285, + "grad_norm": 0.5397370112483811, + "learning_rate": 2.6148092744951385e-05, + "loss": 0.357, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.189674511551857, + "step": 875, + "valid_targets_mean": 6127.8, + "valid_targets_min": 2566 + }, + { + "epoch": 0.46097433211105293, + "grad_norm": 0.6193870279812388, + "learning_rate": 2.6297681376215408e-05, + "loss": 0.3642, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1588752567768097, + "step": 880, + "valid_targets_mean": 3446.9, + "valid_targets_min": 1759 + }, + { + "epoch": 0.463593504452593, + "grad_norm": 0.7161305662391659, + "learning_rate": 2.6447270007479434e-05, + "loss": 0.3692, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18031099438667297, + "step": 885, + "valid_targets_mean": 3659.4, + "valid_targets_min": 2179 + }, + { + "epoch": 0.46621267679413303, + "grad_norm": 0.6833309594222867, + "learning_rate": 2.6596858638743457e-05, + "loss": 0.3705, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19416679441928864, + "step": 890, + "valid_targets_mean": 4161.5, + "valid_targets_min": 1785 + }, + { + "epoch": 0.4688318491356731, + "grad_norm": 0.6686531726084138, + "learning_rate": 2.674644727000748e-05, + "loss": 0.3619, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21306106448173523, + "step": 895, + "valid_targets_mean": 4467.9, + "valid_targets_min": 2345 + }, + { + "epoch": 0.4714510214772132, + "grad_norm": 0.6514316529464631, + "learning_rate": 2.6896035901271503e-05, + "loss": 0.3779, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2033441960811615, + "step": 900, + "valid_targets_mean": 4057.2, + "valid_targets_min": 2767 + }, + { + "epoch": 0.47407019381875326, + "grad_norm": 0.7367261083208211, + "learning_rate": 2.704562453253553e-05, + "loss": 0.3782, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19121892750263214, + "step": 905, + "valid_targets_mean": 3450.2, + "valid_targets_min": 1205 + }, + { + "epoch": 0.47668936616029334, + "grad_norm": 0.7078706067989683, + "learning_rate": 2.7195213163799552e-05, + "loss": 0.3673, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1769869178533554, + "step": 910, + "valid_targets_mean": 3777.1, + "valid_targets_min": 2004 + }, + { + "epoch": 0.4793085385018334, + "grad_norm": 0.6092132151273473, + "learning_rate": 2.7344801795063575e-05, + "loss": 0.3723, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1985096037387848, + "step": 915, + "valid_targets_mean": 4273.0, + "valid_targets_min": 1469 + }, + { + "epoch": 0.4819277108433735, + "grad_norm": 0.7040547478222255, + "learning_rate": 2.7494390426327598e-05, + "loss": 0.3514, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2201271951198578, + "step": 920, + "valid_targets_mean": 4196.8, + "valid_targets_min": 1889 + }, + { + "epoch": 0.48454688318491357, + "grad_norm": 0.6604000483479482, + "learning_rate": 2.7643979057591624e-05, + "loss": 0.3455, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18622466921806335, + "step": 925, + "valid_targets_mean": 4319.2, + "valid_targets_min": 2046 + }, + { + "epoch": 0.48716605552645365, + "grad_norm": 0.6969880777230246, + "learning_rate": 2.7793567688855647e-05, + "loss": 0.3496, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21243366599082947, + "step": 930, + "valid_targets_mean": 4580.1, + "valid_targets_min": 3373 + }, + { + "epoch": 0.4897852278679937, + "grad_norm": 0.7477837127123838, + "learning_rate": 2.7943156320119677e-05, + "loss": 0.3645, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18580077588558197, + "step": 935, + "valid_targets_mean": 3786.0, + "valid_targets_min": 1747 + }, + { + "epoch": 0.4924044002095338, + "grad_norm": 0.66746084891723, + "learning_rate": 2.80927449513837e-05, + "loss": 0.3639, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1607457548379898, + "step": 940, + "valid_targets_mean": 3339.9, + "valid_targets_min": 1166 + }, + { + "epoch": 0.4950235725510739, + "grad_norm": 0.6087369419354419, + "learning_rate": 2.8242333582647723e-05, + "loss": 0.3452, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17224672436714172, + "step": 945, + "valid_targets_mean": 4114.1, + "valid_targets_min": 1537 + }, + { + "epoch": 0.49764274489261395, + "grad_norm": 0.5999130824203768, + "learning_rate": 2.8391922213911745e-05, + "loss": 0.3457, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15660347044467926, + "step": 950, + "valid_targets_mean": 4550.4, + "valid_targets_min": 3119 + }, + { + "epoch": 0.500261917234154, + "grad_norm": 0.6722215026458347, + "learning_rate": 2.8541510845175772e-05, + "loss": 0.3584, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1680639684200287, + "step": 955, + "valid_targets_mean": 3810.8, + "valid_targets_min": 2562 + }, + { + "epoch": 0.5028810895756941, + "grad_norm": 0.666118761172745, + "learning_rate": 2.8691099476439795e-05, + "loss": 0.3535, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17258156836032867, + "step": 960, + "valid_targets_mean": 4045.5, + "valid_targets_min": 2659 + }, + { + "epoch": 0.5055002619172342, + "grad_norm": 0.7024796510442974, + "learning_rate": 2.8840688107703817e-05, + "loss": 0.342, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15005125105381012, + "step": 965, + "valid_targets_mean": 4064.8, + "valid_targets_min": 1349 + }, + { + "epoch": 0.5081194342587743, + "grad_norm": 0.7539571461509252, + "learning_rate": 2.899027673896784e-05, + "loss": 0.3495, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16101238131523132, + "step": 970, + "valid_targets_mean": 3371.4, + "valid_targets_min": 2474 + }, + { + "epoch": 0.5107386066003143, + "grad_norm": 0.7517420716020826, + "learning_rate": 2.9139865370231867e-05, + "loss": 0.3601, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14872035384178162, + "step": 975, + "valid_targets_mean": 2590.5, + "valid_targets_min": 738 + }, + { + "epoch": 0.5133577789418544, + "grad_norm": 0.6639925547944596, + "learning_rate": 2.928945400149589e-05, + "loss": 0.3364, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16390451788902283, + "step": 980, + "valid_targets_mean": 3570.5, + "valid_targets_min": 2033 + }, + { + "epoch": 0.5159769512833945, + "grad_norm": 0.7875063369111589, + "learning_rate": 2.9439042632759912e-05, + "loss": 0.3639, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1987815797328949, + "step": 985, + "valid_targets_mean": 2933.1, + "valid_targets_min": 1346 + }, + { + "epoch": 0.5185961236249346, + "grad_norm": 0.8229821761970155, + "learning_rate": 2.958863126402394e-05, + "loss": 0.356, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19160673022270203, + "step": 990, + "valid_targets_mean": 2991.1, + "valid_targets_min": 1821 + }, + { + "epoch": 0.5212152959664746, + "grad_norm": 0.6966642598769553, + "learning_rate": 2.973821989528796e-05, + "loss": 0.348, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16364285349845886, + "step": 995, + "valid_targets_mean": 3400.1, + "valid_targets_min": 2535 + }, + { + "epoch": 0.5238344683080147, + "grad_norm": 0.6969200634499667, + "learning_rate": 2.9887808526551984e-05, + "loss": 0.3399, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16623015701770782, + "step": 1000, + "valid_targets_mean": 3411.5, + "valid_targets_min": 2352 + }, + { + "epoch": 0.5264536406495547, + "grad_norm": 0.698223030299044, + "learning_rate": 3.0037397157816007e-05, + "loss": 0.3464, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15625500679016113, + "step": 1005, + "valid_targets_mean": 3319.8, + "valid_targets_min": 1153 + }, + { + "epoch": 0.5290728129910948, + "grad_norm": 0.66010760037979, + "learning_rate": 3.0186985789080034e-05, + "loss": 0.3412, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17209413647651672, + "step": 1010, + "valid_targets_mean": 3718.0, + "valid_targets_min": 2072 + }, + { + "epoch": 0.5316919853326348, + "grad_norm": 0.6744391263190171, + "learning_rate": 3.0336574420344056e-05, + "loss": 0.3529, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16139277815818787, + "step": 1015, + "valid_targets_mean": 3451.0, + "valid_targets_min": 922 + }, + { + "epoch": 0.5343111576741749, + "grad_norm": 0.6079834396763925, + "learning_rate": 3.048616305160808e-05, + "loss": 0.3482, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13819198310375214, + "step": 1020, + "valid_targets_mean": 3381.6, + "valid_targets_min": 1417 + }, + { + "epoch": 0.536930330015715, + "grad_norm": 0.5887998623425829, + "learning_rate": 3.06357516828721e-05, + "loss": 0.3442, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15055982768535614, + "step": 1025, + "valid_targets_mean": 4260.6, + "valid_targets_min": 1844 + }, + { + "epoch": 0.5395495023572551, + "grad_norm": 0.72423300552497, + "learning_rate": 3.078534031413613e-05, + "loss": 0.3443, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17637065052986145, + "step": 1030, + "valid_targets_mean": 3525.2, + "valid_targets_min": 1261 + }, + { + "epoch": 0.5421686746987951, + "grad_norm": 0.6296896185231665, + "learning_rate": 3.093492894540015e-05, + "loss": 0.3388, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20019851624965668, + "step": 1035, + "valid_targets_mean": 4548.6, + "valid_targets_min": 2077 + }, + { + "epoch": 0.5447878470403352, + "grad_norm": 0.6461874598516931, + "learning_rate": 3.1084517576664174e-05, + "loss": 0.345, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18294253945350647, + "step": 1040, + "valid_targets_mean": 4140.9, + "valid_targets_min": 2724 + }, + { + "epoch": 0.5474070193818753, + "grad_norm": 0.5734534078703716, + "learning_rate": 3.12341062079282e-05, + "loss": 0.333, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21917563676834106, + "step": 1045, + "valid_targets_mean": 5291.4, + "valid_targets_min": 2292 + }, + { + "epoch": 0.5500261917234154, + "grad_norm": 0.7655146463989795, + "learning_rate": 3.138369483919222e-05, + "loss": 0.3546, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17243260145187378, + "step": 1050, + "valid_targets_mean": 2965.1, + "valid_targets_min": 1377 + }, + { + "epoch": 0.5526453640649555, + "grad_norm": 0.6429273155264622, + "learning_rate": 3.1533283470456246e-05, + "loss": 0.3555, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15151354670524597, + "step": 1055, + "valid_targets_mean": 3099.5, + "valid_targets_min": 1350 + }, + { + "epoch": 0.5552645364064955, + "grad_norm": 0.666416181336385, + "learning_rate": 3.168287210172027e-05, + "loss": 0.3419, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16854865849018097, + "step": 1060, + "valid_targets_mean": 3031.9, + "valid_targets_min": 654 + }, + { + "epoch": 0.5578837087480356, + "grad_norm": 0.6585380604523907, + "learning_rate": 3.183246073298429e-05, + "loss": 0.3412, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13452671468257904, + "step": 1065, + "valid_targets_mean": 3463.8, + "valid_targets_min": 1706 + }, + { + "epoch": 0.5605028810895757, + "grad_norm": 0.6303742591532483, + "learning_rate": 3.198204936424832e-05, + "loss": 0.3465, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18186776340007782, + "step": 1070, + "valid_targets_mean": 4105.5, + "valid_targets_min": 1739 + }, + { + "epoch": 0.5631220534311158, + "grad_norm": 0.7100853348756141, + "learning_rate": 3.2131637995512345e-05, + "loss": 0.3423, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1468432992696762, + "step": 1075, + "valid_targets_mean": 2944.4, + "valid_targets_min": 1302 + }, + { + "epoch": 0.5657412257726558, + "grad_norm": 0.6102827886643082, + "learning_rate": 3.228122662677637e-05, + "loss": 0.3196, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1456199586391449, + "step": 1080, + "valid_targets_mean": 3531.5, + "valid_targets_min": 2501 + }, + { + "epoch": 0.5683603981141959, + "grad_norm": 0.5957194997566689, + "learning_rate": 3.243081525804039e-05, + "loss": 0.3376, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17194604873657227, + "step": 1085, + "valid_targets_mean": 4673.8, + "valid_targets_min": 3232 + }, + { + "epoch": 0.570979570455736, + "grad_norm": 0.6126169513308506, + "learning_rate": 3.258040388930442e-05, + "loss": 0.3195, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16547763347625732, + "step": 1090, + "valid_targets_mean": 4465.1, + "valid_targets_min": 1101 + }, + { + "epoch": 0.5735987427972761, + "grad_norm": 0.6659288984648957, + "learning_rate": 3.272999252056844e-05, + "loss": 0.3541, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1823541522026062, + "step": 1095, + "valid_targets_mean": 4113.2, + "valid_targets_min": 2079 + }, + { + "epoch": 0.5762179151388162, + "grad_norm": 0.6253409519694156, + "learning_rate": 3.287958115183246e-05, + "loss": 0.3324, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15754787623882294, + "step": 1100, + "valid_targets_mean": 3891.4, + "valid_targets_min": 2138 + }, + { + "epoch": 0.5788370874803562, + "grad_norm": 0.6051674142458731, + "learning_rate": 3.302916978309649e-05, + "loss": 0.3415, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16496360301971436, + "step": 1105, + "valid_targets_mean": 3470.2, + "valid_targets_min": 1234 + }, + { + "epoch": 0.5814562598218963, + "grad_norm": 0.6431340211396896, + "learning_rate": 3.3178758414360515e-05, + "loss": 0.3432, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1701410710811615, + "step": 1110, + "valid_targets_mean": 4038.5, + "valid_targets_min": 1822 + }, + { + "epoch": 0.5840754321634364, + "grad_norm": 0.5805445731574228, + "learning_rate": 3.3328347045624535e-05, + "loss": 0.35, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17148751020431519, + "step": 1115, + "valid_targets_mean": 4214.6, + "valid_targets_min": 1651 + }, + { + "epoch": 0.5866946045049765, + "grad_norm": 0.687079516708165, + "learning_rate": 3.347793567688856e-05, + "loss": 0.3395, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19782204926013947, + "step": 1120, + "valid_targets_mean": 3447.9, + "valid_targets_min": 1434 + }, + { + "epoch": 0.5893137768465165, + "grad_norm": 0.6211556614620224, + "learning_rate": 3.362752430815259e-05, + "loss": 0.328, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18377473950386047, + "step": 1125, + "valid_targets_mean": 4753.4, + "valid_targets_min": 2725 + }, + { + "epoch": 0.5919329491880566, + "grad_norm": 0.6201693042858446, + "learning_rate": 3.3777112939416607e-05, + "loss": 0.3277, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16360099613666534, + "step": 1130, + "valid_targets_mean": 4005.8, + "valid_targets_min": 1966 + }, + { + "epoch": 0.5945521215295967, + "grad_norm": 0.6141969340369716, + "learning_rate": 3.392670157068063e-05, + "loss": 0.3301, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1609821319580078, + "step": 1135, + "valid_targets_mean": 3669.0, + "valid_targets_min": 1407 + }, + { + "epoch": 0.5971712938711368, + "grad_norm": 0.6142388805501698, + "learning_rate": 3.407629020194465e-05, + "loss": 0.3288, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17364542186260223, + "step": 1140, + "valid_targets_mean": 4330.5, + "valid_targets_min": 1444 + }, + { + "epoch": 0.5997904662126768, + "grad_norm": 0.6084379669335195, + "learning_rate": 3.422587883320868e-05, + "loss": 0.3146, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1472238004207611, + "step": 1145, + "valid_targets_mean": 3077.8, + "valid_targets_min": 1504 + }, + { + "epoch": 0.6024096385542169, + "grad_norm": 0.611062889831383, + "learning_rate": 3.4375467464472705e-05, + "loss": 0.3208, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13173359632492065, + "step": 1150, + "valid_targets_mean": 3051.6, + "valid_targets_min": 858 + }, + { + "epoch": 0.6050288108957569, + "grad_norm": 0.6400296995620607, + "learning_rate": 3.4525056095736724e-05, + "loss": 0.3359, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1425532102584839, + "step": 1155, + "valid_targets_mean": 3231.8, + "valid_targets_min": 1288 + }, + { + "epoch": 0.607647983237297, + "grad_norm": 0.5966035226835973, + "learning_rate": 3.467464472700075e-05, + "loss": 0.3566, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16310977935791016, + "step": 1160, + "valid_targets_mean": 4053.0, + "valid_targets_min": 1537 + }, + { + "epoch": 0.610267155578837, + "grad_norm": 0.6248556637700886, + "learning_rate": 3.482423335826478e-05, + "loss": 0.3294, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16761454939842224, + "step": 1165, + "valid_targets_mean": 3917.1, + "valid_targets_min": 2060 + }, + { + "epoch": 0.6128863279203771, + "grad_norm": 0.6548057486516451, + "learning_rate": 3.4973821989528796e-05, + "loss": 0.3425, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18218758702278137, + "step": 1170, + "valid_targets_mean": 4482.6, + "valid_targets_min": 2515 + }, + { + "epoch": 0.6155055002619172, + "grad_norm": 0.6110367045018402, + "learning_rate": 3.512341062079282e-05, + "loss": 0.322, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1644124835729599, + "step": 1175, + "valid_targets_mean": 3847.2, + "valid_targets_min": 1744 + }, + { + "epoch": 0.6181246726034573, + "grad_norm": 0.5382561625787428, + "learning_rate": 3.527299925205684e-05, + "loss": 0.3334, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15760695934295654, + "step": 1180, + "valid_targets_mean": 5009.9, + "valid_targets_min": 2062 + }, + { + "epoch": 0.6207438449449973, + "grad_norm": 0.6120159820107818, + "learning_rate": 3.542258788332087e-05, + "loss": 0.3292, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15463533997535706, + "step": 1185, + "valid_targets_mean": 3550.4, + "valid_targets_min": 1181 + }, + { + "epoch": 0.6233630172865374, + "grad_norm": 0.6205449479706852, + "learning_rate": 3.5572176514584895e-05, + "loss": 0.3136, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17844107747077942, + "step": 1190, + "valid_targets_mean": 4010.6, + "valid_targets_min": 1937 + }, + { + "epoch": 0.6259821896280775, + "grad_norm": 0.6661879722953408, + "learning_rate": 3.5721765145848914e-05, + "loss": 0.3422, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20328474044799805, + "step": 1195, + "valid_targets_mean": 3624.9, + "valid_targets_min": 1649 + }, + { + "epoch": 0.6286013619696176, + "grad_norm": 0.7204535756744255, + "learning_rate": 3.587135377711294e-05, + "loss": 0.3239, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15000876784324646, + "step": 1200, + "valid_targets_mean": 2808.1, + "valid_targets_min": 1197 + }, + { + "epoch": 0.6312205343111577, + "grad_norm": 0.7212522617141228, + "learning_rate": 3.602094240837697e-05, + "loss": 0.339, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17222219705581665, + "step": 1205, + "valid_targets_mean": 3251.4, + "valid_targets_min": 1824 + }, + { + "epoch": 0.6338397066526977, + "grad_norm": 0.9133985994273064, + "learning_rate": 3.6170531039640986e-05, + "loss": 0.3435, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1720942258834839, + "step": 1210, + "valid_targets_mean": 3145.6, + "valid_targets_min": 538 + }, + { + "epoch": 0.6364588789942378, + "grad_norm": 0.607433859360118, + "learning_rate": 3.632011967090502e-05, + "loss": 0.3311, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14743439853191376, + "step": 1215, + "valid_targets_mean": 3597.1, + "valid_targets_min": 537 + }, + { + "epoch": 0.6390780513357779, + "grad_norm": 0.693537651034399, + "learning_rate": 3.646970830216904e-05, + "loss": 0.3632, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16639968752861023, + "step": 1220, + "valid_targets_mean": 3386.5, + "valid_targets_min": 2169 + }, + { + "epoch": 0.641697223677318, + "grad_norm": 0.6611300941454468, + "learning_rate": 3.6619296933433065e-05, + "loss": 0.3325, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17038226127624512, + "step": 1225, + "valid_targets_mean": 3687.6, + "valid_targets_min": 1625 + }, + { + "epoch": 0.644316396018858, + "grad_norm": 0.6004055429958011, + "learning_rate": 3.6768885564697085e-05, + "loss": 0.338, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14659348130226135, + "step": 1230, + "valid_targets_mean": 3807.0, + "valid_targets_min": 2642 + }, + { + "epoch": 0.6469355683603981, + "grad_norm": 0.6119002554696095, + "learning_rate": 3.691847419596111e-05, + "loss": 0.3455, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18825103342533112, + "step": 1235, + "valid_targets_mean": 4289.9, + "valid_targets_min": 2935 + }, + { + "epoch": 0.6495547407019382, + "grad_norm": 0.5296888652650795, + "learning_rate": 3.706806282722514e-05, + "loss": 0.34, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17498472332954407, + "step": 1240, + "valid_targets_mean": 5189.9, + "valid_targets_min": 2652 + }, + { + "epoch": 0.6521739130434783, + "grad_norm": 0.6212330116518527, + "learning_rate": 3.7217651458489157e-05, + "loss": 0.3409, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.221257746219635, + "step": 1245, + "valid_targets_mean": 4117.2, + "valid_targets_min": 648 + }, + { + "epoch": 0.6547930853850183, + "grad_norm": 0.6181123400246369, + "learning_rate": 3.736724008975318e-05, + "loss": 0.3405, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14589467644691467, + "step": 1250, + "valid_targets_mean": 3492.8, + "valid_targets_min": 637 + }, + { + "epoch": 0.6574122577265584, + "grad_norm": 0.6588912659727094, + "learning_rate": 3.751682872101721e-05, + "loss": 0.3393, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17551174759864807, + "step": 1255, + "valid_targets_mean": 3412.5, + "valid_targets_min": 719 + }, + { + "epoch": 0.6600314300680985, + "grad_norm": 0.5476010398843242, + "learning_rate": 3.766641735228123e-05, + "loss": 0.3346, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15114666521549225, + "step": 1260, + "valid_targets_mean": 4227.4, + "valid_targets_min": 2182 + }, + { + "epoch": 0.6626506024096386, + "grad_norm": 0.6126328425922989, + "learning_rate": 3.7816005983545255e-05, + "loss": 0.3249, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15365070104599, + "step": 1265, + "valid_targets_mean": 3211.1, + "valid_targets_min": 1372 + }, + { + "epoch": 0.6652697747511787, + "grad_norm": 0.6205042228668959, + "learning_rate": 3.796559461480928e-05, + "loss": 0.3172, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1903889924287796, + "step": 1270, + "valid_targets_mean": 4490.9, + "valid_targets_min": 2594 + }, + { + "epoch": 0.6678889470927187, + "grad_norm": 0.5812199952484004, + "learning_rate": 3.81151832460733e-05, + "loss": 0.3303, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14865991473197937, + "step": 1275, + "valid_targets_mean": 3054.6, + "valid_targets_min": 530 + }, + { + "epoch": 0.6705081194342588, + "grad_norm": 0.6461823490955528, + "learning_rate": 3.826477187733733e-05, + "loss": 0.3316, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21536710858345032, + "step": 1280, + "valid_targets_mean": 4110.2, + "valid_targets_min": 611 + }, + { + "epoch": 0.6731272917757989, + "grad_norm": 0.659991493743984, + "learning_rate": 3.8414360508601346e-05, + "loss": 0.3289, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1761910766363144, + "step": 1285, + "valid_targets_mean": 3804.2, + "valid_targets_min": 1987 + }, + { + "epoch": 0.675746464117339, + "grad_norm": 0.7018636647048128, + "learning_rate": 3.856394913986537e-05, + "loss": 0.3347, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16965290904045105, + "step": 1290, + "valid_targets_mean": 3203.2, + "valid_targets_min": 1362 + }, + { + "epoch": 0.678365636458879, + "grad_norm": 0.5842545058219607, + "learning_rate": 3.87135377711294e-05, + "loss": 0.3254, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1561589390039444, + "step": 1295, + "valid_targets_mean": 3245.1, + "valid_targets_min": 852 + }, + { + "epoch": 0.6809848088004191, + "grad_norm": 0.7090994749538716, + "learning_rate": 3.886312640239342e-05, + "loss": 0.3361, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13681864738464355, + "step": 1300, + "valid_targets_mean": 2537.4, + "valid_targets_min": 1195 + }, + { + "epoch": 0.6836039811419592, + "grad_norm": 0.6173257676382597, + "learning_rate": 3.9012715033657445e-05, + "loss": 0.3275, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17246338725090027, + "step": 1305, + "valid_targets_mean": 4383.0, + "valid_targets_min": 1397 + }, + { + "epoch": 0.6862231534834992, + "grad_norm": 0.565658382473205, + "learning_rate": 3.916230366492147e-05, + "loss": 0.3172, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12798964977264404, + "step": 1310, + "valid_targets_mean": 3421.0, + "valid_targets_min": 1975 + }, + { + "epoch": 0.6888423258250392, + "grad_norm": 0.6247345137814574, + "learning_rate": 3.931189229618549e-05, + "loss": 0.3099, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16652032732963562, + "step": 1315, + "valid_targets_mean": 4100.6, + "valid_targets_min": 2564 + }, + { + "epoch": 0.6914614981665793, + "grad_norm": 0.5083389735343604, + "learning_rate": 3.946148092744952e-05, + "loss": 0.3158, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14584901928901672, + "step": 1320, + "valid_targets_mean": 4986.9, + "valid_targets_min": 2595 + }, + { + "epoch": 0.6940806705081194, + "grad_norm": 0.5862521496377336, + "learning_rate": 3.9611069558713536e-05, + "loss": 0.3258, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18245020508766174, + "step": 1325, + "valid_targets_mean": 3992.9, + "valid_targets_min": 2845 + }, + { + "epoch": 0.6966998428496595, + "grad_norm": 0.72016307931705, + "learning_rate": 3.976065818997756e-05, + "loss": 0.3132, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1214650347828865, + "step": 1330, + "valid_targets_mean": 2390.1, + "valid_targets_min": 993 + }, + { + "epoch": 0.6993190151911995, + "grad_norm": 0.595404792324118, + "learning_rate": 3.991024682124159e-05, + "loss": 0.3129, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1291854977607727, + "step": 1335, + "valid_targets_mean": 3729.1, + "valid_targets_min": 1575 + }, + { + "epoch": 0.7019381875327396, + "grad_norm": 0.6414455374657542, + "learning_rate": 3.999999727028487e-05, + "loss": 0.3248, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17417430877685547, + "step": 1340, + "valid_targets_mean": 3469.0, + "valid_targets_min": 1360 + }, + { + "epoch": 0.7045573598742797, + "grad_norm": 0.6355175987771899, + "learning_rate": 3.999996656099815e-05, + "loss": 0.3136, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15191948413848877, + "step": 1345, + "valid_targets_mean": 3555.5, + "valid_targets_min": 2278 + }, + { + "epoch": 0.7071765322158198, + "grad_norm": 0.588717387625224, + "learning_rate": 3.999990173033336e-05, + "loss": 0.3435, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18690279126167297, + "step": 1350, + "valid_targets_mean": 3812.2, + "valid_targets_min": 1454 + }, + { + "epoch": 0.7097957045573599, + "grad_norm": 0.6344109053156491, + "learning_rate": 3.99998027784011e-05, + "loss": 0.3304, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17694224417209625, + "step": 1355, + "valid_targets_mean": 3796.6, + "valid_targets_min": 2344 + }, + { + "epoch": 0.7124148768988999, + "grad_norm": 0.7385041094604863, + "learning_rate": 3.999966970537021e-05, + "loss": 0.3294, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1743699014186859, + "step": 1360, + "valid_targets_mean": 3324.1, + "valid_targets_min": 1278 + }, + { + "epoch": 0.71503404924044, + "grad_norm": 0.6289043093306019, + "learning_rate": 3.999950251146769e-05, + "loss": 0.3133, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17869730293750763, + "step": 1365, + "valid_targets_mean": 3381.4, + "valid_targets_min": 1858 + }, + { + "epoch": 0.7176532215819801, + "grad_norm": 0.7124677183882361, + "learning_rate": 3.9999301196978804e-05, + "loss": 0.3244, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12725886702537537, + "step": 1370, + "valid_targets_mean": 2566.0, + "valid_targets_min": 420 + }, + { + "epoch": 0.7202723939235202, + "grad_norm": 0.6978765070091023, + "learning_rate": 3.9999065762247e-05, + "loss": 0.3187, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1442769169807434, + "step": 1375, + "valid_targets_mean": 2649.4, + "valid_targets_min": 1039 + }, + { + "epoch": 0.7228915662650602, + "grad_norm": 0.5703472717476405, + "learning_rate": 3.999879620767397e-05, + "loss": 0.3318, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1461399644613266, + "step": 1380, + "valid_targets_mean": 4475.1, + "valid_targets_min": 1737 + }, + { + "epoch": 0.7255107386066003, + "grad_norm": 0.6082942173366175, + "learning_rate": 3.999849253371956e-05, + "loss": 0.324, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1938718557357788, + "step": 1385, + "valid_targets_mean": 4150.8, + "valid_targets_min": 809 + }, + { + "epoch": 0.7281299109481404, + "grad_norm": 0.5986725851757726, + "learning_rate": 3.999815474090188e-05, + "loss": 0.322, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1633826494216919, + "step": 1390, + "valid_targets_mean": 3864.1, + "valid_targets_min": 1780 + }, + { + "epoch": 0.7307490832896805, + "grad_norm": 0.5941021429982363, + "learning_rate": 3.9997782829797225e-05, + "loss": 0.33, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1542864739894867, + "step": 1395, + "valid_targets_mean": 4058.0, + "valid_targets_min": 2185 + }, + { + "epoch": 0.7333682556312205, + "grad_norm": 0.7314816153433888, + "learning_rate": 3.99973768010401e-05, + "loss": 0.2847, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09025775641202927, + "step": 1400, + "valid_targets_mean": 2736.0, + "valid_targets_min": 876 + }, + { + "epoch": 0.7359874279727606, + "grad_norm": 0.7986663261684929, + "learning_rate": 3.9996936655323216e-05, + "loss": 0.1956, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0739547535777092, + "step": 1405, + "valid_targets_mean": 1472.5, + "valid_targets_min": 324 + }, + { + "epoch": 0.7386066003143007, + "grad_norm": 0.5158462550711758, + "learning_rate": 3.9996462393397505e-05, + "loss": 0.1507, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.086447574198246, + "step": 1410, + "valid_targets_mean": 2699.9, + "valid_targets_min": 1064 + }, + { + "epoch": 0.7412257726558408, + "grad_norm": 0.5424757814397492, + "learning_rate": 3.999595401607208e-05, + "loss": 0.1439, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07466402649879456, + "step": 1415, + "valid_targets_mean": 3137.0, + "valid_targets_min": 710 + }, + { + "epoch": 0.7438449449973809, + "grad_norm": 0.5353903699192518, + "learning_rate": 3.9995411524214275e-05, + "loss": 0.161, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05025868117809296, + "step": 1420, + "valid_targets_mean": 3472.9, + "valid_targets_min": 1223 + }, + { + "epoch": 0.7464641173389209, + "grad_norm": 0.5130922985032678, + "learning_rate": 3.999483491874962e-05, + "loss": 0.1463, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08507537841796875, + "step": 1425, + "valid_targets_mean": 3326.0, + "valid_targets_min": 1431 + }, + { + "epoch": 0.749083289680461, + "grad_norm": 0.8635294205181738, + "learning_rate": 3.999422420066184e-05, + "loss": 0.1984, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08754102885723114, + "step": 1430, + "valid_targets_mean": 1161.2, + "valid_targets_min": 559 + }, + { + "epoch": 0.7517024620220011, + "grad_norm": 0.46394205723150345, + "learning_rate": 3.9993579370992874e-05, + "loss": 0.1862, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06998488306999207, + "step": 1435, + "valid_targets_mean": 3598.2, + "valid_targets_min": 1623 + }, + { + "epoch": 0.7543216343635412, + "grad_norm": 0.49592682911702274, + "learning_rate": 3.9992900430842836e-05, + "loss": 0.1576, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0781191736459732, + "step": 1440, + "valid_targets_mean": 3178.2, + "valid_targets_min": 846 + }, + { + "epoch": 0.7569408067050812, + "grad_norm": 0.6450361626216348, + "learning_rate": 3.999218738137005e-05, + "loss": 0.2034, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13390403985977173, + "step": 1445, + "valid_targets_mean": 3622.6, + "valid_targets_min": 1949 + }, + { + "epoch": 0.7595599790466213, + "grad_norm": 0.41886270656201374, + "learning_rate": 3.999144022379103e-05, + "loss": 0.1169, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06320428848266602, + "step": 1450, + "valid_targets_mean": 3344.9, + "valid_targets_min": 764 + }, + { + "epoch": 0.7621791513881614, + "grad_norm": 0.5860692709334011, + "learning_rate": 3.9990658959380485e-05, + "loss": 0.1393, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0750679075717926, + "step": 1455, + "valid_targets_mean": 2391.6, + "valid_targets_min": 776 + }, + { + "epoch": 0.7647983237297015, + "grad_norm": 0.5010127595551124, + "learning_rate": 3.998984358947131e-05, + "loss": 0.1386, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07392105460166931, + "step": 1460, + "valid_targets_mean": 2818.5, + "valid_targets_min": 754 + }, + { + "epoch": 0.7674174960712414, + "grad_norm": 0.5866841846039216, + "learning_rate": 3.998899411545457e-05, + "loss": 0.1669, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08332496881484985, + "step": 1465, + "valid_targets_mean": 1646.6, + "valid_targets_min": 635 + }, + { + "epoch": 0.7700366684127815, + "grad_norm": 0.4642834513510014, + "learning_rate": 3.998811053877955e-05, + "loss": 0.1536, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07143302261829376, + "step": 1470, + "valid_targets_mean": 3374.8, + "valid_targets_min": 1862 + }, + { + "epoch": 0.7726558407543216, + "grad_norm": 0.515280742585236, + "learning_rate": 3.998719286095368e-05, + "loss": 0.1404, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08594658970832825, + "step": 1475, + "valid_targets_mean": 2837.4, + "valid_targets_min": 574 + }, + { + "epoch": 0.7752750130958617, + "grad_norm": 0.5213394719374975, + "learning_rate": 3.998624108354258e-05, + "loss": 0.1332, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06072106584906578, + "step": 1480, + "valid_targets_mean": 2618.4, + "valid_targets_min": 523 + }, + { + "epoch": 0.7778941854374017, + "grad_norm": 0.5070710235211495, + "learning_rate": 3.9985255208170065e-05, + "loss": 0.1322, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07832945883274078, + "step": 1485, + "valid_targets_mean": 3548.9, + "valid_targets_min": 2189 + }, + { + "epoch": 0.7805133577789418, + "grad_norm": 0.46229267557092607, + "learning_rate": 3.99842352365181e-05, + "loss": 0.1443, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05179700627923012, + "step": 1490, + "valid_targets_mean": 3564.6, + "valid_targets_min": 827 + }, + { + "epoch": 0.7831325301204819, + "grad_norm": 0.5527045613471703, + "learning_rate": 3.9983181170326835e-05, + "loss": 0.1586, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07232558727264404, + "step": 1495, + "valid_targets_mean": 1936.6, + "valid_targets_min": 597 + }, + { + "epoch": 0.785751702462022, + "grad_norm": 0.5620881757133277, + "learning_rate": 3.998209301139458e-05, + "loss": 0.1536, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06416729837656021, + "step": 1500, + "valid_targets_mean": 1747.5, + "valid_targets_min": 701 + }, + { + "epoch": 0.788370874803562, + "grad_norm": 0.605616319073172, + "learning_rate": 3.998097076157781e-05, + "loss": 0.1786, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1605839878320694, + "step": 1505, + "valid_targets_mean": 3329.6, + "valid_targets_min": 1652 + }, + { + "epoch": 0.7909900471451021, + "grad_norm": 0.46922548355435045, + "learning_rate": 3.997981442279117e-05, + "loss": 0.1549, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06859530508518219, + "step": 1510, + "valid_targets_mean": 3117.1, + "valid_targets_min": 786 + }, + { + "epoch": 0.7936092194866422, + "grad_norm": 0.7021593930917235, + "learning_rate": 3.997862399700744e-05, + "loss": 0.1323, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08121612668037415, + "step": 1515, + "valid_targets_mean": 2574.4, + "valid_targets_min": 971 + }, + { + "epoch": 0.7962283918281823, + "grad_norm": 0.4561349661914808, + "learning_rate": 3.99773994862576e-05, + "loss": 0.1846, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0743626058101654, + "step": 1520, + "valid_targets_mean": 3320.0, + "valid_targets_min": 2610 + }, + { + "epoch": 0.7988475641697224, + "grad_norm": 0.5086685356121075, + "learning_rate": 3.997614089263073e-05, + "loss": 0.1582, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.051420897245407104, + "step": 1525, + "valid_targets_mean": 2580.6, + "valid_targets_min": 753 + }, + { + "epoch": 0.8014667365112624, + "grad_norm": 0.6117088309504906, + "learning_rate": 3.997484821827409e-05, + "loss": 0.1444, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06646887958049774, + "step": 1530, + "valid_targets_mean": 1537.1, + "valid_targets_min": 619 + }, + { + "epoch": 0.8040859088528025, + "grad_norm": 0.5949023934852837, + "learning_rate": 3.9973521465393075e-05, + "loss": 0.3669, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15084227919578552, + "step": 1535, + "valid_targets_mean": 2271.2, + "valid_targets_min": 987 + }, + { + "epoch": 0.8067050811943426, + "grad_norm": 0.7502710001993674, + "learning_rate": 3.997216063625121e-05, + "loss": 0.1631, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07774441689252853, + "step": 1540, + "valid_targets_mean": 1351.5, + "valid_targets_min": 329 + }, + { + "epoch": 0.8093242535358827, + "grad_norm": 0.606702731963554, + "learning_rate": 3.997076573317019e-05, + "loss": 0.1445, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06768237799406052, + "step": 1545, + "valid_targets_mean": 1553.9, + "valid_targets_min": 608 + }, + { + "epoch": 0.8119434258774227, + "grad_norm": 0.5191457016879443, + "learning_rate": 3.9969336758529804e-05, + "loss": 0.2531, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0957370176911354, + "step": 1550, + "valid_targets_mean": 3645.6, + "valid_targets_min": 873 + }, + { + "epoch": 0.8145625982189628, + "grad_norm": 0.3155287206576497, + "learning_rate": 3.996787371476799e-05, + "loss": 0.1225, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.034252800047397614, + "step": 1555, + "valid_targets_mean": 4720.6, + "valid_targets_min": 3529 + }, + { + "epoch": 0.8171817705605029, + "grad_norm": 0.4212640247312681, + "learning_rate": 3.9966376604380795e-05, + "loss": 0.1411, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07607945054769516, + "step": 1560, + "valid_targets_mean": 4437.6, + "valid_targets_min": 2336 + }, + { + "epoch": 0.819800942902043, + "grad_norm": 0.39620114331915346, + "learning_rate": 3.9964845429922405e-05, + "loss": 0.1372, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06097068265080452, + "step": 1565, + "valid_targets_mean": 3533.1, + "valid_targets_min": 1226 + }, + { + "epoch": 0.822420115243583, + "grad_norm": 0.41995034506751305, + "learning_rate": 3.996328019400512e-05, + "loss": 0.1334, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06280517578125, + "step": 1570, + "valid_targets_mean": 3299.2, + "valid_targets_min": 798 + }, + { + "epoch": 0.8250392875851231, + "grad_norm": 0.46326861768093075, + "learning_rate": 3.996168089929934e-05, + "loss": 0.1262, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.052490413188934326, + "step": 1575, + "valid_targets_mean": 1836.9, + "valid_targets_min": 723 + }, + { + "epoch": 0.8276584599266632, + "grad_norm": 0.5055429997269286, + "learning_rate": 3.996004754853356e-05, + "loss": 0.1288, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.063631571829319, + "step": 1580, + "valid_targets_mean": 3316.0, + "valid_targets_min": 898 + }, + { + "epoch": 0.8302776322682033, + "grad_norm": 0.3514177365249329, + "learning_rate": 3.995838014449442e-05, + "loss": 0.1212, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.047119513154029846, + "step": 1585, + "valid_targets_mean": 4027.2, + "valid_targets_min": 3278 + }, + { + "epoch": 0.8328968046097434, + "grad_norm": 0.5531182262228151, + "learning_rate": 3.9956678690026625e-05, + "loss": 0.132, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.061042577028274536, + "step": 1590, + "valid_targets_mean": 2052.8, + "valid_targets_min": 739 + }, + { + "epoch": 0.8355159769512834, + "grad_norm": 0.7755795660820791, + "learning_rate": 3.995494318803297e-05, + "loss": 0.174, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07252795249223709, + "step": 1595, + "valid_targets_mean": 1574.9, + "valid_targets_min": 538 + }, + { + "epoch": 0.8381351492928235, + "grad_norm": 0.625425729205124, + "learning_rate": 3.995317364147434e-05, + "loss": 0.1096, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.050821200013160706, + "step": 1600, + "valid_targets_mean": 1956.9, + "valid_targets_min": 654 + }, + { + "epoch": 0.8407543216343636, + "grad_norm": 0.5634458011817362, + "learning_rate": 3.9951370053369726e-05, + "loss": 0.1296, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07513399422168732, + "step": 1605, + "valid_targets_mean": 2735.4, + "valid_targets_min": 930 + }, + { + "epoch": 0.8433734939759037, + "grad_norm": 0.48760076249445794, + "learning_rate": 3.994953242679617e-05, + "loss": 0.1162, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06778737157583237, + "step": 1610, + "valid_targets_mean": 2965.0, + "valid_targets_min": 684 + }, + { + "epoch": 0.8459926663174437, + "grad_norm": 0.4572772548812646, + "learning_rate": 3.994766076488879e-05, + "loss": 0.1866, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06816256791353226, + "step": 1615, + "valid_targets_mean": 3344.6, + "valid_targets_min": 999 + }, + { + "epoch": 0.8486118386589837, + "grad_norm": 0.65505384257651, + "learning_rate": 3.994575507084078e-05, + "loss": 0.1418, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07841216027736664, + "step": 1620, + "valid_targets_mean": 2445.4, + "valid_targets_min": 696 + }, + { + "epoch": 0.8512310110005238, + "grad_norm": 0.4517191751461857, + "learning_rate": 3.994381534790339e-05, + "loss": 0.159, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07189537584781647, + "step": 1625, + "valid_targets_mean": 3514.9, + "valid_targets_min": 1068 + }, + { + "epoch": 0.8538501833420639, + "grad_norm": 0.5158046190436185, + "learning_rate": 3.994184159938593e-05, + "loss": 0.1412, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.060847245156764984, + "step": 1630, + "valid_targets_mean": 1602.8, + "valid_targets_min": 536 + }, + { + "epoch": 0.8564693556836039, + "grad_norm": 0.5277377242693408, + "learning_rate": 3.993983382865576e-05, + "loss": 0.1975, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14055420458316803, + "step": 1635, + "valid_targets_mean": 3568.8, + "valid_targets_min": 1507 + }, + { + "epoch": 0.859088528025144, + "grad_norm": 0.5069279427908884, + "learning_rate": 3.993779203913827e-05, + "loss": 0.1428, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06706821918487549, + "step": 1640, + "valid_targets_mean": 3292.2, + "valid_targets_min": 2342 + }, + { + "epoch": 0.8617077003666841, + "grad_norm": 0.6963105091913101, + "learning_rate": 3.99357162343169e-05, + "loss": 0.1733, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08217508345842361, + "step": 1645, + "valid_targets_mean": 1567.5, + "valid_targets_min": 687 + }, + { + "epoch": 0.8643268727082242, + "grad_norm": 0.626309530814196, + "learning_rate": 3.993360641773313e-05, + "loss": 0.1332, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0423566959798336, + "step": 1650, + "valid_targets_mean": 1145.4, + "valid_targets_min": 449 + }, + { + "epoch": 0.8669460450497642, + "grad_norm": 0.42519785233247775, + "learning_rate": 3.993146259298646e-05, + "loss": 0.1385, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05637018382549286, + "step": 1655, + "valid_targets_mean": 3191.0, + "valid_targets_min": 658 + }, + { + "epoch": 0.8695652173913043, + "grad_norm": 0.7088187288825465, + "learning_rate": 3.99292847637344e-05, + "loss": 0.1386, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08269469439983368, + "step": 1660, + "valid_targets_mean": 1924.8, + "valid_targets_min": 577 + }, + { + "epoch": 0.8721843897328444, + "grad_norm": 0.3732596807976658, + "learning_rate": 3.9927072933692484e-05, + "loss": 0.1135, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05370637774467468, + "step": 1665, + "valid_targets_mean": 3992.5, + "valid_targets_min": 726 + }, + { + "epoch": 0.8748035620743845, + "grad_norm": 0.4134721656759607, + "learning_rate": 3.992482710663426e-05, + "loss": 0.1138, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06572000682353973, + "step": 1670, + "valid_targets_mean": 3626.4, + "valid_targets_min": 2252 + }, + { + "epoch": 0.8774227344159246, + "grad_norm": 0.5202339996629215, + "learning_rate": 3.992254728639127e-05, + "loss": 0.1246, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05162326991558075, + "step": 1675, + "valid_targets_mean": 1556.2, + "valid_targets_min": 531 + }, + { + "epoch": 0.8800419067574646, + "grad_norm": 0.4644389455013823, + "learning_rate": 3.9920233476853035e-05, + "loss": 0.1503, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06630605459213257, + "step": 1680, + "valid_targets_mean": 2410.5, + "valid_targets_min": 744 + }, + { + "epoch": 0.8826610790990047, + "grad_norm": 0.45822935132382786, + "learning_rate": 3.99178856819671e-05, + "loss": 0.1395, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07550811767578125, + "step": 1685, + "valid_targets_mean": 3795.1, + "valid_targets_min": 3136 + }, + { + "epoch": 0.8852802514405448, + "grad_norm": 0.37909483938475036, + "learning_rate": 3.991550390573897e-05, + "loss": 0.1227, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.052796460688114166, + "step": 1690, + "valid_targets_mean": 3324.4, + "valid_targets_min": 2366 + }, + { + "epoch": 0.8878994237820849, + "grad_norm": 0.4170391242135034, + "learning_rate": 3.9913088152232105e-05, + "loss": 0.1212, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04679000750184059, + "step": 1695, + "valid_targets_mean": 1668.1, + "valid_targets_min": 669 + }, + { + "epoch": 0.8905185961236249, + "grad_norm": 0.47835404906149454, + "learning_rate": 3.9910638425567975e-05, + "loss": 0.149, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07802337408065796, + "step": 1700, + "valid_targets_mean": 3529.8, + "valid_targets_min": 1785 + }, + { + "epoch": 0.893137768465165, + "grad_norm": 0.31806325971087684, + "learning_rate": 3.990815472992598e-05, + "loss": 0.109, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05754898488521576, + "step": 1705, + "valid_targets_mean": 4120.1, + "valid_targets_min": 3862 + }, + { + "epoch": 0.8957569408067051, + "grad_norm": 0.4547597012813676, + "learning_rate": 3.9905637069543486e-05, + "loss": 0.1318, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.059976283460855484, + "step": 1710, + "valid_targets_mean": 3062.2, + "valid_targets_min": 539 + }, + { + "epoch": 0.8983761131482452, + "grad_norm": 0.4378450620162749, + "learning_rate": 3.9903085448715805e-05, + "loss": 0.1389, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05159597843885422, + "step": 1715, + "valid_targets_mean": 2781.5, + "valid_targets_min": 1016 + }, + { + "epoch": 0.9009952854897852, + "grad_norm": 0.7506102404125042, + "learning_rate": 3.990049987179618e-05, + "loss": 0.1495, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08937472850084305, + "step": 1720, + "valid_targets_mean": 1102.9, + "valid_targets_min": 888 + }, + { + "epoch": 0.9036144578313253, + "grad_norm": 0.5309387154494348, + "learning_rate": 3.98978803431958e-05, + "loss": 0.1366, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05678325146436691, + "step": 1725, + "valid_targets_mean": 2602.5, + "valid_targets_min": 697 + }, + { + "epoch": 0.9062336301728654, + "grad_norm": 0.6742771489158552, + "learning_rate": 3.989522686738375e-05, + "loss": 0.1378, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08440111577510834, + "step": 1730, + "valid_targets_mean": 1592.9, + "valid_targets_min": 605 + }, + { + "epoch": 0.9088528025144055, + "grad_norm": 0.4610770926209317, + "learning_rate": 3.989253944888707e-05, + "loss": 0.1341, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05471458286046982, + "step": 1735, + "valid_targets_mean": 2899.1, + "valid_targets_min": 1117 + }, + { + "epoch": 0.9114719748559456, + "grad_norm": 0.4341204746225806, + "learning_rate": 3.988981809229067e-05, + "loss": 0.1598, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.059293102473020554, + "step": 1740, + "valid_targets_mean": 3376.6, + "valid_targets_min": 1388 + }, + { + "epoch": 0.9140911471974856, + "grad_norm": 0.407443066879257, + "learning_rate": 3.98870628022374e-05, + "loss": 0.1287, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05706991255283356, + "step": 1745, + "valid_targets_mean": 3243.4, + "valid_targets_min": 524 + }, + { + "epoch": 0.9167103195390257, + "grad_norm": 0.4697544449354311, + "learning_rate": 3.988427358342797e-05, + "loss": 0.1175, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05848868936300278, + "step": 1750, + "valid_targets_mean": 2468.0, + "valid_targets_min": 970 + }, + { + "epoch": 0.9193294918805658, + "grad_norm": 0.48937162451685806, + "learning_rate": 3.9881450440620994e-05, + "loss": 0.1428, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06698908656835556, + "step": 1755, + "valid_targets_mean": 2959.6, + "valid_targets_min": 877 + }, + { + "epoch": 0.9219486642221059, + "grad_norm": 0.35050547101950813, + "learning_rate": 3.987859337863295e-05, + "loss": 0.1385, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05743839591741562, + "step": 1760, + "valid_targets_mean": 3886.5, + "valid_targets_min": 3251 + }, + { + "epoch": 0.9245678365636459, + "grad_norm": 0.5895188068394133, + "learning_rate": 3.98757024023382e-05, + "loss": 0.1152, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06867806613445282, + "step": 1765, + "valid_targets_mean": 2695.6, + "valid_targets_min": 564 + }, + { + "epoch": 0.927187008905186, + "grad_norm": 0.3473075470152696, + "learning_rate": 3.9872777516668935e-05, + "loss": 0.1228, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06826956570148468, + "step": 1770, + "valid_targets_mean": 4404.8, + "valid_targets_min": 2555 + }, + { + "epoch": 0.929806181246726, + "grad_norm": 0.3421684036177156, + "learning_rate": 3.9869818726615245e-05, + "loss": 0.1133, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05443980544805527, + "step": 1775, + "valid_targets_mean": 4410.5, + "valid_targets_min": 3261 + }, + { + "epoch": 0.9324253535882661, + "grad_norm": 0.4417010057915673, + "learning_rate": 3.9866826037225025e-05, + "loss": 0.1046, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04898755997419357, + "step": 1780, + "valid_targets_mean": 1768.5, + "valid_targets_min": 618 + }, + { + "epoch": 0.9350445259298061, + "grad_norm": 0.3543811897370335, + "learning_rate": 3.9863799453604026e-05, + "loss": 0.1331, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05469723045825958, + "step": 1785, + "valid_targets_mean": 3985.8, + "valid_targets_min": 3213 + }, + { + "epoch": 0.9376636982713462, + "grad_norm": 0.4264038979036985, + "learning_rate": 3.986073898091581e-05, + "loss": 0.1289, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.118505097925663, + "step": 1790, + "valid_targets_mean": 3149.1, + "valid_targets_min": 1539 + }, + { + "epoch": 0.9402828706128863, + "grad_norm": 0.3789345301334967, + "learning_rate": 3.985764462438176e-05, + "loss": 0.1392, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04531242698431015, + "step": 1795, + "valid_targets_mean": 2094.8, + "valid_targets_min": 509 + }, + { + "epoch": 0.9429020429544264, + "grad_norm": 0.34121951059745015, + "learning_rate": 3.985451638928108e-05, + "loss": 0.1291, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0372382327914238, + "step": 1800, + "valid_targets_mean": 2441.4, + "valid_targets_min": 633 + }, + { + "epoch": 0.9455212152959664, + "grad_norm": 0.42942031033018574, + "learning_rate": 3.9851354280950756e-05, + "loss": 0.1558, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06137951835989952, + "step": 1805, + "valid_targets_mean": 2740.9, + "valid_targets_min": 737 + }, + { + "epoch": 0.9481403876375065, + "grad_norm": 0.36405462270761896, + "learning_rate": 3.9848158304785576e-05, + "loss": 0.1141, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.056062668561935425, + "step": 1810, + "valid_targets_mean": 2726.9, + "valid_targets_min": 492 + }, + { + "epoch": 0.9507595599790466, + "grad_norm": 0.6623352936503045, + "learning_rate": 3.984492846623811e-05, + "loss": 0.1427, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08910174667835236, + "step": 1815, + "valid_targets_mean": 1607.9, + "valid_targets_min": 833 + }, + { + "epoch": 0.9533787323205867, + "grad_norm": 0.35061832091732376, + "learning_rate": 3.984166477081868e-05, + "loss": 0.1194, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03973294422030449, + "step": 1820, + "valid_targets_mean": 3502.6, + "valid_targets_min": 923 + }, + { + "epoch": 0.9559979046621268, + "grad_norm": 0.6962754339523737, + "learning_rate": 3.983836722409539e-05, + "loss": 0.1792, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08447998017072678, + "step": 1825, + "valid_targets_mean": 1553.9, + "valid_targets_min": 531 + }, + { + "epoch": 0.9586170770036668, + "grad_norm": 0.5601831525746735, + "learning_rate": 3.98350358316941e-05, + "loss": 0.1617, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10630452632904053, + "step": 1830, + "valid_targets_mean": 1825.6, + "valid_targets_min": 575 + }, + { + "epoch": 0.9612362493452069, + "grad_norm": 0.5004613077270998, + "learning_rate": 3.9831670599298394e-05, + "loss": 0.1264, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06777000427246094, + "step": 1835, + "valid_targets_mean": 3701.9, + "valid_targets_min": 2784 + }, + { + "epoch": 0.963855421686747, + "grad_norm": 0.38095623986806926, + "learning_rate": 3.9828271532649595e-05, + "loss": 0.1248, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05625955015420914, + "step": 1840, + "valid_targets_mean": 3575.8, + "valid_targets_min": 2525 + }, + { + "epoch": 0.9664745940282871, + "grad_norm": 0.3645503223771157, + "learning_rate": 3.9824838637546774e-05, + "loss": 0.122, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04756051301956177, + "step": 1845, + "valid_targets_mean": 3081.0, + "valid_targets_min": 970 + }, + { + "epoch": 0.9690937663698271, + "grad_norm": 0.49645775656429314, + "learning_rate": 3.982137191984668e-05, + "loss": 0.1184, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06135290116071701, + "step": 1850, + "valid_targets_mean": 1963.5, + "valid_targets_min": 817 + }, + { + "epoch": 0.9717129387113672, + "grad_norm": 0.7974570176042606, + "learning_rate": 3.98178713854638e-05, + "loss": 0.1544, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10152144730091095, + "step": 1855, + "valid_targets_mean": 1270.9, + "valid_targets_min": 637 + }, + { + "epoch": 0.9743321110529073, + "grad_norm": 0.4046465137561532, + "learning_rate": 3.981433704037027e-05, + "loss": 0.1109, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05127967149019241, + "step": 1860, + "valid_targets_mean": 2594.1, + "valid_targets_min": 893 + }, + { + "epoch": 0.9769512833944474, + "grad_norm": 0.3493509574031833, + "learning_rate": 3.981076889059596e-05, + "loss": 0.116, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05416160076856613, + "step": 1865, + "valid_targets_mean": 3222.2, + "valid_targets_min": 1606 + }, + { + "epoch": 0.9795704557359874, + "grad_norm": 0.4105765185711659, + "learning_rate": 3.980716694222838e-05, + "loss": 0.1234, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06041751429438591, + "step": 1870, + "valid_targets_mean": 3023.8, + "valid_targets_min": 678 + }, + { + "epoch": 0.9821896280775275, + "grad_norm": 0.3137716102916606, + "learning_rate": 3.9803531201412716e-05, + "loss": 0.1285, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0552176833152771, + "step": 1875, + "valid_targets_mean": 4263.8, + "valid_targets_min": 1078 + }, + { + "epoch": 0.9848088004190676, + "grad_norm": 0.38076869047499096, + "learning_rate": 3.9799861674351794e-05, + "loss": 0.1091, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06345896422863007, + "step": 1880, + "valid_targets_mean": 4150.0, + "valid_targets_min": 761 + }, + { + "epoch": 0.9874279727606077, + "grad_norm": 0.4944113710787087, + "learning_rate": 3.9796158367306095e-05, + "loss": 0.1231, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06043882295489311, + "step": 1885, + "valid_targets_mean": 1368.4, + "valid_targets_min": 538 + }, + { + "epoch": 0.9900471451021478, + "grad_norm": 0.5854892130133516, + "learning_rate": 3.979242128659373e-05, + "loss": 0.1399, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11408171057701111, + "step": 1890, + "valid_targets_mean": 2630.4, + "valid_targets_min": 780 + }, + { + "epoch": 0.9926663174436878, + "grad_norm": 0.37841290083701706, + "learning_rate": 3.9788650438590425e-05, + "loss": 0.2078, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.051241979002952576, + "step": 1895, + "valid_targets_mean": 3353.9, + "valid_targets_min": 2347 + }, + { + "epoch": 0.9952854897852279, + "grad_norm": 0.43927741316702157, + "learning_rate": 3.9784845829729516e-05, + "loss": 0.1205, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07244317978620529, + "step": 1900, + "valid_targets_mean": 3880.2, + "valid_targets_min": 2473 + }, + { + "epoch": 0.997904662126768, + "grad_norm": 0.4138312053437435, + "learning_rate": 3.978100746650194e-05, + "loss": 0.119, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06079757958650589, + "step": 1905, + "valid_targets_mean": 3556.4, + "valid_targets_min": 2245 + }, + { + "epoch": 1.000523834468308, + "grad_norm": 1.194369845882971, + "learning_rate": 3.977713535545622e-05, + "loss": 0.1952, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1503610908985138, + "step": 1910, + "valid_targets_mean": 1492.2, + "valid_targets_min": 544 + }, + { + "epoch": 1.0031430068098481, + "grad_norm": 0.9818625513655856, + "learning_rate": 3.9773229503198455e-05, + "loss": 0.2881, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13344977796077728, + "step": 1915, + "valid_targets_mean": 1270.4, + "valid_targets_min": 632 + }, + { + "epoch": 1.0057621791513882, + "grad_norm": 1.0052963104092862, + "learning_rate": 3.976928991639231e-05, + "loss": 0.2637, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11686259508132935, + "step": 1920, + "valid_targets_mean": 1358.4, + "valid_targets_min": 753 + }, + { + "epoch": 1.0083813514929283, + "grad_norm": 0.9433402217216043, + "learning_rate": 3.9765316601759e-05, + "loss": 0.2602, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13791446387767792, + "step": 1925, + "valid_targets_mean": 1413.0, + "valid_targets_min": 701 + }, + { + "epoch": 1.0110005238344684, + "grad_norm": 0.7703734046875843, + "learning_rate": 3.976130956607729e-05, + "loss": 0.2488, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15123215317726135, + "step": 1930, + "valid_targets_mean": 1745.6, + "valid_targets_min": 754 + }, + { + "epoch": 1.0136196961760084, + "grad_norm": 0.8156969109616492, + "learning_rate": 3.9757268816183464e-05, + "loss": 0.2496, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13424146175384521, + "step": 1935, + "valid_targets_mean": 1337.9, + "valid_targets_min": 746 + }, + { + "epoch": 1.0162388685175485, + "grad_norm": 0.762245798336208, + "learning_rate": 3.975319435897134e-05, + "loss": 0.2569, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13536062836647034, + "step": 1940, + "valid_targets_mean": 1728.8, + "valid_targets_min": 970 + }, + { + "epoch": 1.0188580408590886, + "grad_norm": 0.7655927328602858, + "learning_rate": 3.9749086201392224e-05, + "loss": 0.2354, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1405276507139206, + "step": 1945, + "valid_targets_mean": 1569.5, + "valid_targets_min": 648 + }, + { + "epoch": 1.0214772132006287, + "grad_norm": 0.8729326295398971, + "learning_rate": 3.9744944350454935e-05, + "loss": 0.2598, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15222492814064026, + "step": 1950, + "valid_targets_mean": 1538.8, + "valid_targets_min": 727 + }, + { + "epoch": 1.0240963855421688, + "grad_norm": 0.724871270354201, + "learning_rate": 3.9740768813225765e-05, + "loss": 0.2335, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09660930931568146, + "step": 1955, + "valid_targets_mean": 1519.5, + "valid_targets_min": 788 + }, + { + "epoch": 1.0267155578837088, + "grad_norm": 0.807519620375925, + "learning_rate": 3.973655959682847e-05, + "loss": 0.2419, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1028185710310936, + "step": 1960, + "valid_targets_mean": 1325.1, + "valid_targets_min": 627 + }, + { + "epoch": 1.029334730225249, + "grad_norm": 0.8629622918174555, + "learning_rate": 3.9732316708444306e-05, + "loss": 0.2469, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15766587853431702, + "step": 1965, + "valid_targets_mean": 1732.4, + "valid_targets_min": 633 + }, + { + "epoch": 1.031953902566789, + "grad_norm": 0.7916278926192974, + "learning_rate": 3.9728040155311906e-05, + "loss": 0.2407, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13446414470672607, + "step": 1970, + "valid_targets_mean": 1525.6, + "valid_targets_min": 923 + }, + { + "epoch": 1.034573074908329, + "grad_norm": 0.8942876139817988, + "learning_rate": 3.972372994472741e-05, + "loss": 0.231, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12159556150436401, + "step": 1975, + "valid_targets_mean": 1603.5, + "valid_targets_min": 740 + }, + { + "epoch": 1.0371922472498691, + "grad_norm": 0.778377599100849, + "learning_rate": 3.971938608404432e-05, + "loss": 0.229, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11791212856769562, + "step": 1980, + "valid_targets_mean": 1757.0, + "valid_targets_min": 895 + }, + { + "epoch": 1.0398114195914092, + "grad_norm": 0.7636176226363194, + "learning_rate": 3.9715008580673595e-05, + "loss": 0.2227, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11560601741075516, + "step": 1985, + "valid_targets_mean": 1391.5, + "valid_targets_min": 1005 + }, + { + "epoch": 1.0424305919329493, + "grad_norm": 0.8014038325436506, + "learning_rate": 3.9710597442083555e-05, + "loss": 0.2463, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08947145193815231, + "step": 1990, + "valid_targets_mean": 1217.1, + "valid_targets_min": 870 + }, + { + "epoch": 1.0450497642744894, + "grad_norm": 0.8699500894472375, + "learning_rate": 3.970615267579993e-05, + "loss": 0.2442, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12444935739040375, + "step": 1995, + "valid_targets_mean": 1619.1, + "valid_targets_min": 879 + }, + { + "epoch": 1.0476689366160294, + "grad_norm": 0.7436468038034245, + "learning_rate": 3.97016742894058e-05, + "loss": 0.2417, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1077117770910263, + "step": 2000, + "valid_targets_mean": 1507.5, + "valid_targets_min": 906 + }, + { + "epoch": 1.0502881089575693, + "grad_norm": 0.80509332534856, + "learning_rate": 3.969716229054162e-05, + "loss": 0.2357, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14222241938114166, + "step": 2005, + "valid_targets_mean": 1707.1, + "valid_targets_min": 814 + }, + { + "epoch": 1.0529072812991094, + "grad_norm": 0.7612458704908245, + "learning_rate": 3.969261668690518e-05, + "loss": 0.232, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10558472573757172, + "step": 2010, + "valid_targets_mean": 1747.9, + "valid_targets_min": 832 + }, + { + "epoch": 1.0555264536406495, + "grad_norm": 0.6753537286936889, + "learning_rate": 3.9688037486251615e-05, + "loss": 0.2381, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09377558529376984, + "step": 2015, + "valid_targets_mean": 1581.9, + "valid_targets_min": 891 + }, + { + "epoch": 1.0581456259821895, + "grad_norm": 0.7688444067608663, + "learning_rate": 3.9683424696393355e-05, + "loss": 0.2395, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1449514925479889, + "step": 2020, + "valid_targets_mean": 1746.8, + "valid_targets_min": 1052 + }, + { + "epoch": 1.0607647983237296, + "grad_norm": 0.7971853412990318, + "learning_rate": 3.9678778325200164e-05, + "loss": 0.2225, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11333002150058746, + "step": 2025, + "valid_targets_mean": 1469.5, + "valid_targets_min": 737 + }, + { + "epoch": 1.0633839706652697, + "grad_norm": 0.7484228655586582, + "learning_rate": 3.967409838059908e-05, + "loss": 0.233, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11924304068088531, + "step": 2030, + "valid_targets_mean": 1762.2, + "valid_targets_min": 1062 + }, + { + "epoch": 1.0660031430068098, + "grad_norm": 0.7785912990514914, + "learning_rate": 3.966938487057442e-05, + "loss": 0.2223, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12280270457267761, + "step": 2035, + "valid_targets_mean": 1482.1, + "valid_targets_min": 805 + }, + { + "epoch": 1.0686223153483498, + "grad_norm": 0.6860369029184382, + "learning_rate": 3.9664637803167775e-05, + "loss": 0.23, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12503057718276978, + "step": 2040, + "valid_targets_mean": 1962.8, + "valid_targets_min": 1253 + }, + { + "epoch": 1.07124148768989, + "grad_norm": 0.7513660699268863, + "learning_rate": 3.965985718647798e-05, + "loss": 0.2308, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13035273551940918, + "step": 2045, + "valid_targets_mean": 1958.0, + "valid_targets_min": 1264 + }, + { + "epoch": 1.07386066003143, + "grad_norm": 0.8647787964953808, + "learning_rate": 3.965504302866112e-05, + "loss": 0.2248, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09549619257450104, + "step": 2050, + "valid_targets_mean": 1201.4, + "valid_targets_min": 613 + }, + { + "epoch": 1.07647983237297, + "grad_norm": 0.8658928820184512, + "learning_rate": 3.965019533793048e-05, + "loss": 0.2257, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11795791238546371, + "step": 2055, + "valid_targets_mean": 1559.0, + "valid_targets_min": 768 + }, + { + "epoch": 1.0790990047145101, + "grad_norm": 0.8542433100391335, + "learning_rate": 3.964531412255657e-05, + "loss": 0.225, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11437257379293442, + "step": 2060, + "valid_targets_mean": 1210.0, + "valid_targets_min": 714 + }, + { + "epoch": 1.0817181770560502, + "grad_norm": 0.859546874634809, + "learning_rate": 3.96403993908671e-05, + "loss": 0.2346, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09374754875898361, + "step": 2065, + "valid_targets_mean": 1242.2, + "valid_targets_min": 841 + }, + { + "epoch": 1.0843373493975903, + "grad_norm": 0.7231260646891682, + "learning_rate": 3.963545115124695e-05, + "loss": 0.2227, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1218329519033432, + "step": 2070, + "valid_targets_mean": 1708.1, + "valid_targets_min": 936 + }, + { + "epoch": 1.0869565217391304, + "grad_norm": 1.0871171462012361, + "learning_rate": 3.963046941213818e-05, + "loss": 0.2224, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10440310835838318, + "step": 2075, + "valid_targets_mean": 1163.1, + "valid_targets_min": 746 + }, + { + "epoch": 1.0895756940806705, + "grad_norm": 0.8386367512159356, + "learning_rate": 3.962545418203999e-05, + "loss": 0.2079, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1122165396809578, + "step": 2080, + "valid_targets_mean": 1380.4, + "valid_targets_min": 814 + }, + { + "epoch": 1.0921948664222105, + "grad_norm": 0.7611728018818952, + "learning_rate": 3.9620405469508714e-05, + "loss": 0.2239, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14091750979423523, + "step": 2085, + "valid_targets_mean": 1625.4, + "valid_targets_min": 635 + }, + { + "epoch": 1.0948140387637506, + "grad_norm": 0.7671597940815614, + "learning_rate": 3.9615323283157825e-05, + "loss": 0.2215, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08596023917198181, + "step": 2090, + "valid_targets_mean": 1153.4, + "valid_targets_min": 734 + }, + { + "epoch": 1.0974332111052907, + "grad_norm": 1.0130613386512692, + "learning_rate": 3.96102076316579e-05, + "loss": 0.2213, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12400378286838531, + "step": 2095, + "valid_targets_mean": 1487.1, + "valid_targets_min": 831 + }, + { + "epoch": 1.1000523834468308, + "grad_norm": 0.7349219723401507, + "learning_rate": 3.96050585237366e-05, + "loss": 0.2248, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1018712967634201, + "step": 2100, + "valid_targets_mean": 1479.1, + "valid_targets_min": 1015 + }, + { + "epoch": 1.1026715557883708, + "grad_norm": 0.7265585575593051, + "learning_rate": 3.959987596817868e-05, + "loss": 0.2255, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1054868996143341, + "step": 2105, + "valid_targets_mean": 1366.5, + "valid_targets_min": 711 + }, + { + "epoch": 1.105290728129911, + "grad_norm": 0.7170020320852712, + "learning_rate": 3.9594659973825956e-05, + "loss": 0.2183, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07551706582307816, + "step": 2110, + "valid_targets_mean": 1318.1, + "valid_targets_min": 736 + }, + { + "epoch": 1.107909900471451, + "grad_norm": 0.8668127695322749, + "learning_rate": 3.958941054957728e-05, + "loss": 0.2256, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13176393508911133, + "step": 2115, + "valid_targets_mean": 1541.2, + "valid_targets_min": 931 + }, + { + "epoch": 1.110529072812991, + "grad_norm": 0.7426866355102264, + "learning_rate": 3.958412770438854e-05, + "loss": 0.2298, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11150750517845154, + "step": 2120, + "valid_targets_mean": 1790.2, + "valid_targets_min": 1011 + }, + { + "epoch": 1.1131482451545311, + "grad_norm": 0.79793910226458, + "learning_rate": 3.957881144727266e-05, + "loss": 0.2365, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12302378565073013, + "step": 2125, + "valid_targets_mean": 1511.6, + "valid_targets_min": 748 + }, + { + "epoch": 1.1157674174960712, + "grad_norm": 0.8529625169049818, + "learning_rate": 3.957346178729956e-05, + "loss": 0.2214, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11573164165019989, + "step": 2130, + "valid_targets_mean": 1568.1, + "valid_targets_min": 699 + }, + { + "epoch": 1.1183865898376113, + "grad_norm": 0.852495053036662, + "learning_rate": 3.956807873359613e-05, + "loss": 0.2162, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09075269103050232, + "step": 2135, + "valid_targets_mean": 1002.4, + "valid_targets_min": 534 + }, + { + "epoch": 1.1210057621791514, + "grad_norm": 0.7757396558566536, + "learning_rate": 3.9562662295346256e-05, + "loss": 0.2281, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10594692826271057, + "step": 2140, + "valid_targets_mean": 1367.1, + "valid_targets_min": 687 + }, + { + "epoch": 1.1236249345206915, + "grad_norm": 0.7465660688593253, + "learning_rate": 3.955721248179076e-05, + "loss": 0.2211, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08780340850353241, + "step": 2145, + "valid_targets_mean": 1259.8, + "valid_targets_min": 835 + }, + { + "epoch": 1.1262441068622315, + "grad_norm": 0.7539584899370625, + "learning_rate": 3.9551729302227436e-05, + "loss": 0.2138, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10159491002559662, + "step": 2150, + "valid_targets_mean": 1330.9, + "valid_targets_min": 829 + }, + { + "epoch": 1.1288632792037716, + "grad_norm": 0.8467666052896952, + "learning_rate": 3.9546212766010956e-05, + "loss": 0.2124, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11529254913330078, + "step": 2155, + "valid_targets_mean": 1756.4, + "valid_targets_min": 1138 + }, + { + "epoch": 1.1314824515453117, + "grad_norm": 0.6862128095142289, + "learning_rate": 3.9540662882552944e-05, + "loss": 0.227, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13152453303337097, + "step": 2160, + "valid_targets_mean": 1799.8, + "valid_targets_min": 1174 + }, + { + "epoch": 1.1341016238868518, + "grad_norm": 0.8123483728194234, + "learning_rate": 3.95350796613219e-05, + "loss": 0.2204, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10572031140327454, + "step": 2165, + "valid_targets_mean": 1524.5, + "valid_targets_min": 554 + }, + { + "epoch": 1.1367207962283918, + "grad_norm": 0.747590190784486, + "learning_rate": 3.9529463111843186e-05, + "loss": 0.2185, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10925063490867615, + "step": 2170, + "valid_targets_mean": 1367.2, + "valid_targets_min": 843 + }, + { + "epoch": 1.139339968569932, + "grad_norm": 0.9388007763174887, + "learning_rate": 3.952381324369905e-05, + "loss": 0.2129, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10343623161315918, + "step": 2175, + "valid_targets_mean": 1673.1, + "valid_targets_min": 849 + }, + { + "epoch": 1.141959140911472, + "grad_norm": 0.8653252025215202, + "learning_rate": 3.951813006652856e-05, + "loss": 0.2246, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11683325469493866, + "step": 2180, + "valid_targets_mean": 1509.0, + "valid_targets_min": 612 + }, + { + "epoch": 1.144578313253012, + "grad_norm": 0.9278457407371539, + "learning_rate": 3.951241359002764e-05, + "loss": 0.2157, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10242593288421631, + "step": 2185, + "valid_targets_mean": 1401.0, + "valid_targets_min": 841 + }, + { + "epoch": 1.1471974855945521, + "grad_norm": 0.8022037075812134, + "learning_rate": 3.950666382394901e-05, + "loss": 0.2157, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13213659822940826, + "step": 2190, + "valid_targets_mean": 1564.8, + "valid_targets_min": 746 + }, + { + "epoch": 1.1498166579360922, + "grad_norm": 0.7516270705204289, + "learning_rate": 3.9500880778102163e-05, + "loss": 0.2107, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08958139270544052, + "step": 2195, + "valid_targets_mean": 1293.1, + "valid_targets_min": 822 + }, + { + "epoch": 1.1524358302776323, + "grad_norm": 0.7547102416422085, + "learning_rate": 3.949506446235341e-05, + "loss": 0.1997, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10334242880344391, + "step": 2200, + "valid_targets_mean": 1731.0, + "valid_targets_min": 670 + }, + { + "epoch": 1.1550550026191724, + "grad_norm": 1.1197584829502087, + "learning_rate": 3.9489214886625794e-05, + "loss": 0.2185, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12101603299379349, + "step": 2205, + "valid_targets_mean": 1624.1, + "valid_targets_min": 647 + }, + { + "epoch": 1.1576741749607125, + "grad_norm": 1.0909042034318837, + "learning_rate": 3.948333206089912e-05, + "loss": 0.2118, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08762732148170471, + "step": 2210, + "valid_targets_mean": 1429.1, + "valid_targets_min": 952 + }, + { + "epoch": 1.1602933473022525, + "grad_norm": 0.8287334070305442, + "learning_rate": 3.947741599520989e-05, + "loss": 0.2141, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09083770215511322, + "step": 2215, + "valid_targets_mean": 1222.5, + "valid_targets_min": 746 + }, + { + "epoch": 1.1629125196437926, + "grad_norm": 0.7422438956164562, + "learning_rate": 3.947146669965136e-05, + "loss": 0.2147, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09345854818820953, + "step": 2220, + "valid_targets_mean": 1417.8, + "valid_targets_min": 892 + }, + { + "epoch": 1.1655316919853327, + "grad_norm": 0.8067699975678834, + "learning_rate": 3.9465484184373445e-05, + "loss": 0.2205, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12448067218065262, + "step": 2225, + "valid_targets_mean": 1636.0, + "valid_targets_min": 985 + }, + { + "epoch": 1.1681508643268728, + "grad_norm": 0.7594608853046841, + "learning_rate": 3.945946845958274e-05, + "loss": 0.2124, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10024244338274002, + "step": 2230, + "valid_targets_mean": 1505.0, + "valid_targets_min": 636 + }, + { + "epoch": 1.1707700366684128, + "grad_norm": 0.7324083576368025, + "learning_rate": 3.945341953554251e-05, + "loss": 0.2139, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09119733422994614, + "step": 2235, + "valid_targets_mean": 1286.5, + "valid_targets_min": 641 + }, + { + "epoch": 1.173389209009953, + "grad_norm": 0.7323386488755297, + "learning_rate": 3.944733742257266e-05, + "loss": 0.2201, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12102872133255005, + "step": 2240, + "valid_targets_mean": 1567.5, + "valid_targets_min": 1020 + }, + { + "epoch": 1.176008381351493, + "grad_norm": 0.795772920577501, + "learning_rate": 3.9441222131049696e-05, + "loss": 0.2186, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09501123428344727, + "step": 2245, + "valid_targets_mean": 1252.4, + "valid_targets_min": 729 + }, + { + "epoch": 1.178627553693033, + "grad_norm": 0.829365981248302, + "learning_rate": 3.943507367140676e-05, + "loss": 0.2271, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13544471561908722, + "step": 2250, + "valid_targets_mean": 1518.2, + "valid_targets_min": 682 + }, + { + "epoch": 1.1812467260345731, + "grad_norm": 0.6910621458994263, + "learning_rate": 3.9428892054133546e-05, + "loss": 0.2218, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11135991662740707, + "step": 2255, + "valid_targets_mean": 1619.2, + "valid_targets_min": 1260 + }, + { + "epoch": 1.1838658983761132, + "grad_norm": 0.7852480038349146, + "learning_rate": 3.942267728977635e-05, + "loss": 0.221, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14127010107040405, + "step": 2260, + "valid_targets_mean": 1575.4, + "valid_targets_min": 906 + }, + { + "epoch": 1.1864850707176533, + "grad_norm": 0.7630474982212205, + "learning_rate": 3.941642938893801e-05, + "loss": 0.2185, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11815932393074036, + "step": 2265, + "valid_targets_mean": 1608.1, + "valid_targets_min": 801 + }, + { + "epoch": 1.1891042430591934, + "grad_norm": 0.6949087723774056, + "learning_rate": 3.9410148362277884e-05, + "loss": 0.2097, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1087980642914772, + "step": 2270, + "valid_targets_mean": 1414.8, + "valid_targets_min": 564 + }, + { + "epoch": 1.1917234154007335, + "grad_norm": 0.7277531366323761, + "learning_rate": 3.940383422051185e-05, + "loss": 0.212, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10609061270952225, + "step": 2275, + "valid_targets_mean": 1512.5, + "valid_targets_min": 651 + }, + { + "epoch": 1.1943425877422735, + "grad_norm": 0.730344588104479, + "learning_rate": 3.93974869744123e-05, + "loss": 0.2217, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09614178538322449, + "step": 2280, + "valid_targets_mean": 1262.4, + "valid_targets_min": 716 + }, + { + "epoch": 1.1969617600838136, + "grad_norm": 0.7297937012909113, + "learning_rate": 3.939110663480809e-05, + "loss": 0.2102, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09250747412443161, + "step": 2285, + "valid_targets_mean": 1230.0, + "valid_targets_min": 704 + }, + { + "epoch": 1.1995809324253537, + "grad_norm": 0.7617396957992164, + "learning_rate": 3.9384693212584524e-05, + "loss": 0.2052, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0926002711057663, + "step": 2290, + "valid_targets_mean": 1497.5, + "valid_targets_min": 1251 + }, + { + "epoch": 1.2022001047668938, + "grad_norm": 0.7539149132777555, + "learning_rate": 3.9378246718683374e-05, + "loss": 0.2098, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10801123082637787, + "step": 2295, + "valid_targets_mean": 1470.8, + "valid_targets_min": 764 + }, + { + "epoch": 1.2048192771084336, + "grad_norm": 0.9524084561164579, + "learning_rate": 3.937176716410281e-05, + "loss": 0.2294, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10383504629135132, + "step": 2300, + "valid_targets_mean": 1469.4, + "valid_targets_min": 846 + }, + { + "epoch": 1.207438449449974, + "grad_norm": 0.7372489587943898, + "learning_rate": 3.9365254559897426e-05, + "loss": 0.2046, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11510239541530609, + "step": 2305, + "valid_targets_mean": 1774.4, + "valid_targets_min": 1011 + }, + { + "epoch": 1.2100576217915138, + "grad_norm": 0.6890782437617907, + "learning_rate": 3.9358708917178194e-05, + "loss": 0.2135, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09536474198102951, + "step": 2310, + "valid_targets_mean": 1558.9, + "valid_targets_min": 823 + }, + { + "epoch": 1.212676794133054, + "grad_norm": 0.6239930558716202, + "learning_rate": 3.9352130247112444e-05, + "loss": 0.1889, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1046057790517807, + "step": 2315, + "valid_targets_mean": 1687.6, + "valid_targets_min": 595 + }, + { + "epoch": 1.215295966474594, + "grad_norm": 0.7836318798739531, + "learning_rate": 3.934551856092386e-05, + "loss": 0.2101, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10032084584236145, + "step": 2320, + "valid_targets_mean": 1336.9, + "valid_targets_min": 868 + }, + { + "epoch": 1.2179151388161342, + "grad_norm": 0.8601781857987808, + "learning_rate": 3.933887386989245e-05, + "loss": 0.2095, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11940158158540726, + "step": 2325, + "valid_targets_mean": 1266.6, + "valid_targets_min": 818 + }, + { + "epoch": 1.220534311157674, + "grad_norm": 0.8009716500949716, + "learning_rate": 3.933219618535454e-05, + "loss": 0.212, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.129446879029274, + "step": 2330, + "valid_targets_mean": 1976.8, + "valid_targets_min": 1080 + }, + { + "epoch": 1.2231534834992142, + "grad_norm": 0.7492745681712601, + "learning_rate": 3.932548551870273e-05, + "loss": 0.2084, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11948906630277634, + "step": 2335, + "valid_targets_mean": 1554.1, + "valid_targets_min": 658 + }, + { + "epoch": 1.2257726558407542, + "grad_norm": 0.7850723118104741, + "learning_rate": 3.9318741881385906e-05, + "loss": 0.2141, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09871551394462585, + "step": 2340, + "valid_targets_mean": 1499.6, + "valid_targets_min": 1018 + }, + { + "epoch": 1.2283918281822943, + "grad_norm": 0.6772448031374775, + "learning_rate": 3.9311965284909205e-05, + "loss": 0.2215, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10974691808223724, + "step": 2345, + "valid_targets_mean": 1475.5, + "valid_targets_min": 897 + }, + { + "epoch": 1.2310110005238344, + "grad_norm": 0.5016573935407069, + "learning_rate": 3.930515574083397e-05, + "loss": 0.2265, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12183630466461182, + "step": 2350, + "valid_targets_mean": 7107.2, + "valid_targets_min": 5295 + }, + { + "epoch": 1.2336301728653745, + "grad_norm": 0.42133670248430216, + "learning_rate": 3.929831326077779e-05, + "loss": 0.2323, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12615281343460083, + "step": 2355, + "valid_targets_mean": 7098.2, + "valid_targets_min": 5066 + }, + { + "epoch": 1.2362493452069145, + "grad_norm": 0.41383673694225553, + "learning_rate": 3.929143785641441e-05, + "loss": 0.2232, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1073240339756012, + "step": 2360, + "valid_targets_mean": 6838.1, + "valid_targets_min": 4923 + }, + { + "epoch": 1.2388685175484546, + "grad_norm": 0.9018915755468442, + "learning_rate": 3.9284529539473765e-05, + "loss": 0.2192, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10324497520923615, + "step": 2365, + "valid_targets_mean": 5701.2, + "valid_targets_min": 3922 + }, + { + "epoch": 1.2414876898899947, + "grad_norm": 0.39388164766272543, + "learning_rate": 3.9277588321741954e-05, + "loss": 0.2148, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10737532377243042, + "step": 2370, + "valid_targets_mean": 7340.9, + "valid_targets_min": 4797 + }, + { + "epoch": 1.2441068622315348, + "grad_norm": 0.43312552283028277, + "learning_rate": 3.927061421506118e-05, + "loss": 0.2366, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12764379382133484, + "step": 2375, + "valid_targets_mean": 6343.9, + "valid_targets_min": 3853 + }, + { + "epoch": 1.2467260345730748, + "grad_norm": 0.4270684045685589, + "learning_rate": 3.926360723132977e-05, + "loss": 0.2232, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10858067870140076, + "step": 2380, + "valid_targets_mean": 6566.2, + "valid_targets_min": 4586 + }, + { + "epoch": 1.249345206914615, + "grad_norm": 0.4067994069431279, + "learning_rate": 3.9256567382502145e-05, + "loss": 0.2133, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12333779782056808, + "step": 2385, + "valid_targets_mean": 7153.6, + "valid_targets_min": 4728 + }, + { + "epoch": 1.251964379256155, + "grad_norm": 0.49740636629506035, + "learning_rate": 3.9249494680588786e-05, + "loss": 0.2479, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19038259983062744, + "step": 2390, + "valid_targets_mean": 6562.0, + "valid_targets_min": 5203 + }, + { + "epoch": 1.254583551597695, + "grad_norm": 0.3797774326216875, + "learning_rate": 3.924238913765624e-05, + "loss": 0.2055, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11123651266098022, + "step": 2395, + "valid_targets_mean": 7098.9, + "valid_targets_min": 4561 + }, + { + "epoch": 1.2572027239392352, + "grad_norm": 0.5778136233412741, + "learning_rate": 3.9235250765827075e-05, + "loss": 0.2224, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13788042962551117, + "step": 2400, + "valid_targets_mean": 4960.2, + "valid_targets_min": 3439 + }, + { + "epoch": 1.2598218962807752, + "grad_norm": 0.49608254313307765, + "learning_rate": 3.922807957727985e-05, + "loss": 0.2106, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09457670152187347, + "step": 2405, + "valid_targets_mean": 5384.2, + "valid_targets_min": 3635 + }, + { + "epoch": 1.2624410686223153, + "grad_norm": 0.41188277730720274, + "learning_rate": 3.9220875584249135e-05, + "loss": 0.2181, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10995665937662125, + "step": 2410, + "valid_targets_mean": 6940.2, + "valid_targets_min": 4393 + }, + { + "epoch": 1.2650602409638554, + "grad_norm": 0.3848453621339323, + "learning_rate": 3.921363879902546e-05, + "loss": 0.202, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11147625744342804, + "step": 2415, + "valid_targets_mean": 6812.4, + "valid_targets_min": 4749 + }, + { + "epoch": 1.2676794133053955, + "grad_norm": 0.48623178931329286, + "learning_rate": 3.9206369233955304e-05, + "loss": 0.1989, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.044521696865558624, + "step": 2420, + "valid_targets_mean": 2363.0, + "valid_targets_min": 1062 + }, + { + "epoch": 1.2702985856469355, + "grad_norm": 0.41502605372146767, + "learning_rate": 3.919906690144106e-05, + "loss": 0.1997, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09982247650623322, + "step": 2425, + "valid_targets_mean": 5841.2, + "valid_targets_min": 3119 + }, + { + "epoch": 1.2729177579884756, + "grad_norm": 0.4296180929373709, + "learning_rate": 3.919173181394103e-05, + "loss": 0.2129, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11030298471450806, + "step": 2430, + "valid_targets_mean": 5761.4, + "valid_targets_min": 3774 + }, + { + "epoch": 1.2755369303300157, + "grad_norm": 0.7229441580441829, + "learning_rate": 3.9184363983969405e-05, + "loss": 0.2084, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10802686214447021, + "step": 2435, + "valid_targets_mean": 6412.4, + "valid_targets_min": 5293 + }, + { + "epoch": 1.2781561026715558, + "grad_norm": 0.3671482076221174, + "learning_rate": 3.917696342409623e-05, + "loss": 0.1891, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10334502905607224, + "step": 2440, + "valid_targets_mean": 6709.1, + "valid_targets_min": 5665 + }, + { + "epoch": 1.2807752750130958, + "grad_norm": 0.44540104176071077, + "learning_rate": 3.9169530146947396e-05, + "loss": 0.1959, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10827546566724777, + "step": 2445, + "valid_targets_mean": 7344.6, + "valid_targets_min": 4428 + }, + { + "epoch": 1.283394447354636, + "grad_norm": 0.4618878085458157, + "learning_rate": 3.916206416520459e-05, + "loss": 0.219, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10369175672531128, + "step": 2450, + "valid_targets_mean": 5780.6, + "valid_targets_min": 4690 + }, + { + "epoch": 1.286013619696176, + "grad_norm": 0.4317398263786524, + "learning_rate": 3.915456549160533e-05, + "loss": 0.2199, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09932570159435272, + "step": 2455, + "valid_targets_mean": 5854.5, + "valid_targets_min": 4335 + }, + { + "epoch": 1.288632792037716, + "grad_norm": 0.41441258686101656, + "learning_rate": 3.914703413894289e-05, + "loss": 0.2004, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1022871732711792, + "step": 2460, + "valid_targets_mean": 6378.9, + "valid_targets_min": 5342 + }, + { + "epoch": 1.2912519643792562, + "grad_norm": 0.43417833329432376, + "learning_rate": 3.9139470120066295e-05, + "loss": 0.2091, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0962183028459549, + "step": 2465, + "valid_targets_mean": 5756.5, + "valid_targets_min": 3840 + }, + { + "epoch": 1.2938711367207962, + "grad_norm": 0.4349955432381067, + "learning_rate": 3.9131873447880296e-05, + "loss": 0.2253, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12103915959596634, + "step": 2470, + "valid_targets_mean": 6438.6, + "valid_targets_min": 5104 + }, + { + "epoch": 1.2964903090623363, + "grad_norm": 0.5636207800862163, + "learning_rate": 3.912424413534537e-05, + "loss": 0.2422, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09318073838949203, + "step": 2475, + "valid_targets_mean": 5190.4, + "valid_targets_min": 4224 + }, + { + "epoch": 1.2991094814038764, + "grad_norm": 0.41352492240745525, + "learning_rate": 3.9116582195477676e-05, + "loss": 0.2299, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10306873917579651, + "step": 2480, + "valid_targets_mean": 5932.8, + "valid_targets_min": 4318 + }, + { + "epoch": 1.3017286537454165, + "grad_norm": 0.3912057260667177, + "learning_rate": 3.910888764134902e-05, + "loss": 0.2104, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10825017094612122, + "step": 2485, + "valid_targets_mean": 6348.5, + "valid_targets_min": 4783 + }, + { + "epoch": 1.3043478260869565, + "grad_norm": 0.4242389807432637, + "learning_rate": 3.9101160486086874e-05, + "loss": 0.2126, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10528185218572617, + "step": 2490, + "valid_targets_mean": 7200.1, + "valid_targets_min": 4412 + }, + { + "epoch": 1.3069669984284966, + "grad_norm": 0.5655384901625239, + "learning_rate": 3.909340074287431e-05, + "loss": 0.2178, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11472706496715546, + "step": 2495, + "valid_targets_mean": 6137.5, + "valid_targets_min": 5033 + }, + { + "epoch": 1.3095861707700367, + "grad_norm": 0.45341216141074125, + "learning_rate": 3.908560842495002e-05, + "loss": 0.2104, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09808801114559174, + "step": 2500, + "valid_targets_mean": 5695.5, + "valid_targets_min": 4822 + }, + { + "epoch": 1.3122053431115768, + "grad_norm": 0.47046598181440774, + "learning_rate": 3.9077783545608244e-05, + "loss": 0.2132, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11489500105381012, + "step": 2505, + "valid_targets_mean": 5906.1, + "valid_targets_min": 2364 + }, + { + "epoch": 1.3148245154531168, + "grad_norm": 0.5262879452966152, + "learning_rate": 3.906992611819879e-05, + "loss": 0.2192, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11242279410362244, + "step": 2510, + "valid_targets_mean": 6359.0, + "valid_targets_min": 4793 + }, + { + "epoch": 1.317443687794657, + "grad_norm": 0.5424578345324054, + "learning_rate": 3.9062036156127e-05, + "loss": 0.2113, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11259541660547256, + "step": 2515, + "valid_targets_mean": 6104.9, + "valid_targets_min": 4733 + }, + { + "epoch": 1.320062860136197, + "grad_norm": 0.3852376094367663, + "learning_rate": 3.905411367285371e-05, + "loss": 0.1932, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09048554301261902, + "step": 2520, + "valid_targets_mean": 6780.8, + "valid_targets_min": 5388 + }, + { + "epoch": 1.322682032477737, + "grad_norm": 0.441983088883469, + "learning_rate": 3.9046158681895245e-05, + "loss": 0.1885, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10433575510978699, + "step": 2525, + "valid_targets_mean": 5956.2, + "valid_targets_min": 3182 + }, + { + "epoch": 1.3253012048192772, + "grad_norm": 0.39460410967625675, + "learning_rate": 3.90381711968234e-05, + "loss": 0.2164, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1174294576048851, + "step": 2530, + "valid_targets_mean": 6389.4, + "valid_targets_min": 5077 + }, + { + "epoch": 1.3279203771608172, + "grad_norm": 0.5421430229515332, + "learning_rate": 3.903015123126538e-05, + "loss": 0.2172, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12288212776184082, + "step": 2535, + "valid_targets_mean": 5607.8, + "valid_targets_min": 3663 + }, + { + "epoch": 1.3305395495023573, + "grad_norm": 0.43894542574203654, + "learning_rate": 3.9022098798903846e-05, + "loss": 0.2039, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09502558410167694, + "step": 2540, + "valid_targets_mean": 5616.4, + "valid_targets_min": 4105 + }, + { + "epoch": 1.3331587218438974, + "grad_norm": 0.3773569176447065, + "learning_rate": 3.90140139134768e-05, + "loss": 0.2049, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10998235642910004, + "step": 2545, + "valid_targets_mean": 7271.0, + "valid_targets_min": 5201 + }, + { + "epoch": 1.3357778941854375, + "grad_norm": 0.4156053262329772, + "learning_rate": 3.900589658877765e-05, + "loss": 0.1946, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11112470924854279, + "step": 2550, + "valid_targets_mean": 6797.6, + "valid_targets_min": 5069 + }, + { + "epoch": 1.3383970665269775, + "grad_norm": 0.41824839708799705, + "learning_rate": 3.899774683865513e-05, + "loss": 0.2065, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10233832150697708, + "step": 2555, + "valid_targets_mean": 5787.4, + "valid_targets_min": 4729 + }, + { + "epoch": 1.3410162388685176, + "grad_norm": 0.44548469125969525, + "learning_rate": 3.898956467701331e-05, + "loss": 0.2124, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10589951276779175, + "step": 2560, + "valid_targets_mean": 5989.0, + "valid_targets_min": 4567 + }, + { + "epoch": 1.3436354112100577, + "grad_norm": 0.41009003012121287, + "learning_rate": 3.8981350117811525e-05, + "loss": 0.1973, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09308187663555145, + "step": 2565, + "valid_targets_mean": 5873.4, + "valid_targets_min": 4464 + }, + { + "epoch": 1.3462545835515978, + "grad_norm": 0.4212542692971494, + "learning_rate": 3.897310317506441e-05, + "loss": 0.2176, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10250398516654968, + "step": 2570, + "valid_targets_mean": 5373.8, + "valid_targets_min": 4908 + }, + { + "epoch": 1.3488737558931378, + "grad_norm": 0.4236756568668427, + "learning_rate": 3.8964823862841855e-05, + "loss": 0.1932, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0861271470785141, + "step": 2575, + "valid_targets_mean": 5441.6, + "valid_targets_min": 4443 + }, + { + "epoch": 1.351492928234678, + "grad_norm": 0.4347939680190683, + "learning_rate": 3.8956512195268936e-05, + "loss": 0.1779, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08970703184604645, + "step": 2580, + "valid_targets_mean": 6286.8, + "valid_targets_min": 3381 + }, + { + "epoch": 1.3541121005762178, + "grad_norm": 0.40095729731188445, + "learning_rate": 3.894816818652598e-05, + "loss": 0.1836, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08964194357395172, + "step": 2585, + "valid_targets_mean": 6162.8, + "valid_targets_min": 4790 + }, + { + "epoch": 1.356731272917758, + "grad_norm": 0.40418046170075766, + "learning_rate": 3.893979185084844e-05, + "loss": 0.1879, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09120337665081024, + "step": 2590, + "valid_targets_mean": 6336.1, + "valid_targets_min": 5161 + }, + { + "epoch": 1.359350445259298, + "grad_norm": 0.4242269315409445, + "learning_rate": 3.893138320252698e-05, + "loss": 0.2068, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09119582176208496, + "step": 2595, + "valid_targets_mean": 6038.0, + "valid_targets_min": 4491 + }, + { + "epoch": 1.3619696176008382, + "grad_norm": 0.9708595853734081, + "learning_rate": 3.8922942255907316e-05, + "loss": 0.2407, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1414804458618164, + "step": 2600, + "valid_targets_mean": 1423.0, + "valid_targets_min": 817 + }, + { + "epoch": 1.364588789942378, + "grad_norm": 0.4477758125594203, + "learning_rate": 3.891446902539033e-05, + "loss": 0.2182, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09902373701334, + "step": 2605, + "valid_targets_mean": 5531.1, + "valid_targets_min": 3893 + }, + { + "epoch": 1.3672079622839184, + "grad_norm": 0.44661837506019453, + "learning_rate": 3.8905963525431975e-05, + "loss": 0.1975, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1093834713101387, + "step": 2610, + "valid_targets_mean": 6276.2, + "valid_targets_min": 4622 + }, + { + "epoch": 1.3698271346254582, + "grad_norm": 0.395648111157185, + "learning_rate": 3.889742577054321e-05, + "loss": 0.2055, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10112433135509491, + "step": 2615, + "valid_targets_mean": 8019.8, + "valid_targets_min": 6108 + }, + { + "epoch": 1.3724463069669985, + "grad_norm": 0.4283627037962096, + "learning_rate": 3.888885577529009e-05, + "loss": 0.2093, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11028099060058594, + "step": 2620, + "valid_targets_mean": 6822.1, + "valid_targets_min": 4253 + }, + { + "epoch": 1.3750654793085384, + "grad_norm": 0.40795304311294595, + "learning_rate": 3.888025355429362e-05, + "loss": 0.2198, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10736887156963348, + "step": 2625, + "valid_targets_mean": 6800.6, + "valid_targets_min": 4990 + }, + { + "epoch": 1.3776846516500787, + "grad_norm": 0.4158131427344537, + "learning_rate": 3.8871619122229816e-05, + "loss": 0.2038, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12992602586746216, + "step": 2630, + "valid_targets_mean": 6860.5, + "valid_targets_min": 4957 + }, + { + "epoch": 1.3803038239916186, + "grad_norm": 0.3956084333567644, + "learning_rate": 3.886295249382964e-05, + "loss": 0.2086, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09402551501989365, + "step": 2635, + "valid_targets_mean": 5820.2, + "valid_targets_min": 4775 + }, + { + "epoch": 1.3829229963331588, + "grad_norm": 0.4269057881551316, + "learning_rate": 3.885425368387898e-05, + "loss": 0.1963, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07762826979160309, + "step": 2640, + "valid_targets_mean": 5628.8, + "valid_targets_min": 4098 + }, + { + "epoch": 1.3855421686746987, + "grad_norm": 0.41321789055034214, + "learning_rate": 3.8845522707218626e-05, + "loss": 0.1895, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10863015055656433, + "step": 2645, + "valid_targets_mean": 6170.6, + "valid_targets_min": 4801 + }, + { + "epoch": 1.388161341016239, + "grad_norm": 0.5113842812158871, + "learning_rate": 3.8836759578744255e-05, + "loss": 0.2435, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21723729372024536, + "step": 2650, + "valid_targets_mean": 6196.0, + "valid_targets_min": 4734 + }, + { + "epoch": 1.3907805133577789, + "grad_norm": 0.4380085783797243, + "learning_rate": 3.882796431340639e-05, + "loss": 0.2045, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11256542056798935, + "step": 2655, + "valid_targets_mean": 6086.4, + "valid_targets_min": 4400 + }, + { + "epoch": 1.393399685699319, + "grad_norm": 0.43940376502954864, + "learning_rate": 3.881913692621039e-05, + "loss": 0.1934, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10712681710720062, + "step": 2660, + "valid_targets_mean": 6544.9, + "valid_targets_min": 4919 + }, + { + "epoch": 1.396018858040859, + "grad_norm": 0.4177688964837717, + "learning_rate": 3.8810277432216404e-05, + "loss": 0.2061, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11651991307735443, + "step": 2665, + "valid_targets_mean": 6052.2, + "valid_targets_min": 4611 + }, + { + "epoch": 1.398638030382399, + "grad_norm": 0.4027821543625251, + "learning_rate": 3.880138584653937e-05, + "loss": 0.2079, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09147213399410248, + "step": 2670, + "valid_targets_mean": 6934.9, + "valid_targets_min": 2275 + }, + { + "epoch": 1.4012572027239392, + "grad_norm": 0.415163749331779, + "learning_rate": 3.879246218434896e-05, + "loss": 0.1836, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09008123725652695, + "step": 2675, + "valid_targets_mean": 5878.5, + "valid_targets_min": 4826 + }, + { + "epoch": 1.4038763750654792, + "grad_norm": 0.3753579362033299, + "learning_rate": 3.8783506460869605e-05, + "loss": 0.1984, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08899456262588501, + "step": 2680, + "valid_targets_mean": 6784.9, + "valid_targets_min": 4707 + }, + { + "epoch": 1.4064955474070193, + "grad_norm": 0.37948171111073, + "learning_rate": 3.877451869138039e-05, + "loss": 0.1824, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12983255088329315, + "step": 2685, + "valid_targets_mean": 7245.8, + "valid_targets_min": 5421 + }, + { + "epoch": 1.4091147197485594, + "grad_norm": 0.3919828815276863, + "learning_rate": 3.876549889121511e-05, + "loss": 0.1923, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0971972793340683, + "step": 2690, + "valid_targets_mean": 7122.0, + "valid_targets_min": 4949 + }, + { + "epoch": 1.4117338920900995, + "grad_norm": 0.37599481909327476, + "learning_rate": 3.875644707576218e-05, + "loss": 0.1913, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10371506959199905, + "step": 2695, + "valid_targets_mean": 6444.5, + "valid_targets_min": 4831 + }, + { + "epoch": 1.4143530644316396, + "grad_norm": 0.42157672366288373, + "learning_rate": 3.8747363260464644e-05, + "loss": 0.1975, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11276239156723022, + "step": 2700, + "valid_targets_mean": 6454.9, + "valid_targets_min": 4018 + }, + { + "epoch": 1.4169722367731796, + "grad_norm": 0.590647973505511, + "learning_rate": 3.873824746082016e-05, + "loss": 0.1874, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07755673676729202, + "step": 2705, + "valid_targets_mean": 6851.4, + "valid_targets_min": 5034 + }, + { + "epoch": 1.4195914091147197, + "grad_norm": 0.415589389082563, + "learning_rate": 3.872909969238092e-05, + "loss": 0.1966, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11099794507026672, + "step": 2710, + "valid_targets_mean": 6674.2, + "valid_targets_min": 4682 + }, + { + "epoch": 1.4222105814562598, + "grad_norm": 0.4868111375104368, + "learning_rate": 3.871991997075368e-05, + "loss": 0.2075, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10624338686466217, + "step": 2715, + "valid_targets_mean": 5518.1, + "valid_targets_min": 4764 + }, + { + "epoch": 1.4248297537977999, + "grad_norm": 0.5715378448201193, + "learning_rate": 3.87107083115997e-05, + "loss": 0.2113, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11575331538915634, + "step": 2720, + "valid_targets_mean": 5329.2, + "valid_targets_min": 2481 + }, + { + "epoch": 1.42744892613934, + "grad_norm": 0.5199610461866421, + "learning_rate": 3.8701464730634734e-05, + "loss": 0.2856, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16606278717517853, + "step": 2725, + "valid_targets_mean": 4792.6, + "valid_targets_min": 702 + }, + { + "epoch": 1.43006809848088, + "grad_norm": 0.5535968504065762, + "learning_rate": 3.8692189243629e-05, + "loss": 0.3189, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17155292630195618, + "step": 2730, + "valid_targets_mean": 5322.8, + "valid_targets_min": 1005 + }, + { + "epoch": 1.43268727082242, + "grad_norm": 0.4988420804817056, + "learning_rate": 3.868288186640714e-05, + "loss": 0.307, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11296539008617401, + "step": 2735, + "valid_targets_mean": 3584.6, + "valid_targets_min": 2054 + }, + { + "epoch": 1.4353064431639602, + "grad_norm": 0.6110701721483975, + "learning_rate": 3.86735426148482e-05, + "loss": 0.3078, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1350294053554535, + "step": 2740, + "valid_targets_mean": 3685.6, + "valid_targets_min": 1751 + }, + { + "epoch": 1.4379256155055002, + "grad_norm": 0.4989938534479867, + "learning_rate": 3.8664171504885625e-05, + "loss": 0.3017, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18602502346038818, + "step": 2745, + "valid_targets_mean": 5944.2, + "valid_targets_min": 1970 + }, + { + "epoch": 1.4405447878470403, + "grad_norm": 0.47585566879088936, + "learning_rate": 3.86547685525072e-05, + "loss": 0.3178, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14865697920322418, + "step": 2750, + "valid_targets_mean": 5916.0, + "valid_targets_min": 920 + }, + { + "epoch": 1.4431639601885804, + "grad_norm": 0.48408636593936255, + "learning_rate": 3.864533377375503e-05, + "loss": 0.298, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14260733127593994, + "step": 2755, + "valid_targets_mean": 6475.4, + "valid_targets_min": 2231 + }, + { + "epoch": 1.4457831325301205, + "grad_norm": 0.5158666232835837, + "learning_rate": 3.8635867184725516e-05, + "loss": 0.302, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11541718989610672, + "step": 2760, + "valid_targets_mean": 4043.4, + "valid_targets_min": 467 + }, + { + "epoch": 1.4484023048716606, + "grad_norm": 0.510309128453629, + "learning_rate": 3.862636880156936e-05, + "loss": 0.313, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16205619275569916, + "step": 2765, + "valid_targets_mean": 5549.8, + "valid_targets_min": 3440 + }, + { + "epoch": 1.4510214772132006, + "grad_norm": 0.5221182088210312, + "learning_rate": 3.8616838640491474e-05, + "loss": 0.313, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1546589732170105, + "step": 2770, + "valid_targets_mean": 4736.9, + "valid_targets_min": 1697 + }, + { + "epoch": 1.4536406495547407, + "grad_norm": 0.5833107024383283, + "learning_rate": 3.860727671775099e-05, + "loss": 0.3083, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18122589588165283, + "step": 2775, + "valid_targets_mean": 4838.2, + "valid_targets_min": 1223 + }, + { + "epoch": 1.4562598218962808, + "grad_norm": 0.5228591268026902, + "learning_rate": 3.859768304966125e-05, + "loss": 0.3041, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15430261194705963, + "step": 2780, + "valid_targets_mean": 5466.9, + "valid_targets_min": 1552 + }, + { + "epoch": 1.4588789942378209, + "grad_norm": 0.5353294956306439, + "learning_rate": 3.8588057652589724e-05, + "loss": 0.31, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17821773886680603, + "step": 2785, + "valid_targets_mean": 5166.0, + "valid_targets_min": 1546 + }, + { + "epoch": 1.461498166579361, + "grad_norm": 0.5503796718154574, + "learning_rate": 3.857840054295804e-05, + "loss": 0.3037, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14941097795963287, + "step": 2790, + "valid_targets_mean": 3848.2, + "valid_targets_min": 1957 + }, + { + "epoch": 1.464117338920901, + "grad_norm": 0.5916325559924084, + "learning_rate": 3.8568711737241925e-05, + "loss": 0.3174, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14574086666107178, + "step": 2795, + "valid_targets_mean": 3487.5, + "valid_targets_min": 1538 + }, + { + "epoch": 1.466736511262441, + "grad_norm": 0.5925249004918991, + "learning_rate": 3.855899125197116e-05, + "loss": 0.3112, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15048345923423767, + "step": 2800, + "valid_targets_mean": 3397.2, + "valid_targets_min": 1645 + }, + { + "epoch": 1.4693556836039812, + "grad_norm": 0.6334952039976055, + "learning_rate": 3.8549239103729606e-05, + "loss": 0.3109, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13147863745689392, + "step": 2805, + "valid_targets_mean": 2859.4, + "valid_targets_min": 935 + }, + { + "epoch": 1.4719748559455212, + "grad_norm": 0.6237687179523252, + "learning_rate": 3.8539455309155116e-05, + "loss": 0.3216, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16066870093345642, + "step": 2810, + "valid_targets_mean": 3490.6, + "valid_targets_min": 1269 + }, + { + "epoch": 1.4745940282870613, + "grad_norm": 0.6604809060385983, + "learning_rate": 3.852963988493955e-05, + "loss": 0.3179, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14912638068199158, + "step": 2815, + "valid_targets_mean": 2860.0, + "valid_targets_min": 1173 + }, + { + "epoch": 1.4772132006286014, + "grad_norm": 0.5470019823441967, + "learning_rate": 3.851979284782873e-05, + "loss": 0.3128, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1375359147787094, + "step": 2820, + "valid_targets_mean": 3480.9, + "valid_targets_min": 1392 + }, + { + "epoch": 1.4798323729701415, + "grad_norm": 0.6191223562860483, + "learning_rate": 3.850991421462241e-05, + "loss": 0.3155, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1769552230834961, + "step": 2825, + "valid_targets_mean": 3878.6, + "valid_targets_min": 1883 + }, + { + "epoch": 1.4824515453116816, + "grad_norm": 0.6184574495831373, + "learning_rate": 3.850000400217424e-05, + "loss": 0.3064, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17909373342990875, + "step": 2830, + "valid_targets_mean": 3721.4, + "valid_targets_min": 2106 + }, + { + "epoch": 1.4850707176532216, + "grad_norm": 0.5242297805984385, + "learning_rate": 3.849006222739175e-05, + "loss": 0.2833, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10997025668621063, + "step": 2835, + "valid_targets_mean": 3868.5, + "valid_targets_min": 2222 + }, + { + "epoch": 1.4876898899947617, + "grad_norm": 0.631553110720061, + "learning_rate": 3.848008890723633e-05, + "loss": 0.3109, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14636048674583435, + "step": 2840, + "valid_targets_mean": 3010.1, + "valid_targets_min": 958 + }, + { + "epoch": 1.4903090623363018, + "grad_norm": 0.5927771226679842, + "learning_rate": 3.8470084058723174e-05, + "loss": 0.3086, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15214566886425018, + "step": 2845, + "valid_targets_mean": 3789.1, + "valid_targets_min": 771 + }, + { + "epoch": 1.4929282346778419, + "grad_norm": 0.4971923591509714, + "learning_rate": 3.846004769892128e-05, + "loss": 0.3146, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10021981596946716, + "step": 2850, + "valid_targets_mean": 3578.9, + "valid_targets_min": 1774 + }, + { + "epoch": 1.495547407019382, + "grad_norm": 0.6577345008187645, + "learning_rate": 3.844997984495338e-05, + "loss": 0.3015, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14464107155799866, + "step": 2855, + "valid_targets_mean": 2545.8, + "valid_targets_min": 997 + }, + { + "epoch": 1.498166579360922, + "grad_norm": 0.5793133638446858, + "learning_rate": 3.843988051399598e-05, + "loss": 0.2951, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15637826919555664, + "step": 2860, + "valid_targets_mean": 3667.1, + "valid_targets_min": 1741 + }, + { + "epoch": 1.500785751702462, + "grad_norm": 0.6542856165355548, + "learning_rate": 3.842974972327925e-05, + "loss": 0.3092, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15415236353874207, + "step": 2865, + "valid_targets_mean": 3606.1, + "valid_targets_min": 863 + }, + { + "epoch": 1.503404924044002, + "grad_norm": 0.5452351556476359, + "learning_rate": 3.841958749008704e-05, + "loss": 0.3018, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15664133429527283, + "step": 2870, + "valid_targets_mean": 3876.9, + "valid_targets_min": 1854 + }, + { + "epoch": 1.5060240963855422, + "grad_norm": 0.6084567799593589, + "learning_rate": 3.8409393831756857e-05, + "loss": 0.2932, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14668738842010498, + "step": 2875, + "valid_targets_mean": 4763.2, + "valid_targets_min": 2040 + }, + { + "epoch": 1.508643268727082, + "grad_norm": 0.6095390383279379, + "learning_rate": 3.839916876567981e-05, + "loss": 0.3043, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1429491937160492, + "step": 2880, + "valid_targets_mean": 3521.9, + "valid_targets_min": 1036 + }, + { + "epoch": 1.5112624410686224, + "grad_norm": 0.7525866704807807, + "learning_rate": 3.838891230930061e-05, + "loss": 0.3079, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15864211320877075, + "step": 2885, + "valid_targets_mean": 4304.8, + "valid_targets_min": 1279 + }, + { + "epoch": 1.5138816134101623, + "grad_norm": 0.6314225340741985, + "learning_rate": 3.837862448011748e-05, + "loss": 0.2977, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15632294118404388, + "step": 2890, + "valid_targets_mean": 3600.0, + "valid_targets_min": 1798 + }, + { + "epoch": 1.5165007857517026, + "grad_norm": 0.566585761284272, + "learning_rate": 3.836830529568222e-05, + "loss": 0.3109, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13838429749011993, + "step": 2895, + "valid_targets_mean": 3067.2, + "valid_targets_min": 1446 + }, + { + "epoch": 1.5191199580932424, + "grad_norm": 0.5597242375298772, + "learning_rate": 3.835795477360008e-05, + "loss": 0.3039, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15407949686050415, + "step": 2900, + "valid_targets_mean": 4183.2, + "valid_targets_min": 1270 + }, + { + "epoch": 1.5217391304347827, + "grad_norm": 0.492745220516234, + "learning_rate": 3.834757293152981e-05, + "loss": 0.303, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15897804498672485, + "step": 2905, + "valid_targets_mean": 5485.8, + "valid_targets_min": 1216 + }, + { + "epoch": 1.5243583027763226, + "grad_norm": 0.5832887181140126, + "learning_rate": 3.833715978718357e-05, + "loss": 0.2927, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17947159707546234, + "step": 2910, + "valid_targets_mean": 3994.0, + "valid_targets_min": 2028 + }, + { + "epoch": 1.5269774751178629, + "grad_norm": 0.5992472868552041, + "learning_rate": 3.832671535832693e-05, + "loss": 0.3045, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17488516867160797, + "step": 2915, + "valid_targets_mean": 3700.6, + "valid_targets_min": 2329 + }, + { + "epoch": 1.5295966474594027, + "grad_norm": 0.608689936567635, + "learning_rate": 3.831623966277884e-05, + "loss": 0.3018, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19074520468711853, + "step": 2920, + "valid_targets_mean": 4075.2, + "valid_targets_min": 1363 + }, + { + "epoch": 1.532215819800943, + "grad_norm": 0.5687522702510394, + "learning_rate": 3.830573271841157e-05, + "loss": 0.2939, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1393849402666092, + "step": 2925, + "valid_targets_mean": 3560.8, + "valid_targets_min": 1087 + }, + { + "epoch": 1.5348349921424829, + "grad_norm": 0.6557873431198882, + "learning_rate": 3.829519454315075e-05, + "loss": 0.308, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1506955921649933, + "step": 2930, + "valid_targets_mean": 3860.1, + "valid_targets_min": 2483 + }, + { + "epoch": 1.5374541644840232, + "grad_norm": 0.5802954065582627, + "learning_rate": 3.828462515497524e-05, + "loss": 0.3001, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17755460739135742, + "step": 2935, + "valid_targets_mean": 4583.2, + "valid_targets_min": 2316 + }, + { + "epoch": 1.540073336825563, + "grad_norm": 0.5333037941904751, + "learning_rate": 3.8274024571917194e-05, + "loss": 0.2945, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14878308773040771, + "step": 2940, + "valid_targets_mean": 4198.9, + "valid_targets_min": 2022 + }, + { + "epoch": 1.5426925091671033, + "grad_norm": 0.5918564145559779, + "learning_rate": 3.826339281206195e-05, + "loss": 0.284, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11888591945171356, + "step": 2945, + "valid_targets_mean": 3228.9, + "valid_targets_min": 1294 + }, + { + "epoch": 1.5453116815086432, + "grad_norm": 0.7659151280372383, + "learning_rate": 3.8252729893548066e-05, + "loss": 0.3103, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18149510025978088, + "step": 2950, + "valid_targets_mean": 3846.8, + "valid_targets_min": 2716 + }, + { + "epoch": 1.5479308538501835, + "grad_norm": 0.6781972012501118, + "learning_rate": 3.824203583456723e-05, + "loss": 0.2912, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14599120616912842, + "step": 2955, + "valid_targets_mean": 3211.6, + "valid_targets_min": 2060 + }, + { + "epoch": 1.5505500261917233, + "grad_norm": 0.6459462222115947, + "learning_rate": 3.8231310653364293e-05, + "loss": 0.3044, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16775554418563843, + "step": 2960, + "valid_targets_mean": 3320.4, + "valid_targets_min": 2407 + }, + { + "epoch": 1.5531691985332636, + "grad_norm": 0.583093980020909, + "learning_rate": 3.822055436823717e-05, + "loss": 0.3053, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15554597973823547, + "step": 2965, + "valid_targets_mean": 4165.1, + "valid_targets_min": 1533 + }, + { + "epoch": 1.5557883708748035, + "grad_norm": 0.5786723076536124, + "learning_rate": 3.8209766997536867e-05, + "loss": 0.3031, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18110856413841248, + "step": 2970, + "valid_targets_mean": 5201.2, + "valid_targets_min": 2189 + }, + { + "epoch": 1.5584075432163438, + "grad_norm": 0.5810527634474358, + "learning_rate": 3.81989485596674e-05, + "loss": 0.2958, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18378518521785736, + "step": 2975, + "valid_targets_mean": 4193.1, + "valid_targets_min": 1328 + }, + { + "epoch": 1.5610267155578836, + "grad_norm": 0.5793278438385654, + "learning_rate": 3.81880990730858e-05, + "loss": 0.31, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21407201886177063, + "step": 2980, + "valid_targets_mean": 4500.4, + "valid_targets_min": 1708 + }, + { + "epoch": 1.563645887899424, + "grad_norm": 0.5545862624490651, + "learning_rate": 3.817721855630209e-05, + "loss": 0.2871, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11643369495868683, + "step": 2985, + "valid_targets_mean": 3494.0, + "valid_targets_min": 1912 + }, + { + "epoch": 1.5662650602409638, + "grad_norm": 0.5846290764905854, + "learning_rate": 3.816630702787919e-05, + "loss": 0.2841, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.176794171333313, + "step": 2990, + "valid_targets_mean": 4145.2, + "valid_targets_min": 2606 + }, + { + "epoch": 1.568884232582504, + "grad_norm": 0.5560977476076939, + "learning_rate": 3.815536450643296e-05, + "loss": 0.2833, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1391376554965973, + "step": 2995, + "valid_targets_mean": 4189.0, + "valid_targets_min": 1378 + }, + { + "epoch": 1.571503404924044, + "grad_norm": 0.5864475779631305, + "learning_rate": 3.814439101063212e-05, + "loss": 0.294, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16940513253211975, + "step": 3000, + "valid_targets_mean": 3983.4, + "valid_targets_min": 1219 + }, + { + "epoch": 1.574122577265584, + "grad_norm": 0.5486004743118648, + "learning_rate": 3.8133386559198255e-05, + "loss": 0.3001, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1555742472410202, + "step": 3005, + "valid_targets_mean": 3997.0, + "valid_targets_min": 2631 + }, + { + "epoch": 1.576741749607124, + "grad_norm": 0.59745850047092, + "learning_rate": 3.812235117090574e-05, + "loss": 0.2942, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18192443251609802, + "step": 3010, + "valid_targets_mean": 4167.4, + "valid_targets_min": 1423 + }, + { + "epoch": 1.5793609219486642, + "grad_norm": 0.5491789317813656, + "learning_rate": 3.8111284864581734e-05, + "loss": 0.293, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11260128021240234, + "step": 3015, + "valid_targets_mean": 3381.9, + "valid_targets_min": 2320 + }, + { + "epoch": 1.5819800942902043, + "grad_norm": 0.5986153968033281, + "learning_rate": 3.8100187659106155e-05, + "loss": 0.3031, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15462613105773926, + "step": 3020, + "valid_targets_mean": 3174.9, + "valid_targets_min": 1188 + }, + { + "epoch": 1.5845992666317443, + "grad_norm": 0.5360926088484862, + "learning_rate": 3.808905957341164e-05, + "loss": 0.3015, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1185324639081955, + "step": 3025, + "valid_targets_mean": 3378.6, + "valid_targets_min": 618 + }, + { + "epoch": 1.5872184389732844, + "grad_norm": 0.7183261171782832, + "learning_rate": 3.807790062648349e-05, + "loss": 0.2985, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1585368812084198, + "step": 3030, + "valid_targets_mean": 2988.1, + "valid_targets_min": 1364 + }, + { + "epoch": 1.5898376113148245, + "grad_norm": 0.6104807586407798, + "learning_rate": 3.806671083735967e-05, + "loss": 0.2864, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12601983547210693, + "step": 3035, + "valid_targets_mean": 3199.1, + "valid_targets_min": 1397 + }, + { + "epoch": 1.5924567836563646, + "grad_norm": 0.5254606303988886, + "learning_rate": 3.805549022513077e-05, + "loss": 0.2817, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1630454957485199, + "step": 3040, + "valid_targets_mean": 5348.0, + "valid_targets_min": 1778 + }, + { + "epoch": 1.5950759559979046, + "grad_norm": 0.6031622636026757, + "learning_rate": 3.804423880893995e-05, + "loss": 0.2902, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15097734332084656, + "step": 3045, + "valid_targets_mean": 3444.9, + "valid_targets_min": 621 + }, + { + "epoch": 1.5976951283394447, + "grad_norm": 0.5724648411597208, + "learning_rate": 3.803295660798294e-05, + "loss": 0.2763, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12265162169933319, + "step": 3050, + "valid_targets_mean": 3872.9, + "valid_targets_min": 1290 + }, + { + "epoch": 1.6003143006809848, + "grad_norm": 0.7795690843114012, + "learning_rate": 3.802164364150799e-05, + "loss": 0.2813, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13530173897743225, + "step": 3055, + "valid_targets_mean": 2546.6, + "valid_targets_min": 642 + }, + { + "epoch": 1.6029334730225249, + "grad_norm": 0.6840637976254862, + "learning_rate": 3.801029992881582e-05, + "loss": 0.2794, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.149607315659523, + "step": 3060, + "valid_targets_mean": 3428.2, + "valid_targets_min": 1978 + }, + { + "epoch": 1.605552645364065, + "grad_norm": 0.6326176079391664, + "learning_rate": 3.799892548925963e-05, + "loss": 0.2958, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19109661877155304, + "step": 3065, + "valid_targets_mean": 4160.0, + "valid_targets_min": 2642 + }, + { + "epoch": 1.608171817705605, + "grad_norm": 0.6106544881530916, + "learning_rate": 3.798752034224502e-05, + "loss": 0.305, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11555371433496475, + "step": 3070, + "valid_targets_mean": 2937.1, + "valid_targets_min": 1510 + }, + { + "epoch": 1.610790990047145, + "grad_norm": 0.7650744871424319, + "learning_rate": 3.7976084507229993e-05, + "loss": 0.2901, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1490192413330078, + "step": 3075, + "valid_targets_mean": 2744.2, + "valid_targets_min": 987 + }, + { + "epoch": 1.6134101623886852, + "grad_norm": 0.6605609372990109, + "learning_rate": 3.79646180037249e-05, + "loss": 0.2927, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13533622026443481, + "step": 3080, + "valid_targets_mean": 3638.4, + "valid_targets_min": 1428 + }, + { + "epoch": 1.6160293347302253, + "grad_norm": 0.5621241160860045, + "learning_rate": 3.7953120851292434e-05, + "loss": 0.2865, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1694134920835495, + "step": 3085, + "valid_targets_mean": 4731.5, + "valid_targets_min": 1700 + }, + { + "epoch": 1.6186485070717653, + "grad_norm": 0.4700900499169939, + "learning_rate": 3.794159306954754e-05, + "loss": 0.2795, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13708017766475677, + "step": 3090, + "valid_targets_mean": 5699.6, + "valid_targets_min": 1767 + }, + { + "epoch": 1.6212676794133054, + "grad_norm": 0.49097823508639377, + "learning_rate": 3.793003467815746e-05, + "loss": 0.2907, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12990702688694, + "step": 3095, + "valid_targets_mean": 4101.5, + "valid_targets_min": 2684 + }, + { + "epoch": 1.6238868517548455, + "grad_norm": 0.6395190214185987, + "learning_rate": 3.791844569684163e-05, + "loss": 0.2807, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12870249152183533, + "step": 3100, + "valid_targets_mean": 2761.2, + "valid_targets_min": 1542 + }, + { + "epoch": 1.6265060240963856, + "grad_norm": 0.6030725114729525, + "learning_rate": 3.790682614537168e-05, + "loss": 0.2891, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11910074204206467, + "step": 3105, + "valid_targets_mean": 2765.8, + "valid_targets_min": 1476 + }, + { + "epoch": 1.6291251964379256, + "grad_norm": 0.5808334324956393, + "learning_rate": 3.7895176043571406e-05, + "loss": 0.2862, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14055724442005157, + "step": 3110, + "valid_targets_mean": 3884.5, + "valid_targets_min": 1711 + }, + { + "epoch": 1.6317443687794657, + "grad_norm": 0.5901410595832308, + "learning_rate": 3.7883495411316716e-05, + "loss": 0.297, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.147047758102417, + "step": 3115, + "valid_targets_mean": 3235.6, + "valid_targets_min": 1669 + }, + { + "epoch": 1.6343635411210058, + "grad_norm": 0.632321140577519, + "learning_rate": 3.787178426853561e-05, + "loss": 0.3023, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14954209327697754, + "step": 3120, + "valid_targets_mean": 3388.5, + "valid_targets_min": 1624 + }, + { + "epoch": 1.6369827134625459, + "grad_norm": 0.6492849577970939, + "learning_rate": 3.786004263520812e-05, + "loss": 0.2919, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16489383578300476, + "step": 3125, + "valid_targets_mean": 3380.9, + "valid_targets_min": 1676 + }, + { + "epoch": 1.639601885804086, + "grad_norm": 0.6179749169137074, + "learning_rate": 3.784827053136634e-05, + "loss": 0.3115, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12462452799081802, + "step": 3130, + "valid_targets_mean": 3148.4, + "valid_targets_min": 1500 + }, + { + "epoch": 1.642221058145626, + "grad_norm": 0.5304284636990658, + "learning_rate": 3.783646797709431e-05, + "loss": 0.2852, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13992038369178772, + "step": 3135, + "valid_targets_mean": 4343.5, + "valid_targets_min": 2556 + }, + { + "epoch": 1.644840230487166, + "grad_norm": 0.5670035842137175, + "learning_rate": 3.782463499252804e-05, + "loss": 0.3041, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11929184198379517, + "step": 3140, + "valid_targets_mean": 3299.5, + "valid_targets_min": 1241 + }, + { + "epoch": 1.6474594028287062, + "grad_norm": 0.6174416573018309, + "learning_rate": 3.781277159785544e-05, + "loss": 0.3095, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18445512652397156, + "step": 3145, + "valid_targets_mean": 3547.0, + "valid_targets_min": 992 + }, + { + "epoch": 1.6500785751702463, + "grad_norm": 0.5931150254553617, + "learning_rate": 3.780087781331632e-05, + "loss": 0.2893, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15835313498973846, + "step": 3150, + "valid_targets_mean": 4328.6, + "valid_targets_min": 1133 + }, + { + "epoch": 1.6526977475117863, + "grad_norm": 0.5789403612166983, + "learning_rate": 3.7788953659202346e-05, + "loss": 0.2915, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15773682296276093, + "step": 3155, + "valid_targets_mean": 4202.6, + "valid_targets_min": 2369 + }, + { + "epoch": 1.6553169198533264, + "grad_norm": 0.5600810789182009, + "learning_rate": 3.7776999155856954e-05, + "loss": 0.2977, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12007777392864227, + "step": 3160, + "valid_targets_mean": 3563.0, + "valid_targets_min": 1919 + }, + { + "epoch": 1.6579360921948663, + "grad_norm": 0.6972311923198078, + "learning_rate": 3.776501432367539e-05, + "loss": 0.3011, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16129465401172638, + "step": 3165, + "valid_targets_mean": 3975.5, + "valid_targets_min": 2902 + }, + { + "epoch": 1.6605552645364066, + "grad_norm": 0.6683336450697415, + "learning_rate": 3.775299918310466e-05, + "loss": 0.2989, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18373434245586395, + "step": 3170, + "valid_targets_mean": 2975.5, + "valid_targets_min": 617 + }, + { + "epoch": 1.6631744368779464, + "grad_norm": 0.5676551411040464, + "learning_rate": 3.774095375464342e-05, + "loss": 0.2722, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12359879910945892, + "step": 3175, + "valid_targets_mean": 3290.4, + "valid_targets_min": 1349 + }, + { + "epoch": 1.6657936092194867, + "grad_norm": 0.6074011986936779, + "learning_rate": 3.772887805884207e-05, + "loss": 0.2822, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1485823392868042, + "step": 3180, + "valid_targets_mean": 3459.0, + "valid_targets_min": 1769 + }, + { + "epoch": 1.6684127815610266, + "grad_norm": 0.5214724890996397, + "learning_rate": 3.7716772116302585e-05, + "loss": 0.2848, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13624684512615204, + "step": 3185, + "valid_targets_mean": 4186.1, + "valid_targets_min": 2097 + }, + { + "epoch": 1.6710319539025669, + "grad_norm": 0.6182861701326247, + "learning_rate": 3.770463594767859e-05, + "loss": 0.2928, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15617293119430542, + "step": 3190, + "valid_targets_mean": 3304.0, + "valid_targets_min": 1066 + }, + { + "epoch": 1.6736511262441067, + "grad_norm": 0.5120195811384913, + "learning_rate": 3.769246957367525e-05, + "loss": 0.2819, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13785767555236816, + "step": 3195, + "valid_targets_mean": 4457.9, + "valid_targets_min": 2635 + }, + { + "epoch": 1.676270298585647, + "grad_norm": 0.5692443938196813, + "learning_rate": 3.768027301504928e-05, + "loss": 0.3019, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15586672723293304, + "step": 3200, + "valid_targets_mean": 4296.2, + "valid_targets_min": 981 + }, + { + "epoch": 1.6788894709271869, + "grad_norm": 0.5517023110408084, + "learning_rate": 3.7668046292608885e-05, + "loss": 0.2793, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13861095905303955, + "step": 3205, + "valid_targets_mean": 4020.1, + "valid_targets_min": 2131 + }, + { + "epoch": 1.6815086432687272, + "grad_norm": 0.7075129242556276, + "learning_rate": 3.765578942721372e-05, + "loss": 0.2917, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14743347465991974, + "step": 3210, + "valid_targets_mean": 3541.0, + "valid_targets_min": 1353 + }, + { + "epoch": 1.684127815610267, + "grad_norm": 0.50982123500427, + "learning_rate": 3.764350243977488e-05, + "loss": 0.2858, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11397814750671387, + "step": 3215, + "valid_targets_mean": 3362.0, + "valid_targets_min": 1509 + }, + { + "epoch": 1.6867469879518073, + "grad_norm": 0.5199391510603668, + "learning_rate": 3.763118535125486e-05, + "loss": 0.2752, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12962158024311066, + "step": 3220, + "valid_targets_mean": 3918.9, + "valid_targets_min": 2128 + }, + { + "epoch": 1.6893661602933472, + "grad_norm": 0.5455390582889343, + "learning_rate": 3.761883818266748e-05, + "loss": 0.2715, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1064610630273819, + "step": 3225, + "valid_targets_mean": 2919.0, + "valid_targets_min": 1687 + }, + { + "epoch": 1.6919853326348875, + "grad_norm": 0.6119127564819121, + "learning_rate": 3.76064609550779e-05, + "loss": 0.2781, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.161942720413208, + "step": 3230, + "valid_targets_mean": 3696.9, + "valid_targets_min": 1803 + }, + { + "epoch": 1.6946045049764273, + "grad_norm": 0.618712313943341, + "learning_rate": 3.759405368960257e-05, + "loss": 0.2781, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13463839888572693, + "step": 3235, + "valid_targets_mean": 4102.0, + "valid_targets_min": 2263 + }, + { + "epoch": 1.6972236773179676, + "grad_norm": 0.5470521788680083, + "learning_rate": 3.7581616407409156e-05, + "loss": 0.2811, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16817307472229004, + "step": 3240, + "valid_targets_mean": 4621.4, + "valid_targets_min": 2232 + }, + { + "epoch": 1.6998428496595075, + "grad_norm": 0.600468764132397, + "learning_rate": 3.756914912971657e-05, + "loss": 0.2717, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16401325166225433, + "step": 3245, + "valid_targets_mean": 4051.6, + "valid_targets_min": 873 + }, + { + "epoch": 1.7024620220010478, + "grad_norm": 0.5871156474593303, + "learning_rate": 3.755665187779487e-05, + "loss": 0.2772, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12342692911624908, + "step": 3250, + "valid_targets_mean": 3340.1, + "valid_targets_min": 1942 + }, + { + "epoch": 1.7050811943425876, + "grad_norm": 0.618710048195054, + "learning_rate": 3.754412467296528e-05, + "loss": 0.2818, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14007382094860077, + "step": 3255, + "valid_targets_mean": 3179.4, + "valid_targets_min": 897 + }, + { + "epoch": 1.707700366684128, + "grad_norm": 0.584669972621538, + "learning_rate": 3.7531567536600096e-05, + "loss": 0.2991, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14600828289985657, + "step": 3260, + "valid_targets_mean": 3492.2, + "valid_targets_min": 1695 + }, + { + "epoch": 1.7103195390256678, + "grad_norm": 0.6040311028107254, + "learning_rate": 3.75189804901227e-05, + "loss": 0.2834, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13014143705368042, + "step": 3265, + "valid_targets_mean": 4043.9, + "valid_targets_min": 1712 + }, + { + "epoch": 1.712938711367208, + "grad_norm": 0.5891106352840271, + "learning_rate": 3.75063635550075e-05, + "loss": 0.2828, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12240810692310333, + "step": 3270, + "valid_targets_mean": 2987.9, + "valid_targets_min": 993 + }, + { + "epoch": 1.715557883708748, + "grad_norm": 0.5299023195932661, + "learning_rate": 3.7493716752779885e-05, + "loss": 0.274, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14450840651988983, + "step": 3275, + "valid_targets_mean": 3854.8, + "valid_targets_min": 1679 + }, + { + "epoch": 1.7181770560502883, + "grad_norm": 0.540981281742683, + "learning_rate": 3.748104010501621e-05, + "loss": 0.2837, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13237908482551575, + "step": 3280, + "valid_targets_mean": 3938.8, + "valid_targets_min": 2345 + }, + { + "epoch": 1.720796228391828, + "grad_norm": 0.5468890533600974, + "learning_rate": 3.746833363334374e-05, + "loss": 0.2848, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14428837597370148, + "step": 3285, + "valid_targets_mean": 4507.9, + "valid_targets_min": 3068 + }, + { + "epoch": 1.7234154007333684, + "grad_norm": 0.5226147361815041, + "learning_rate": 3.745559735944064e-05, + "loss": 0.2876, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13451524078845978, + "step": 3290, + "valid_targets_mean": 4080.9, + "valid_targets_min": 2965 + }, + { + "epoch": 1.7260345730749083, + "grad_norm": 0.5913684135118995, + "learning_rate": 3.74428313050359e-05, + "loss": 0.2848, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1181318536400795, + "step": 3295, + "valid_targets_mean": 2993.5, + "valid_targets_min": 1817 + }, + { + "epoch": 1.7286537454164486, + "grad_norm": 0.5572804765560735, + "learning_rate": 3.743003549190933e-05, + "loss": 0.2828, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13754969835281372, + "step": 3300, + "valid_targets_mean": 3795.2, + "valid_targets_min": 1727 + }, + { + "epoch": 1.7312729177579884, + "grad_norm": 0.5331802199450895, + "learning_rate": 3.741720994189149e-05, + "loss": 0.2812, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14808553457260132, + "step": 3305, + "valid_targets_mean": 4095.9, + "valid_targets_min": 2491 + }, + { + "epoch": 1.7338920900995285, + "grad_norm": 0.5780295247817255, + "learning_rate": 3.740435467686371e-05, + "loss": 0.2245, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12938253581523895, + "step": 3310, + "valid_targets_mean": 2046.1, + "valid_targets_min": 333 + }, + { + "epoch": 1.7365112624410686, + "grad_norm": 0.4291125213521186, + "learning_rate": 3.739146971875798e-05, + "loss": 0.1269, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06559838354587555, + "step": 3315, + "valid_targets_mean": 3455.9, + "valid_targets_min": 712 + }, + { + "epoch": 1.7391304347826086, + "grad_norm": 0.49518588227739074, + "learning_rate": 3.737855508955696e-05, + "loss": 0.1147, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05264649912714958, + "step": 3320, + "valid_targets_mean": 2452.6, + "valid_targets_min": 732 + }, + { + "epoch": 1.7417496071241487, + "grad_norm": 0.4791849034140046, + "learning_rate": 3.736561081129395e-05, + "loss": 0.1227, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.053869135677814484, + "step": 3325, + "valid_targets_mean": 2228.9, + "valid_targets_min": 803 + }, + { + "epoch": 1.7443687794656888, + "grad_norm": 0.38578294663538254, + "learning_rate": 3.7352636906052804e-05, + "loss": 0.1077, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05738483741879463, + "step": 3330, + "valid_targets_mean": 3038.6, + "valid_targets_min": 818 + }, + { + "epoch": 1.7469879518072289, + "grad_norm": 0.4318151690490142, + "learning_rate": 3.733963339596795e-05, + "loss": 0.1175, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06107759475708008, + "step": 3335, + "valid_targets_mean": 3049.4, + "valid_targets_min": 1524 + }, + { + "epoch": 1.749607124148769, + "grad_norm": 0.7982300239873034, + "learning_rate": 3.7326600303224286e-05, + "loss": 0.1683, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07463137805461884, + "step": 3340, + "valid_targets_mean": 1256.1, + "valid_targets_min": 539 + }, + { + "epoch": 1.752226296490309, + "grad_norm": 0.39247918274137605, + "learning_rate": 3.731353765005723e-05, + "loss": 0.1285, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.054993003606796265, + "step": 3345, + "valid_targets_mean": 3597.0, + "valid_targets_min": 2920 + }, + { + "epoch": 1.754845468831849, + "grad_norm": 0.6197858134037353, + "learning_rate": 3.730044545875258e-05, + "loss": 0.1259, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06043145805597305, + "step": 3350, + "valid_targets_mean": 2737.9, + "valid_targets_min": 1048 + }, + { + "epoch": 1.7574646411733892, + "grad_norm": 0.3204751526751142, + "learning_rate": 3.728732375164657e-05, + "loss": 0.1564, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04147946089506149, + "step": 3355, + "valid_targets_mean": 4340.1, + "valid_targets_min": 962 + }, + { + "epoch": 1.7600838135149293, + "grad_norm": 0.3381245996923048, + "learning_rate": 3.727417255112577e-05, + "loss": 0.0978, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06389027833938599, + "step": 3360, + "valid_targets_mean": 4283.1, + "valid_targets_min": 2091 + }, + { + "epoch": 1.7627029858564693, + "grad_norm": 0.3499036909764462, + "learning_rate": 3.7260991879627077e-05, + "loss": 0.1097, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05116523802280426, + "step": 3365, + "valid_targets_mean": 4320.9, + "valid_targets_min": 3349 + }, + { + "epoch": 1.7653221581980094, + "grad_norm": 0.34840836148116416, + "learning_rate": 3.724778175963765e-05, + "loss": 0.1115, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05876196548342705, + "step": 3370, + "valid_targets_mean": 3895.9, + "valid_targets_min": 518 + }, + { + "epoch": 1.7679413305395495, + "grad_norm": 0.5146942827484791, + "learning_rate": 3.723454221369491e-05, + "loss": 0.1585, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06485970318317413, + "step": 3375, + "valid_targets_mean": 2219.6, + "valid_targets_min": 549 + }, + { + "epoch": 1.7705605028810896, + "grad_norm": 0.3655799217404372, + "learning_rate": 3.7221273264386476e-05, + "loss": 0.1015, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04247612878680229, + "step": 3380, + "valid_targets_mean": 3700.2, + "valid_targets_min": 2724 + }, + { + "epoch": 1.7731796752226296, + "grad_norm": 0.5511475710791736, + "learning_rate": 3.720797493435012e-05, + "loss": 0.1214, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.057143114507198334, + "step": 3385, + "valid_targets_mean": 1672.5, + "valid_targets_min": 775 + }, + { + "epoch": 1.7757988475641697, + "grad_norm": 0.3703889552448537, + "learning_rate": 3.7194647246273745e-05, + "loss": 0.0984, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.02953612431883812, + "step": 3390, + "valid_targets_mean": 3546.2, + "valid_targets_min": 3183 + }, + { + "epoch": 1.7784180199057098, + "grad_norm": 0.44206201540152384, + "learning_rate": 3.718129022289536e-05, + "loss": 0.116, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.052335482090711594, + "step": 3395, + "valid_targets_mean": 2473.2, + "valid_targets_min": 577 + }, + { + "epoch": 1.7810371922472499, + "grad_norm": 0.588365869244826, + "learning_rate": 3.7167903887002984e-05, + "loss": 0.1298, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08485578745603561, + "step": 3400, + "valid_targets_mean": 1597.0, + "valid_targets_min": 557 + }, + { + "epoch": 1.78365636458879, + "grad_norm": 0.4247359837759308, + "learning_rate": 3.715448826143468e-05, + "loss": 0.1239, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06827764213085175, + "step": 3405, + "valid_targets_mean": 3019.1, + "valid_targets_min": 774 + }, + { + "epoch": 1.78627553693033, + "grad_norm": 0.4115914246403156, + "learning_rate": 3.7141043369078466e-05, + "loss": 0.1267, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.052259765565395355, + "step": 3410, + "valid_targets_mean": 1825.8, + "valid_targets_min": 680 + }, + { + "epoch": 1.78889470927187, + "grad_norm": 0.5027405469936328, + "learning_rate": 3.712756923287229e-05, + "loss": 0.1726, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08953357487916946, + "step": 3415, + "valid_targets_mean": 3686.9, + "valid_targets_min": 2819 + }, + { + "epoch": 1.7915138816134102, + "grad_norm": 0.341914931576673, + "learning_rate": 3.711406587580399e-05, + "loss": 0.1053, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04390271008014679, + "step": 3420, + "valid_targets_mean": 4137.8, + "valid_targets_min": 3927 + }, + { + "epoch": 1.7941330539549503, + "grad_norm": 0.5547878511262697, + "learning_rate": 3.710053332091128e-05, + "loss": 0.1191, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07518318295478821, + "step": 3425, + "valid_targets_mean": 1376.1, + "valid_targets_min": 714 + }, + { + "epoch": 1.7967522262964903, + "grad_norm": 0.38780164210154305, + "learning_rate": 3.708697159128165e-05, + "loss": 0.1511, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.053412362933158875, + "step": 3430, + "valid_targets_mean": 3432.0, + "valid_targets_min": 754 + }, + { + "epoch": 1.7993713986380304, + "grad_norm": 0.3622569328164762, + "learning_rate": 3.7073380710052394e-05, + "loss": 0.1338, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.057908304035663605, + "step": 3435, + "valid_targets_mean": 3855.2, + "valid_targets_min": 3178 + }, + { + "epoch": 1.8019905709795705, + "grad_norm": 0.7660458310395545, + "learning_rate": 3.705976070041053e-05, + "loss": 0.1567, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1433018147945404, + "step": 3440, + "valid_targets_mean": 1566.6, + "valid_targets_min": 920 + }, + { + "epoch": 1.8046097433211106, + "grad_norm": 0.4264581704629832, + "learning_rate": 3.704611158559277e-05, + "loss": 0.3033, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.057927440851926804, + "step": 3445, + "valid_targets_mean": 3478.0, + "valid_targets_min": 2314 + }, + { + "epoch": 1.8072289156626506, + "grad_norm": 0.421070094231295, + "learning_rate": 3.703243338888548e-05, + "loss": 0.1302, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04688467085361481, + "step": 3450, + "valid_targets_mean": 2561.1, + "valid_targets_min": 833 + }, + { + "epoch": 1.8098480880041907, + "grad_norm": 0.4449631252726508, + "learning_rate": 3.701872613362466e-05, + "loss": 0.1251, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0818537250161171, + "step": 3455, + "valid_targets_mean": 3509.2, + "valid_targets_min": 1803 + }, + { + "epoch": 1.8124672603457308, + "grad_norm": 0.40631985479418165, + "learning_rate": 3.7004989843195846e-05, + "loss": 0.2259, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07911115139722824, + "step": 3460, + "valid_targets_mean": 4291.4, + "valid_targets_min": 3089 + }, + { + "epoch": 1.8150864326872709, + "grad_norm": 0.2501241430639796, + "learning_rate": 3.6991224541034155e-05, + "loss": 0.0919, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.045642465353012085, + "step": 3465, + "valid_targets_mean": 4843.2, + "valid_targets_min": 2664 + }, + { + "epoch": 1.8177056050288107, + "grad_norm": 0.3398211835960956, + "learning_rate": 3.697743025062418e-05, + "loss": 0.1262, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03657059744000435, + "step": 3470, + "valid_targets_mean": 3042.1, + "valid_targets_min": 560 + }, + { + "epoch": 1.820324777370351, + "grad_norm": 0.3910868523973532, + "learning_rate": 3.696360699549996e-05, + "loss": 0.1246, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0625862404704094, + "step": 3475, + "valid_targets_mean": 3863.6, + "valid_targets_min": 1615 + }, + { + "epoch": 1.8229439497118909, + "grad_norm": 0.3456416958516906, + "learning_rate": 3.694975479924496e-05, + "loss": 0.1068, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03799763694405556, + "step": 3480, + "valid_targets_mean": 3312.5, + "valid_targets_min": 2172 + }, + { + "epoch": 1.8255631220534312, + "grad_norm": 0.4206614882492888, + "learning_rate": 3.693587368549203e-05, + "loss": 0.1037, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04803289473056793, + "step": 3485, + "valid_targets_mean": 3059.9, + "valid_targets_min": 536 + }, + { + "epoch": 1.828182294394971, + "grad_norm": 0.3680179904899294, + "learning_rate": 3.6921963677923336e-05, + "loss": 0.1096, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05506697669625282, + "step": 3490, + "valid_targets_mean": 3881.0, + "valid_targets_min": 3295 + }, + { + "epoch": 1.8308014667365113, + "grad_norm": 0.3696429312740505, + "learning_rate": 3.6908024800270364e-05, + "loss": 0.1021, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.045204613357782364, + "step": 3495, + "valid_targets_mean": 3287.2, + "valid_targets_min": 820 + }, + { + "epoch": 1.8334206390780512, + "grad_norm": 0.5566468816324691, + "learning_rate": 3.689405707631383e-05, + "loss": 0.1574, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1554620862007141, + "step": 3500, + "valid_targets_mean": 2566.6, + "valid_targets_min": 1046 + }, + { + "epoch": 1.8360398114195915, + "grad_norm": 0.33316738802021517, + "learning_rate": 3.688006052988366e-05, + "loss": 0.1002, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05008360370993614, + "step": 3505, + "valid_targets_mean": 3590.1, + "valid_targets_min": 2719 + }, + { + "epoch": 1.8386589837611313, + "grad_norm": 0.6472921695898947, + "learning_rate": 3.6866035184858996e-05, + "loss": 0.1043, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08209703117609024, + "step": 3510, + "valid_targets_mean": 1638.1, + "valid_targets_min": 699 + }, + { + "epoch": 1.8412781561026716, + "grad_norm": 0.3288394336914071, + "learning_rate": 3.685198106516806e-05, + "loss": 0.0967, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04378296434879303, + "step": 3515, + "valid_targets_mean": 3621.6, + "valid_targets_min": 2353 + }, + { + "epoch": 1.8438973284442115, + "grad_norm": 0.39765837004469934, + "learning_rate": 3.683789819478819e-05, + "loss": 0.0999, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05021953955292702, + "step": 3520, + "valid_targets_mean": 2328.1, + "valid_targets_min": 549 + }, + { + "epoch": 1.8465165007857518, + "grad_norm": 0.36074171564719126, + "learning_rate": 3.682378659774579e-05, + "loss": 0.1633, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04425311088562012, + "step": 3525, + "valid_targets_mean": 3330.4, + "valid_targets_min": 908 + }, + { + "epoch": 1.8491356731272917, + "grad_norm": 0.3865231180181791, + "learning_rate": 3.680964629811624e-05, + "loss": 0.1318, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08880967646837234, + "step": 3530, + "valid_targets_mean": 3458.4, + "valid_targets_min": 2196 + }, + { + "epoch": 1.851754845468832, + "grad_norm": 0.35925425435447844, + "learning_rate": 3.6795477320023915e-05, + "loss": 0.1228, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04197625070810318, + "step": 3535, + "valid_targets_mean": 1252.1, + "valid_targets_min": 598 + }, + { + "epoch": 1.8543740178103718, + "grad_norm": 0.8289333790703438, + "learning_rate": 3.6781279687642105e-05, + "loss": 0.1429, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1264137625694275, + "step": 3540, + "valid_targets_mean": 1353.1, + "valid_targets_min": 578 + }, + { + "epoch": 1.856993190151912, + "grad_norm": 0.6176220078989897, + "learning_rate": 3.676705342519299e-05, + "loss": 0.1667, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09037410467863083, + "step": 3545, + "valid_targets_mean": 1974.2, + "valid_targets_min": 695 + }, + { + "epoch": 1.859612362493452, + "grad_norm": 0.5105167569485973, + "learning_rate": 3.675279855694759e-05, + "loss": 0.1142, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.049207840114831924, + "step": 3550, + "valid_targets_mean": 1724.5, + "valid_targets_min": 691 + }, + { + "epoch": 1.8622315348349923, + "grad_norm": 0.3471757300765962, + "learning_rate": 3.673851510722574e-05, + "loss": 0.1396, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04608806222677231, + "step": 3555, + "valid_targets_mean": 3842.6, + "valid_targets_min": 2024 + }, + { + "epoch": 1.8648507071765321, + "grad_norm": 0.6162071645345287, + "learning_rate": 3.672420310039603e-05, + "loss": 0.1231, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07409866899251938, + "step": 3560, + "valid_targets_mean": 1651.0, + "valid_targets_min": 523 + }, + { + "epoch": 1.8674698795180724, + "grad_norm": 0.31578727458606826, + "learning_rate": 3.670986256087577e-05, + "loss": 0.1079, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04291585460305214, + "step": 3565, + "valid_targets_mean": 3532.5, + "valid_targets_min": 468 + }, + { + "epoch": 1.8700890518596123, + "grad_norm": 0.28444034402660834, + "learning_rate": 3.669549351313094e-05, + "loss": 0.1133, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.028033385053277016, + "step": 3570, + "valid_targets_mean": 5298.0, + "valid_targets_min": 1195 + }, + { + "epoch": 1.8727082242011526, + "grad_norm": 0.3262378658558787, + "learning_rate": 3.668109598167618e-05, + "loss": 0.1018, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0372658334672451, + "step": 3575, + "valid_targets_mean": 3562.6, + "valid_targets_min": 459 + }, + { + "epoch": 1.8753273965426924, + "grad_norm": 0.3356185013987389, + "learning_rate": 3.666666999107471e-05, + "loss": 0.1013, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04638240486383438, + "step": 3580, + "valid_targets_mean": 3548.0, + "valid_targets_min": 981 + }, + { + "epoch": 1.8779465688842327, + "grad_norm": 0.421021617725726, + "learning_rate": 3.6652215565938296e-05, + "loss": 0.114, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06632312387228012, + "step": 3585, + "valid_targets_mean": 2130.1, + "valid_targets_min": 697 + }, + { + "epoch": 1.8805657412257726, + "grad_norm": 0.4194821722809897, + "learning_rate": 3.663773273092723e-05, + "loss": 0.1235, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05778392404317856, + "step": 3590, + "valid_targets_mean": 3661.6, + "valid_targets_min": 2759 + }, + { + "epoch": 1.8831849135673129, + "grad_norm": 0.5582186855630541, + "learning_rate": 3.662322151075027e-05, + "loss": 0.12, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.059523727744817734, + "step": 3595, + "valid_targets_mean": 3909.5, + "valid_targets_min": 3391 + }, + { + "epoch": 1.8858040859088527, + "grad_norm": 0.3249548361125933, + "learning_rate": 3.660868193016459e-05, + "loss": 0.1049, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04768374562263489, + "step": 3600, + "valid_targets_mean": 3319.9, + "valid_targets_min": 1099 + }, + { + "epoch": 1.888423258250393, + "grad_norm": 0.3762130049174686, + "learning_rate": 3.6594114013975773e-05, + "loss": 0.107, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05660580098628998, + "step": 3605, + "valid_targets_mean": 3717.0, + "valid_targets_min": 1874 + }, + { + "epoch": 1.8910424305919329, + "grad_norm": 0.3431053442027875, + "learning_rate": 3.6579517787037716e-05, + "loss": 0.1232, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05007211118936539, + "step": 3610, + "valid_targets_mean": 3263.5, + "valid_targets_min": 724 + }, + { + "epoch": 1.8936616029334732, + "grad_norm": 0.28758993152211504, + "learning_rate": 3.656489327425264e-05, + "loss": 0.0923, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.041469305753707886, + "step": 3615, + "valid_targets_mean": 3707.5, + "valid_targets_min": 2769 + }, + { + "epoch": 1.896280775275013, + "grad_norm": 0.41053107516302273, + "learning_rate": 3.6550240500571e-05, + "loss": 0.1204, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05078805983066559, + "step": 3620, + "valid_targets_mean": 2815.8, + "valid_targets_min": 645 + }, + { + "epoch": 1.8988999476165531, + "grad_norm": 0.3576607627383553, + "learning_rate": 3.653555949099149e-05, + "loss": 0.1134, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.047421231865882874, + "step": 3625, + "valid_targets_mean": 3488.8, + "valid_targets_min": 600 + }, + { + "epoch": 1.9015191199580932, + "grad_norm": 0.378035252875767, + "learning_rate": 3.652085027056095e-05, + "loss": 0.1336, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05577198788523674, + "step": 3630, + "valid_targets_mean": 3373.4, + "valid_targets_min": 1648 + }, + { + "epoch": 1.9041382922996333, + "grad_norm": 0.4165422980003152, + "learning_rate": 3.6506112864374394e-05, + "loss": 0.1171, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07040315866470337, + "step": 3635, + "valid_targets_mean": 2555.0, + "valid_targets_min": 821 + }, + { + "epoch": 1.9067574646411733, + "grad_norm": 0.8415366072166318, + "learning_rate": 3.6491347297574874e-05, + "loss": 0.1323, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07888585329055786, + "step": 3640, + "valid_targets_mean": 867.1, + "valid_targets_min": 612 + }, + { + "epoch": 1.9093766369827134, + "grad_norm": 0.5041458430821508, + "learning_rate": 3.647655359535351e-05, + "loss": 0.1152, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08341926336288452, + "step": 3645, + "valid_targets_mean": 2202.1, + "valid_targets_min": 830 + }, + { + "epoch": 1.9119958093242535, + "grad_norm": 0.40226385036764234, + "learning_rate": 3.646173178294942e-05, + "loss": 0.1279, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05278739333152771, + "step": 3650, + "valid_targets_mean": 3027.0, + "valid_targets_min": 1146 + }, + { + "epoch": 1.9146149816657936, + "grad_norm": 0.4110868173650747, + "learning_rate": 3.644688188564968e-05, + "loss": 0.1134, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0692356526851654, + "step": 3655, + "valid_targets_mean": 3296.6, + "valid_targets_min": 2760 + }, + { + "epoch": 1.9172341540073337, + "grad_norm": 0.592891977918973, + "learning_rate": 3.643200392878928e-05, + "loss": 0.1067, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07121525704860687, + "step": 3660, + "valid_targets_mean": 1469.5, + "valid_targets_min": 628 + }, + { + "epoch": 1.9198533263488737, + "grad_norm": 0.5921042005229938, + "learning_rate": 3.641709793775108e-05, + "loss": 0.1316, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10891153663396835, + "step": 3665, + "valid_targets_mean": 1752.1, + "valid_targets_min": 691 + }, + { + "epoch": 1.9224724986904138, + "grad_norm": 0.2899199301344974, + "learning_rate": 3.640216393796578e-05, + "loss": 0.1038, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0305730439722538, + "step": 3670, + "valid_targets_mean": 3863.9, + "valid_targets_min": 3613 + }, + { + "epoch": 1.9250916710319539, + "grad_norm": 0.34772988219079837, + "learning_rate": 3.6387201954911835e-05, + "loss": 0.1022, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.051469407975673676, + "step": 3675, + "valid_targets_mean": 4304.2, + "valid_targets_min": 1773 + }, + { + "epoch": 1.927710843373494, + "grad_norm": 0.362820734701823, + "learning_rate": 3.637221201411549e-05, + "loss": 0.1102, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.058442264795303345, + "step": 3680, + "valid_targets_mean": 1971.9, + "valid_targets_min": 762 + }, + { + "epoch": 1.930330015715034, + "grad_norm": 0.39901476818103243, + "learning_rate": 3.6357194141150636e-05, + "loss": 0.0967, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0717681273818016, + "step": 3685, + "valid_targets_mean": 4554.1, + "valid_targets_min": 946 + }, + { + "epoch": 1.9329491880565741, + "grad_norm": 0.36834707097157554, + "learning_rate": 3.634214836163885e-05, + "loss": 0.0921, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0641884058713913, + "step": 3690, + "valid_targets_mean": 5015.5, + "valid_targets_min": 4104 + }, + { + "epoch": 1.9355683603981142, + "grad_norm": 0.37260637980081013, + "learning_rate": 3.632707470124931e-05, + "loss": 0.1159, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05261462181806564, + "step": 3695, + "valid_targets_mean": 3064.4, + "valid_targets_min": 739 + }, + { + "epoch": 1.9381875327396543, + "grad_norm": 0.44098208940525413, + "learning_rate": 3.631197318569877e-05, + "loss": 0.1288, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05642792209982872, + "step": 3700, + "valid_targets_mean": 3863.6, + "valid_targets_min": 3550 + }, + { + "epoch": 1.9408067050811943, + "grad_norm": 0.3466346466006047, + "learning_rate": 3.629684384075148e-05, + "loss": 0.1094, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06260032206773758, + "step": 3705, + "valid_targets_mean": 3474.9, + "valid_targets_min": 704 + }, + { + "epoch": 1.9434258774227344, + "grad_norm": 0.3386632212967048, + "learning_rate": 3.6281686692219215e-05, + "loss": 0.1107, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04761439934372902, + "step": 3710, + "valid_targets_mean": 2568.8, + "valid_targets_min": 774 + }, + { + "epoch": 1.9460450497642745, + "grad_norm": 0.29558164946962245, + "learning_rate": 3.626650176596114e-05, + "loss": 0.1344, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.045535311102867126, + "step": 3715, + "valid_targets_mean": 3486.2, + "valid_targets_min": 888 + }, + { + "epoch": 1.9486642221058146, + "grad_norm": 0.3685079925522479, + "learning_rate": 3.625128908788383e-05, + "loss": 0.1055, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05522261559963226, + "step": 3720, + "valid_targets_mean": 3371.6, + "valid_targets_min": 1048 + }, + { + "epoch": 1.9512833944473547, + "grad_norm": 0.38643874766158975, + "learning_rate": 3.6236048683941207e-05, + "loss": 0.12, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05579588934779167, + "step": 3725, + "valid_targets_mean": 2941.5, + "valid_targets_min": 722 + }, + { + "epoch": 1.9539025667888947, + "grad_norm": 0.40259470466238484, + "learning_rate": 3.62207805801345e-05, + "loss": 0.1144, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06654039025306702, + "step": 3730, + "valid_targets_mean": 2359.2, + "valid_targets_min": 865 + }, + { + "epoch": 1.9565217391304348, + "grad_norm": 0.48631724845097407, + "learning_rate": 3.620548480251218e-05, + "loss": 0.1605, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04295656830072403, + "step": 3735, + "valid_targets_mean": 1747.0, + "valid_targets_min": 570 + }, + { + "epoch": 1.9591409114719749, + "grad_norm": 0.4102309246391661, + "learning_rate": 3.6190161377169946e-05, + "loss": 0.1329, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06898366659879684, + "step": 3740, + "valid_targets_mean": 3704.2, + "valid_targets_min": 2811 + }, + { + "epoch": 1.961760083813515, + "grad_norm": 0.41579990829819685, + "learning_rate": 3.6174810330250664e-05, + "loss": 0.1099, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.047321662306785583, + "step": 3745, + "valid_targets_mean": 1749.1, + "valid_targets_min": 635 + }, + { + "epoch": 1.964379256155055, + "grad_norm": 0.36412973997585185, + "learning_rate": 3.615943168794432e-05, + "loss": 0.1076, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05411919951438904, + "step": 3750, + "valid_targets_mean": 2985.1, + "valid_targets_min": 1591 + }, + { + "epoch": 1.9669984284965951, + "grad_norm": 0.4142314566337443, + "learning_rate": 3.6144025476487976e-05, + "loss": 0.1064, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04836519807577133, + "step": 3755, + "valid_targets_mean": 2912.6, + "valid_targets_min": 800 + }, + { + "epoch": 1.9696176008381352, + "grad_norm": 0.35907542692044886, + "learning_rate": 3.612859172216574e-05, + "loss": 0.0994, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.055306024849414825, + "step": 3760, + "valid_targets_mean": 3084.9, + "valid_targets_min": 860 + }, + { + "epoch": 1.9722367731796753, + "grad_norm": 0.4488371386465046, + "learning_rate": 3.61131304513087e-05, + "loss": 0.1388, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06375181674957275, + "step": 3765, + "valid_targets_mean": 2482.6, + "valid_targets_min": 878 + }, + { + "epoch": 1.9748559455212154, + "grad_norm": 0.3495903817194169, + "learning_rate": 3.60976416902949e-05, + "loss": 0.0939, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.047893598675727844, + "step": 3770, + "valid_targets_mean": 3403.2, + "valid_targets_min": 1024 + }, + { + "epoch": 1.9774751178627552, + "grad_norm": 0.4355827963253253, + "learning_rate": 3.608212546554927e-05, + "loss": 0.1071, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05321928486227989, + "step": 3775, + "valid_targets_mean": 2173.1, + "valid_targets_min": 786 + }, + { + "epoch": 1.9800942902042955, + "grad_norm": 0.43601912121827463, + "learning_rate": 3.6066581803543605e-05, + "loss": 0.1098, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06638313829898834, + "step": 3780, + "valid_targets_mean": 3233.9, + "valid_targets_min": 2573 + }, + { + "epoch": 1.9827134625458354, + "grad_norm": 0.307649421102193, + "learning_rate": 3.605101073079651e-05, + "loss": 0.1085, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.056634437292814255, + "step": 3785, + "valid_targets_mean": 3821.9, + "valid_targets_min": 2274 + }, + { + "epoch": 1.9853326348873757, + "grad_norm": 0.3786213196256713, + "learning_rate": 3.6035412273873355e-05, + "loss": 0.0957, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0659828782081604, + "step": 3790, + "valid_targets_mean": 3791.2, + "valid_targets_min": 892 + }, + { + "epoch": 1.9879518072289155, + "grad_norm": 0.3037949300453433, + "learning_rate": 3.601978645938623e-05, + "loss": 0.1047, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.042338401079177856, + "step": 3795, + "valid_targets_mean": 4820.4, + "valid_targets_min": 4491 + }, + { + "epoch": 1.9905709795704558, + "grad_norm": 0.516157150218108, + "learning_rate": 3.6004133313993874e-05, + "loss": 0.1482, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1160566657781601, + "step": 3800, + "valid_targets_mean": 2159.1, + "valid_targets_min": 709 + }, + { + "epoch": 1.9931901519119957, + "grad_norm": 0.30142097086660685, + "learning_rate": 3.5988452864401695e-05, + "loss": 0.1598, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.034394338726997375, + "step": 3805, + "valid_targets_mean": 3430.8, + "valid_targets_min": 1097 + }, + { + "epoch": 1.995809324253536, + "grad_norm": 0.33310269310201696, + "learning_rate": 3.597274513736167e-05, + "loss": 0.1094, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04524791240692139, + "step": 3810, + "valid_targets_mean": 3032.0, + "valid_targets_min": 840 + }, + { + "epoch": 1.9984284965950758, + "grad_norm": 0.31566090994172014, + "learning_rate": 3.595701015967229e-05, + "loss": 0.1029, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04328145459294319, + "step": 3815, + "valid_targets_mean": 3812.2, + "valid_targets_min": 3106 + }, + { + "epoch": 2.001047668936616, + "grad_norm": 0.8926428358074082, + "learning_rate": 3.5941247958178574e-05, + "loss": 0.1922, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1102590411901474, + "step": 3820, + "valid_targets_mean": 1653.2, + "valid_targets_min": 777 + }, + { + "epoch": 2.003666841278156, + "grad_norm": 0.8223433508863462, + "learning_rate": 3.5925458559771954e-05, + "loss": 0.2248, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10741463303565979, + "step": 3825, + "valid_targets_mean": 1349.8, + "valid_targets_min": 788 + }, + { + "epoch": 2.0062860136196963, + "grad_norm": 0.710236684697301, + "learning_rate": 3.590964199139029e-05, + "loss": 0.2042, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08701279759407043, + "step": 3830, + "valid_targets_mean": 1582.2, + "valid_targets_min": 914 + }, + { + "epoch": 2.008905185961236, + "grad_norm": 0.7585428118511915, + "learning_rate": 3.589379828001777e-05, + "loss": 0.202, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09916609525680542, + "step": 3835, + "valid_targets_mean": 1468.5, + "valid_targets_min": 680 + }, + { + "epoch": 2.0115243583027764, + "grad_norm": 0.6791949417976332, + "learning_rate": 3.587792745268492e-05, + "loss": 0.202, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09496802091598511, + "step": 3840, + "valid_targets_mean": 1762.2, + "valid_targets_min": 1058 + }, + { + "epoch": 2.0141435306443163, + "grad_norm": 0.749855232106419, + "learning_rate": 3.586202953646848e-05, + "loss": 0.1994, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09410624951124191, + "step": 3845, + "valid_targets_mean": 1261.5, + "valid_targets_min": 734 + }, + { + "epoch": 2.0167627029858566, + "grad_norm": 0.7015288073990621, + "learning_rate": 3.5846104558491465e-05, + "loss": 0.2087, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10790140926837921, + "step": 3850, + "valid_targets_mean": 1791.1, + "valid_targets_min": 930 + }, + { + "epoch": 2.0193818753273964, + "grad_norm": 0.7924206807083869, + "learning_rate": 3.5830152545923024e-05, + "loss": 0.1861, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11440248787403107, + "step": 3855, + "valid_targets_mean": 1598.8, + "valid_targets_min": 737 + }, + { + "epoch": 2.0220010476689367, + "grad_norm": 0.7386126975367331, + "learning_rate": 3.581417352597843e-05, + "loss": 0.2111, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08926434814929962, + "step": 3860, + "valid_targets_mean": 1449.5, + "valid_targets_min": 759 + }, + { + "epoch": 2.0246202200104766, + "grad_norm": 0.9632976534987181, + "learning_rate": 3.579816752591903e-05, + "loss": 0.1951, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09514357894659042, + "step": 3865, + "valid_targets_mean": 1652.8, + "valid_targets_min": 753 + }, + { + "epoch": 2.027239392352017, + "grad_norm": 0.7834421185090436, + "learning_rate": 3.578213457305222e-05, + "loss": 0.1983, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12458643317222595, + "step": 3870, + "valid_targets_mean": 1675.9, + "valid_targets_min": 780 + }, + { + "epoch": 2.0298585646935567, + "grad_norm": 0.748004283273961, + "learning_rate": 3.5766074694731374e-05, + "loss": 0.2036, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07764267176389694, + "step": 3875, + "valid_targets_mean": 1187.5, + "valid_targets_min": 679 + }, + { + "epoch": 2.032477737035097, + "grad_norm": 0.7663537229597992, + "learning_rate": 3.574998791835578e-05, + "loss": 0.2001, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08690992742776871, + "step": 3880, + "valid_targets_mean": 1200.9, + "valid_targets_min": 771 + }, + { + "epoch": 2.035096909376637, + "grad_norm": 0.6898331140298751, + "learning_rate": 3.573387427137064e-05, + "loss": 0.1842, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08832302689552307, + "step": 3885, + "valid_targets_mean": 1593.0, + "valid_targets_min": 986 + }, + { + "epoch": 2.037716081718177, + "grad_norm": 0.708967320449303, + "learning_rate": 3.5717733781266994e-05, + "loss": 0.1884, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10770932585000992, + "step": 3890, + "valid_targets_mean": 1591.4, + "valid_targets_min": 1103 + }, + { + "epoch": 2.040335254059717, + "grad_norm": 0.7089081171481766, + "learning_rate": 3.5701566475581675e-05, + "loss": 0.1954, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08699934929609299, + "step": 3895, + "valid_targets_mean": 1343.2, + "valid_targets_min": 675 + }, + { + "epoch": 2.0429544264012574, + "grad_norm": 0.6949969333301061, + "learning_rate": 3.568537238189727e-05, + "loss": 0.1966, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10397947579622269, + "step": 3900, + "valid_targets_mean": 1491.6, + "valid_targets_min": 941 + }, + { + "epoch": 2.045573598742797, + "grad_norm": 0.7473021370579906, + "learning_rate": 3.566915152784206e-05, + "loss": 0.2023, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1123787984251976, + "step": 3905, + "valid_targets_mean": 1921.4, + "valid_targets_min": 1062 + }, + { + "epoch": 2.0481927710843375, + "grad_norm": 0.7142355552447804, + "learning_rate": 3.565290394108998e-05, + "loss": 0.2001, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08229781687259674, + "step": 3910, + "valid_targets_mean": 1375.2, + "valid_targets_min": 1023 + }, + { + "epoch": 2.0508119434258774, + "grad_norm": 0.75568883902217, + "learning_rate": 3.56366296493606e-05, + "loss": 0.2029, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09430685639381409, + "step": 3915, + "valid_targets_mean": 1440.0, + "valid_targets_min": 660 + }, + { + "epoch": 2.0534311157674177, + "grad_norm": 0.6820924771511605, + "learning_rate": 3.562032868041901e-05, + "loss": 0.1923, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07597774267196655, + "step": 3920, + "valid_targets_mean": 1234.9, + "valid_targets_min": 658 + }, + { + "epoch": 2.0560502881089575, + "grad_norm": 0.7222333855023938, + "learning_rate": 3.560400106207584e-05, + "loss": 0.2003, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07671467959880829, + "step": 3925, + "valid_targets_mean": 1198.9, + "valid_targets_min": 650 + }, + { + "epoch": 2.058669460450498, + "grad_norm": 0.7836793704441655, + "learning_rate": 3.558764682218717e-05, + "loss": 0.2016, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07579369843006134, + "step": 3930, + "valid_targets_mean": 1354.0, + "valid_targets_min": 863 + }, + { + "epoch": 2.0612886327920377, + "grad_norm": 0.7340836520402091, + "learning_rate": 3.557126598865452e-05, + "loss": 0.1849, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10264989733695984, + "step": 3935, + "valid_targets_mean": 1517.6, + "valid_targets_min": 728 + }, + { + "epoch": 2.063907805133578, + "grad_norm": 0.7224732121013455, + "learning_rate": 3.5554858589424755e-05, + "loss": 0.1956, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09368730336427689, + "step": 3940, + "valid_targets_mean": 1649.9, + "valid_targets_min": 686 + }, + { + "epoch": 2.066526977475118, + "grad_norm": 0.725587499393139, + "learning_rate": 3.553842465249009e-05, + "loss": 0.1893, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09984948486089706, + "step": 3945, + "valid_targets_mean": 1512.1, + "valid_targets_min": 697 + }, + { + "epoch": 2.069146149816658, + "grad_norm": 0.6655391235263616, + "learning_rate": 3.552196420588799e-05, + "loss": 0.1889, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07939508557319641, + "step": 3950, + "valid_targets_mean": 1428.5, + "valid_targets_min": 779 + }, + { + "epoch": 2.071765322158198, + "grad_norm": 0.7260574699338164, + "learning_rate": 3.550547727770115e-05, + "loss": 0.2007, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10762490332126617, + "step": 3955, + "valid_targets_mean": 1555.8, + "valid_targets_min": 1266 + }, + { + "epoch": 2.0743844944997383, + "grad_norm": 0.7434906694477653, + "learning_rate": 3.548896389605748e-05, + "loss": 0.1874, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0947028249502182, + "step": 3960, + "valid_targets_mean": 1495.4, + "valid_targets_min": 1033 + }, + { + "epoch": 2.077003666841278, + "grad_norm": 0.7109038144568908, + "learning_rate": 3.547242408912997e-05, + "loss": 0.1944, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07691630721092224, + "step": 3965, + "valid_targets_mean": 1375.0, + "valid_targets_min": 847 + }, + { + "epoch": 2.0796228391828184, + "grad_norm": 0.7311476978095995, + "learning_rate": 3.545585788513672e-05, + "loss": 0.1917, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09924264997243881, + "step": 3970, + "valid_targets_mean": 1515.8, + "valid_targets_min": 793 + }, + { + "epoch": 2.0822420115243583, + "grad_norm": 0.6821558270361922, + "learning_rate": 3.5439265312340874e-05, + "loss": 0.1949, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08497537672519684, + "step": 3975, + "valid_targets_mean": 1370.6, + "valid_targets_min": 806 + }, + { + "epoch": 2.0848611838658986, + "grad_norm": 0.6821998944070964, + "learning_rate": 3.542264639905054e-05, + "loss": 0.1933, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09639190137386322, + "step": 3980, + "valid_targets_mean": 1514.8, + "valid_targets_min": 803 + }, + { + "epoch": 2.0874803562074384, + "grad_norm": 0.7289424882358152, + "learning_rate": 3.5406001173618785e-05, + "loss": 0.1918, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08458380401134491, + "step": 3985, + "valid_targets_mean": 1385.2, + "valid_targets_min": 800 + }, + { + "epoch": 2.0900995285489787, + "grad_norm": 0.675048563702559, + "learning_rate": 3.5389329664443546e-05, + "loss": 0.1771, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0678868219256401, + "step": 3990, + "valid_targets_mean": 1232.2, + "valid_targets_min": 837 + }, + { + "epoch": 2.0927187008905186, + "grad_norm": 0.678815702539696, + "learning_rate": 3.5372631899967626e-05, + "loss": 0.1901, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08220085501670837, + "step": 3995, + "valid_targets_mean": 1317.6, + "valid_targets_min": 719 + }, + { + "epoch": 2.095337873232059, + "grad_norm": 0.6740938563868182, + "learning_rate": 3.535590790867861e-05, + "loss": 0.1936, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07967671751976013, + "step": 4000, + "valid_targets_mean": 1312.8, + "valid_targets_min": 765 + }, + { + "epoch": 2.0979570455735987, + "grad_norm": 0.7141291054969721, + "learning_rate": 3.5339157719108825e-05, + "loss": 0.1884, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09623882174491882, + "step": 4005, + "valid_targets_mean": 1511.5, + "valid_targets_min": 875 + }, + { + "epoch": 2.1005762179151386, + "grad_norm": 0.7336572112922154, + "learning_rate": 3.532238135983529e-05, + "loss": 0.1885, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08519243448972702, + "step": 4010, + "valid_targets_mean": 1320.1, + "valid_targets_min": 739 + }, + { + "epoch": 2.103195390256679, + "grad_norm": 0.7441682298736509, + "learning_rate": 3.530557885947968e-05, + "loss": 0.1963, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10714493691921234, + "step": 4015, + "valid_targets_mean": 1628.4, + "valid_targets_min": 669 + }, + { + "epoch": 2.1058145625982188, + "grad_norm": 0.7190417323186135, + "learning_rate": 3.528875024670827e-05, + "loss": 0.1828, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09126546233892441, + "step": 4020, + "valid_targets_mean": 1412.2, + "valid_targets_min": 1046 + }, + { + "epoch": 2.108433734939759, + "grad_norm": 0.7170551586019916, + "learning_rate": 3.5271895550231874e-05, + "loss": 0.1982, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12611155211925507, + "step": 4025, + "valid_targets_mean": 2057.2, + "valid_targets_min": 873 + }, + { + "epoch": 2.111052907281299, + "grad_norm": 0.6701651977269235, + "learning_rate": 3.525501479880583e-05, + "loss": 0.1953, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10826807469129562, + "step": 4030, + "valid_targets_mean": 1732.9, + "valid_targets_min": 907 + }, + { + "epoch": 2.113672079622839, + "grad_norm": 0.7644199373172864, + "learning_rate": 3.523810802122989e-05, + "loss": 0.2028, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08702050149440765, + "step": 4035, + "valid_targets_mean": 1521.4, + "valid_targets_min": 764 + }, + { + "epoch": 2.116291251964379, + "grad_norm": 0.6548591291141537, + "learning_rate": 3.522117524634824e-05, + "loss": 0.1863, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07724203914403915, + "step": 4040, + "valid_targets_mean": 1395.0, + "valid_targets_min": 822 + }, + { + "epoch": 2.1189104243059194, + "grad_norm": 0.6815393108692591, + "learning_rate": 3.520421650304942e-05, + "loss": 0.1858, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10110010206699371, + "step": 4045, + "valid_targets_mean": 1654.0, + "valid_targets_min": 1291 + }, + { + "epoch": 2.121529596647459, + "grad_norm": 0.7724843355268597, + "learning_rate": 3.518723182026625e-05, + "loss": 0.1974, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10089796036481857, + "step": 4050, + "valid_targets_mean": 1573.2, + "valid_targets_min": 816 + }, + { + "epoch": 2.1241487689889995, + "grad_norm": 0.7093961681655364, + "learning_rate": 3.517022122697581e-05, + "loss": 0.1852, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09187100827693939, + "step": 4055, + "valid_targets_mean": 1310.8, + "valid_targets_min": 721 + }, + { + "epoch": 2.1267679413305394, + "grad_norm": 0.6856877135989632, + "learning_rate": 3.5153184752199407e-05, + "loss": 0.1835, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08593648672103882, + "step": 4060, + "valid_targets_mean": 1413.8, + "valid_targets_min": 785 + }, + { + "epoch": 2.1293871136720797, + "grad_norm": 0.7008541080505509, + "learning_rate": 3.513612242500248e-05, + "loss": 0.1879, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.129766047000885, + "step": 4065, + "valid_targets_mean": 2005.6, + "valid_targets_min": 734 + }, + { + "epoch": 2.1320062860136195, + "grad_norm": 0.6690436451371921, + "learning_rate": 3.511903427449459e-05, + "loss": 0.1922, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11221389472484589, + "step": 4070, + "valid_targets_mean": 1750.0, + "valid_targets_min": 744 + }, + { + "epoch": 2.13462545835516, + "grad_norm": 0.6992679651353025, + "learning_rate": 3.510192032982935e-05, + "loss": 0.1916, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11023158580064774, + "step": 4075, + "valid_targets_mean": 1856.8, + "valid_targets_min": 620 + }, + { + "epoch": 2.1372446306966997, + "grad_norm": 0.652670841490309, + "learning_rate": 3.508478062020437e-05, + "loss": 0.1839, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1008521318435669, + "step": 4080, + "valid_targets_mean": 1614.4, + "valid_targets_min": 949 + }, + { + "epoch": 2.13986380303824, + "grad_norm": 0.6280896076662544, + "learning_rate": 3.506761517486123e-05, + "loss": 0.1915, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09381900727748871, + "step": 4085, + "valid_targets_mean": 1898.5, + "valid_targets_min": 1078 + }, + { + "epoch": 2.14248297537978, + "grad_norm": 0.6953352163842283, + "learning_rate": 3.505042402308541e-05, + "loss": 0.1854, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09103520214557648, + "step": 4090, + "valid_targets_mean": 1538.6, + "valid_targets_min": 711 + }, + { + "epoch": 2.14510214772132, + "grad_norm": 0.711371271604788, + "learning_rate": 3.5033207194206245e-05, + "loss": 0.1918, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10047143697738647, + "step": 4095, + "valid_targets_mean": 1591.0, + "valid_targets_min": 1122 + }, + { + "epoch": 2.14772132006286, + "grad_norm": 0.701579462853468, + "learning_rate": 3.501596471759689e-05, + "loss": 0.1866, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08872205764055252, + "step": 4100, + "valid_targets_mean": 1377.5, + "valid_targets_min": 674 + }, + { + "epoch": 2.1503404924044003, + "grad_norm": 0.6937603851188818, + "learning_rate": 3.499869662267423e-05, + "loss": 0.1803, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07986070215702057, + "step": 4105, + "valid_targets_mean": 1198.6, + "valid_targets_min": 661 + }, + { + "epoch": 2.15295966474594, + "grad_norm": 0.7309748288880897, + "learning_rate": 3.498140293889889e-05, + "loss": 0.1782, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11420120298862457, + "step": 4110, + "valid_targets_mean": 1806.1, + "valid_targets_min": 1011 + }, + { + "epoch": 2.1555788370874804, + "grad_norm": 0.6495847377174823, + "learning_rate": 3.4964083695775136e-05, + "loss": 0.1924, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09754351526498795, + "step": 4115, + "valid_targets_mean": 1644.0, + "valid_targets_min": 1271 + }, + { + "epoch": 2.1581980094290203, + "grad_norm": 0.6451295156488667, + "learning_rate": 3.4946738922850825e-05, + "loss": 0.1832, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08996035158634186, + "step": 4120, + "valid_targets_mean": 1391.1, + "valid_targets_min": 812 + }, + { + "epoch": 2.1608171817705606, + "grad_norm": 0.6577673028743707, + "learning_rate": 3.49293686497174e-05, + "loss": 0.1879, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09317929297685623, + "step": 4125, + "valid_targets_mean": 1529.6, + "valid_targets_min": 954 + }, + { + "epoch": 2.1634363541121004, + "grad_norm": 0.6870101085446985, + "learning_rate": 3.491197290600978e-05, + "loss": 0.1884, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08796785771846771, + "step": 4130, + "valid_targets_mean": 1537.9, + "valid_targets_min": 1297 + }, + { + "epoch": 2.1660555264536407, + "grad_norm": 0.7033994409983768, + "learning_rate": 3.489455172140637e-05, + "loss": 0.1898, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0888407975435257, + "step": 4135, + "valid_targets_mean": 1411.9, + "valid_targets_min": 790 + }, + { + "epoch": 2.1686746987951806, + "grad_norm": 0.68174779726752, + "learning_rate": 3.487710512562894e-05, + "loss": 0.1868, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10044382512569427, + "step": 4140, + "valid_targets_mean": 1824.5, + "valid_targets_min": 592 + }, + { + "epoch": 2.171293871136721, + "grad_norm": 0.7058446912301533, + "learning_rate": 3.4859633148442644e-05, + "loss": 0.1881, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09607305377721786, + "step": 4145, + "valid_targets_mean": 1587.0, + "valid_targets_min": 662 + }, + { + "epoch": 2.1739130434782608, + "grad_norm": 0.7109324969687294, + "learning_rate": 3.4842135819655926e-05, + "loss": 0.1919, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08893938362598419, + "step": 4150, + "valid_targets_mean": 1366.5, + "valid_targets_min": 622 + }, + { + "epoch": 2.176532215819801, + "grad_norm": 0.7091820730051697, + "learning_rate": 3.482461316912049e-05, + "loss": 0.1868, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07064250111579895, + "step": 4155, + "valid_targets_mean": 1229.2, + "valid_targets_min": 625 + }, + { + "epoch": 2.179151388161341, + "grad_norm": 0.7304958338240904, + "learning_rate": 3.480706522673124e-05, + "loss": 0.1986, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09226875007152557, + "step": 4160, + "valid_targets_mean": 1548.0, + "valid_targets_min": 888 + }, + { + "epoch": 2.181770560502881, + "grad_norm": 0.8269923067529306, + "learning_rate": 3.47894920224262e-05, + "loss": 0.189, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07171830534934998, + "step": 4165, + "valid_targets_mean": 1331.6, + "valid_targets_min": 635 + }, + { + "epoch": 2.184389732844421, + "grad_norm": 0.7316829722718358, + "learning_rate": 3.477189358618655e-05, + "loss": 0.1957, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13178831338882446, + "step": 4170, + "valid_targets_mean": 1781.0, + "valid_targets_min": 522 + }, + { + "epoch": 2.1870089051859614, + "grad_norm": 0.6989346135672048, + "learning_rate": 3.4754269948036465e-05, + "loss": 0.1854, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08098998665809631, + "step": 4175, + "valid_targets_mean": 1283.8, + "valid_targets_min": 697 + }, + { + "epoch": 2.189628077527501, + "grad_norm": 0.6609140467070396, + "learning_rate": 3.473662113804314e-05, + "loss": 0.1806, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07369507849216461, + "step": 4180, + "valid_targets_mean": 1332.5, + "valid_targets_min": 869 + }, + { + "epoch": 2.1922472498690415, + "grad_norm": 0.7339790791732105, + "learning_rate": 3.4718947186316714e-05, + "loss": 0.1883, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08820786327123642, + "step": 4185, + "valid_targets_mean": 1341.1, + "valid_targets_min": 769 + }, + { + "epoch": 2.1948664222105814, + "grad_norm": 0.6865017670917262, + "learning_rate": 3.4701248123010214e-05, + "loss": 0.189, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08384440839290619, + "step": 4190, + "valid_targets_mean": 1329.4, + "valid_targets_min": 745 + }, + { + "epoch": 2.1974855945521217, + "grad_norm": 0.6817303509529443, + "learning_rate": 3.4683523978319514e-05, + "loss": 0.1815, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0841609388589859, + "step": 4195, + "valid_targets_mean": 1297.8, + "valid_targets_min": 680 + }, + { + "epoch": 2.2001047668936615, + "grad_norm": 0.6522827159862312, + "learning_rate": 3.4665774782483275e-05, + "loss": 0.1805, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11358039081096649, + "step": 4200, + "valid_targets_mean": 1903.4, + "valid_targets_min": 1323 + }, + { + "epoch": 2.202723939235202, + "grad_norm": 0.7825502975856193, + "learning_rate": 3.464800056578289e-05, + "loss": 0.1884, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10468216240406036, + "step": 4205, + "valid_targets_mean": 1449.0, + "valid_targets_min": 851 + }, + { + "epoch": 2.2053431115767417, + "grad_norm": 0.6706125180804291, + "learning_rate": 3.4630201358542476e-05, + "loss": 0.1901, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09529706090688705, + "step": 4210, + "valid_targets_mean": 1540.2, + "valid_targets_min": 903 + }, + { + "epoch": 2.207962283918282, + "grad_norm": 0.6309444219938192, + "learning_rate": 3.461237719112872e-05, + "loss": 0.1788, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09462803602218628, + "step": 4215, + "valid_targets_mean": 1497.5, + "valid_targets_min": 854 + }, + { + "epoch": 2.210581456259822, + "grad_norm": 0.5323564402683407, + "learning_rate": 3.459452809395097e-05, + "loss": 0.1783, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06672701984643936, + "step": 4220, + "valid_targets_mean": 1495.4, + "valid_targets_min": 917 + }, + { + "epoch": 2.213200628601362, + "grad_norm": 0.612533975177077, + "learning_rate": 3.457665409746103e-05, + "loss": 0.1688, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07375086843967438, + "step": 4225, + "valid_targets_mean": 1462.5, + "valid_targets_min": 930 + }, + { + "epoch": 2.215819800942902, + "grad_norm": 0.6502973513547888, + "learning_rate": 3.455875523215325e-05, + "loss": 0.1864, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08019331097602844, + "step": 4230, + "valid_targets_mean": 1464.4, + "valid_targets_min": 570 + }, + { + "epoch": 2.2184389732844423, + "grad_norm": 0.6362908081945943, + "learning_rate": 3.454083152856435e-05, + "loss": 0.1828, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09245746582746506, + "step": 4235, + "valid_targets_mean": 1536.1, + "valid_targets_min": 870 + }, + { + "epoch": 2.221058145625982, + "grad_norm": 0.6704801346208137, + "learning_rate": 3.452288301727348e-05, + "loss": 0.1849, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09293714165687561, + "step": 4240, + "valid_targets_mean": 1563.5, + "valid_targets_min": 1215 + }, + { + "epoch": 2.2236773179675224, + "grad_norm": 0.6738442410852162, + "learning_rate": 3.450490972890208e-05, + "loss": 0.1884, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0857582688331604, + "step": 4245, + "valid_targets_mean": 1545.9, + "valid_targets_min": 1214 + }, + { + "epoch": 2.2262964903090623, + "grad_norm": 0.7121593190212068, + "learning_rate": 3.448691169411386e-05, + "loss": 0.1798, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11348661035299301, + "step": 4250, + "valid_targets_mean": 1675.2, + "valid_targets_min": 591 + }, + { + "epoch": 2.2289156626506026, + "grad_norm": 0.7297488641520847, + "learning_rate": 3.446888894361477e-05, + "loss": 0.1933, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09707330167293549, + "step": 4255, + "valid_targets_mean": 1329.6, + "valid_targets_min": 646 + }, + { + "epoch": 2.2315348349921424, + "grad_norm": 0.4715234550471819, + "learning_rate": 3.445084150815292e-05, + "loss": 0.1984, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08680760860443115, + "step": 4260, + "valid_targets_mean": 5262.4, + "valid_targets_min": 4751 + }, + { + "epoch": 2.2341540073336827, + "grad_norm": 0.5179432162410191, + "learning_rate": 3.443276941851851e-05, + "loss": 0.1965, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10530431568622589, + "step": 4265, + "valid_targets_mean": 8557.5, + "valid_targets_min": 5164 + }, + { + "epoch": 2.2367731796752226, + "grad_norm": 0.35189088859712925, + "learning_rate": 3.4414672705543836e-05, + "loss": 0.1871, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08838881552219391, + "step": 4270, + "valid_targets_mean": 6448.5, + "valid_targets_min": 4342 + }, + { + "epoch": 2.239392352016763, + "grad_norm": 0.3967730785170395, + "learning_rate": 3.43965514001032e-05, + "loss": 0.1884, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08274708688259125, + "step": 4275, + "valid_targets_mean": 5300.6, + "valid_targets_min": 3853 + }, + { + "epoch": 2.2420115243583028, + "grad_norm": 0.3914698796402864, + "learning_rate": 3.437840553311282e-05, + "loss": 0.1944, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1191055178642273, + "step": 4280, + "valid_targets_mean": 5632.0, + "valid_targets_min": 4669 + }, + { + "epoch": 2.244630696699843, + "grad_norm": 0.3826804658437182, + "learning_rate": 3.436023513553087e-05, + "loss": 0.1985, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10407496988773346, + "step": 4285, + "valid_targets_mean": 6666.6, + "valid_targets_min": 5144 + }, + { + "epoch": 2.247249869041383, + "grad_norm": 0.40704622259157347, + "learning_rate": 3.434204023835735e-05, + "loss": 0.194, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10071707516908646, + "step": 4290, + "valid_targets_mean": 5754.6, + "valid_targets_min": 4350 + }, + { + "epoch": 2.249869041382923, + "grad_norm": 0.35141069529027763, + "learning_rate": 3.432382087263405e-05, + "loss": 0.1839, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09793560206890106, + "step": 4295, + "valid_targets_mean": 6102.2, + "valid_targets_min": 3934 + }, + { + "epoch": 2.252488213724463, + "grad_norm": 0.41169499298812734, + "learning_rate": 3.430557706944452e-05, + "loss": 0.2143, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08575282990932465, + "step": 4300, + "valid_targets_mean": 6471.4, + "valid_targets_min": 5231 + }, + { + "epoch": 2.255107386066003, + "grad_norm": 0.40526461109259, + "learning_rate": 3.4287308859914e-05, + "loss": 0.1874, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10314113646745682, + "step": 4305, + "valid_targets_mean": 6736.8, + "valid_targets_min": 5062 + }, + { + "epoch": 2.257726558407543, + "grad_norm": 0.6096771286476559, + "learning_rate": 3.426901627520937e-05, + "loss": 0.1948, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0975448489189148, + "step": 4310, + "valid_targets_mean": 3416.1, + "valid_targets_min": 229 + }, + { + "epoch": 2.2603457307490835, + "grad_norm": 0.36027677446290235, + "learning_rate": 3.425069934653907e-05, + "loss": 0.1839, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09143798798322678, + "step": 4315, + "valid_targets_mean": 6196.9, + "valid_targets_min": 4508 + }, + { + "epoch": 2.2629649030906234, + "grad_norm": 0.39418300333836775, + "learning_rate": 3.423235810515313e-05, + "loss": 0.1935, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09388123452663422, + "step": 4320, + "valid_targets_mean": 5994.6, + "valid_targets_min": 4673 + }, + { + "epoch": 2.2655840754321632, + "grad_norm": 0.32210755336423735, + "learning_rate": 3.4213992582343e-05, + "loss": 0.1754, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0751730352640152, + "step": 4325, + "valid_targets_mean": 6293.1, + "valid_targets_min": 4995 + }, + { + "epoch": 2.2682032477737035, + "grad_norm": 0.44027247201770786, + "learning_rate": 3.419560280944158e-05, + "loss": 0.1745, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10627452284097672, + "step": 4330, + "valid_targets_mean": 5654.2, + "valid_targets_min": 4108 + }, + { + "epoch": 2.270822420115244, + "grad_norm": 0.3914400928933456, + "learning_rate": 3.417718881782315e-05, + "loss": 0.1831, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12119898200035095, + "step": 4335, + "valid_targets_mean": 7076.8, + "valid_targets_min": 4527 + }, + { + "epoch": 2.2734415924567837, + "grad_norm": 0.5025289124302289, + "learning_rate": 3.41587506389033e-05, + "loss": 0.1982, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11772619932889938, + "step": 4340, + "valid_targets_mean": 2271.2, + "valid_targets_min": 1783 + }, + { + "epoch": 2.2760607647983235, + "grad_norm": 0.37806515377016836, + "learning_rate": 3.4140288304138885e-05, + "loss": 0.1659, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0790642648935318, + "step": 4345, + "valid_targets_mean": 6375.6, + "valid_targets_min": 5316 + }, + { + "epoch": 2.278679937139864, + "grad_norm": 0.3847792712836001, + "learning_rate": 3.4121801845027965e-05, + "loss": 0.1722, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09972573816776276, + "step": 4350, + "valid_targets_mean": 6093.6, + "valid_targets_min": 5056 + }, + { + "epoch": 2.2812991094814037, + "grad_norm": 0.35680978232665095, + "learning_rate": 3.410329129310977e-05, + "loss": 0.1717, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09506428241729736, + "step": 4355, + "valid_targets_mean": 7712.4, + "valid_targets_min": 2834 + }, + { + "epoch": 2.283918281822944, + "grad_norm": 0.37489894585228845, + "learning_rate": 3.4084756679964645e-05, + "loss": 0.2041, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11063200235366821, + "step": 4360, + "valid_targets_mean": 7032.0, + "valid_targets_min": 4181 + }, + { + "epoch": 2.286537454164484, + "grad_norm": 0.34295699089468396, + "learning_rate": 3.4066198037213956e-05, + "loss": 0.1834, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08322663605213165, + "step": 4365, + "valid_targets_mean": 7101.1, + "valid_targets_min": 4689 + }, + { + "epoch": 2.289156626506024, + "grad_norm": 0.3670372159304986, + "learning_rate": 3.4047615396520073e-05, + "loss": 0.1805, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08686234056949615, + "step": 4370, + "valid_targets_mean": 6668.0, + "valid_targets_min": 4670 + }, + { + "epoch": 2.291775798847564, + "grad_norm": 0.37134005811384047, + "learning_rate": 3.402900878958633e-05, + "loss": 0.1917, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11375340819358826, + "step": 4375, + "valid_targets_mean": 7794.4, + "valid_targets_min": 4501 + }, + { + "epoch": 2.2943949711891043, + "grad_norm": 0.4295427738825388, + "learning_rate": 3.4010378248156925e-05, + "loss": 0.2027, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09965578466653824, + "step": 4380, + "valid_targets_mean": 6428.1, + "valid_targets_min": 4998 + }, + { + "epoch": 2.297014143530644, + "grad_norm": 0.389803008593126, + "learning_rate": 3.39917238040169e-05, + "loss": 0.2194, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09798961132764816, + "step": 4385, + "valid_targets_mean": 6159.2, + "valid_targets_min": 4640 + }, + { + "epoch": 2.2996333158721844, + "grad_norm": 0.3775684215634937, + "learning_rate": 3.397304548899207e-05, + "loss": 0.2003, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0962294191122055, + "step": 4390, + "valid_targets_mean": 6138.4, + "valid_targets_min": 4800 + }, + { + "epoch": 2.3022524882137243, + "grad_norm": 0.4164029673006619, + "learning_rate": 3.395434333494899e-05, + "loss": 0.1918, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11183840781450272, + "step": 4395, + "valid_targets_mean": 6040.1, + "valid_targets_min": 4455 + }, + { + "epoch": 2.3048716605552646, + "grad_norm": 0.38789717205487884, + "learning_rate": 3.3935617373794875e-05, + "loss": 0.185, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09181490540504456, + "step": 4400, + "valid_targets_mean": 6714.5, + "valid_targets_min": 4891 + }, + { + "epoch": 2.3074908328968045, + "grad_norm": 0.40947172820355565, + "learning_rate": 3.391686763747755e-05, + "loss": 0.1972, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1077517420053482, + "step": 4405, + "valid_targets_mean": 5823.5, + "valid_targets_min": 4710 + }, + { + "epoch": 2.3101100052383448, + "grad_norm": 0.3550831915380223, + "learning_rate": 3.3898094157985424e-05, + "loss": 0.1871, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08461962640285492, + "step": 4410, + "valid_targets_mean": 6401.5, + "valid_targets_min": 5370 + }, + { + "epoch": 2.3127291775798846, + "grad_norm": 0.39518422640270573, + "learning_rate": 3.3879296967347386e-05, + "loss": 0.1934, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09296444058418274, + "step": 4415, + "valid_targets_mean": 6424.5, + "valid_targets_min": 4608 + }, + { + "epoch": 2.315348349921425, + "grad_norm": 0.38336885075106303, + "learning_rate": 3.38604760976328e-05, + "loss": 0.1926, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08820196986198425, + "step": 4420, + "valid_targets_mean": 5586.1, + "valid_targets_min": 4580 + }, + { + "epoch": 2.3179675222629648, + "grad_norm": 0.539587906084315, + "learning_rate": 3.3841631580951414e-05, + "loss": 0.1914, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09103749692440033, + "step": 4425, + "valid_targets_mean": 6329.4, + "valid_targets_min": 4754 + }, + { + "epoch": 2.320586694604505, + "grad_norm": 0.3132796125370284, + "learning_rate": 3.382276344945334e-05, + "loss": 0.1655, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07120954990386963, + "step": 4430, + "valid_targets_mean": 7311.5, + "valid_targets_min": 6287 + }, + { + "epoch": 2.323205866946045, + "grad_norm": 0.3786549569109157, + "learning_rate": 3.380387173532895e-05, + "loss": 0.179, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10338225960731506, + "step": 4435, + "valid_targets_mean": 7010.4, + "valid_targets_min": 3468 + }, + { + "epoch": 2.325825039287585, + "grad_norm": 0.354358681080531, + "learning_rate": 3.378495647080886e-05, + "loss": 0.1925, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09100731462240219, + "step": 4440, + "valid_targets_mean": 6255.4, + "valid_targets_min": 5221 + }, + { + "epoch": 2.328444211629125, + "grad_norm": 0.36484120389471236, + "learning_rate": 3.376601768816388e-05, + "loss": 0.1926, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08618143945932388, + "step": 4445, + "valid_targets_mean": 6060.5, + "valid_targets_min": 4438 + }, + { + "epoch": 2.3310633839706654, + "grad_norm": 0.38168634070322494, + "learning_rate": 3.374705541970494e-05, + "loss": 0.1855, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09062792360782623, + "step": 4450, + "valid_targets_mean": 5617.6, + "valid_targets_min": 3915 + }, + { + "epoch": 2.3336825563122052, + "grad_norm": 0.3182791292068853, + "learning_rate": 3.372806969778302e-05, + "loss": 0.1773, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06596499681472778, + "step": 4455, + "valid_targets_mean": 5274.1, + "valid_targets_min": 4135 + }, + { + "epoch": 2.3363017286537455, + "grad_norm": 0.3980520306984013, + "learning_rate": 3.3709060554789114e-05, + "loss": 0.1854, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11008140444755554, + "step": 4460, + "valid_targets_mean": 6510.1, + "valid_targets_min": 4295 + }, + { + "epoch": 2.3389209009952854, + "grad_norm": 0.399551997504261, + "learning_rate": 3.36900280231542e-05, + "loss": 0.1856, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.110128253698349, + "step": 4465, + "valid_targets_mean": 6065.0, + "valid_targets_min": 4865 + }, + { + "epoch": 2.3415400733368257, + "grad_norm": 0.38392949159985834, + "learning_rate": 3.3670972135349136e-05, + "loss": 0.1854, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09090718626976013, + "step": 4470, + "valid_targets_mean": 6150.2, + "valid_targets_min": 4643 + }, + { + "epoch": 2.3441592456783655, + "grad_norm": 0.35208214019483036, + "learning_rate": 3.365189292388463e-05, + "loss": 0.1763, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09005999565124512, + "step": 4475, + "valid_targets_mean": 6384.5, + "valid_targets_min": 4705 + }, + { + "epoch": 2.346778418019906, + "grad_norm": 0.3846867579860675, + "learning_rate": 3.36327904213112e-05, + "loss": 0.2026, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09906090795993805, + "step": 4480, + "valid_targets_mean": 5637.6, + "valid_targets_min": 4652 + }, + { + "epoch": 2.3493975903614457, + "grad_norm": 0.36982382045858164, + "learning_rate": 3.361366466021907e-05, + "loss": 0.1652, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07524531334638596, + "step": 4485, + "valid_targets_mean": 5898.2, + "valid_targets_min": 5007 + }, + { + "epoch": 2.352016762702986, + "grad_norm": 0.3586455082897619, + "learning_rate": 3.3594515673238164e-05, + "loss": 0.1613, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08170197904109955, + "step": 4490, + "valid_targets_mean": 5927.9, + "valid_targets_min": 4546 + }, + { + "epoch": 2.354635935044526, + "grad_norm": 0.3627252830677402, + "learning_rate": 3.357534349303804e-05, + "loss": 0.1652, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08540515601634979, + "step": 4495, + "valid_targets_mean": 5954.4, + "valid_targets_min": 3200 + }, + { + "epoch": 2.357255107386066, + "grad_norm": 0.35767876753365935, + "learning_rate": 3.3556148152327796e-05, + "loss": 0.1716, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08642897009849548, + "step": 4500, + "valid_targets_mean": 6702.5, + "valid_targets_min": 5010 + }, + { + "epoch": 2.359874279727606, + "grad_norm": 0.38355130876545307, + "learning_rate": 3.3536929683856075e-05, + "loss": 0.193, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0961657464504242, + "step": 4505, + "valid_targets_mean": 6308.1, + "valid_targets_min": 4904 + }, + { + "epoch": 2.3624934520691463, + "grad_norm": 0.39846948733145526, + "learning_rate": 3.351768812041095e-05, + "loss": 0.2206, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11881693452596664, + "step": 4510, + "valid_targets_mean": 6365.5, + "valid_targets_min": 5081 + }, + { + "epoch": 2.365112624410686, + "grad_norm": 0.4071323760198838, + "learning_rate": 3.349842349481992e-05, + "loss": 0.1888, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07891501486301422, + "step": 4515, + "valid_targets_mean": 4943.8, + "valid_targets_min": 3629 + }, + { + "epoch": 2.3677317967522264, + "grad_norm": 0.3910265333978852, + "learning_rate": 3.347913583994982e-05, + "loss": 0.1807, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09046255052089691, + "step": 4520, + "valid_targets_mean": 6236.2, + "valid_targets_min": 4324 + }, + { + "epoch": 2.3703509690937663, + "grad_norm": 0.35925362948621203, + "learning_rate": 3.345982518870676e-05, + "loss": 0.1842, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07996508479118347, + "step": 4525, + "valid_targets_mean": 7204.9, + "valid_targets_min": 4920 + }, + { + "epoch": 2.3729701414353066, + "grad_norm": 0.3790145575135124, + "learning_rate": 3.344049157403611e-05, + "loss": 0.1932, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0945851132273674, + "step": 4530, + "valid_targets_mean": 6281.5, + "valid_targets_min": 4882 + }, + { + "epoch": 2.3755893137768465, + "grad_norm": 0.3562095630949342, + "learning_rate": 3.342113502892239e-05, + "loss": 0.1976, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09100031852722168, + "step": 4535, + "valid_targets_mean": 7296.2, + "valid_targets_min": 3943 + }, + { + "epoch": 2.3782084861183868, + "grad_norm": 0.3889102556751455, + "learning_rate": 3.340175558638927e-05, + "loss": 0.1876, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10129101574420929, + "step": 4540, + "valid_targets_mean": 7207.0, + "valid_targets_min": 5382 + }, + { + "epoch": 2.3808276584599266, + "grad_norm": 0.3616664728118041, + "learning_rate": 3.338235327949946e-05, + "loss": 0.1862, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09182766079902649, + "step": 4545, + "valid_targets_mean": 6385.6, + "valid_targets_min": 4461 + }, + { + "epoch": 2.383446830801467, + "grad_norm": 0.35250339413631243, + "learning_rate": 3.3362928141354697e-05, + "loss": 0.1762, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08577057719230652, + "step": 4550, + "valid_targets_mean": 7383.1, + "valid_targets_min": 5364 + }, + { + "epoch": 2.3860660031430068, + "grad_norm": 0.3613497836153022, + "learning_rate": 3.334348020509565e-05, + "loss": 0.1753, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0901482105255127, + "step": 4555, + "valid_targets_mean": 5899.0, + "valid_targets_min": 4444 + }, + { + "epoch": 2.388685175484547, + "grad_norm": 0.3732680956771438, + "learning_rate": 3.332400950390189e-05, + "loss": 0.2313, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09998985379934311, + "step": 4560, + "valid_targets_mean": 6466.9, + "valid_targets_min": 4474 + }, + { + "epoch": 2.391304347826087, + "grad_norm": 0.3215897801694627, + "learning_rate": 3.330451607099185e-05, + "loss": 0.1763, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09537540376186371, + "step": 4565, + "valid_targets_mean": 7983.6, + "valid_targets_min": 6076 + }, + { + "epoch": 2.393923520167627, + "grad_norm": 0.359957824578163, + "learning_rate": 3.328499993962271e-05, + "loss": 0.1772, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09370891749858856, + "step": 4570, + "valid_targets_mean": 6965.8, + "valid_targets_min": 4718 + }, + { + "epoch": 2.396542692509167, + "grad_norm": 0.361204202925108, + "learning_rate": 3.326546114309039e-05, + "loss": 0.1899, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09906766563653946, + "step": 4575, + "valid_targets_mean": 6808.2, + "valid_targets_min": 4714 + }, + { + "epoch": 2.3991618648507074, + "grad_norm": 0.3826464800023626, + "learning_rate": 3.324589971472949e-05, + "loss": 0.1861, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08802899718284607, + "step": 4580, + "valid_targets_mean": 5286.5, + "valid_targets_min": 3828 + }, + { + "epoch": 2.4017810371922472, + "grad_norm": 0.35754151744307855, + "learning_rate": 3.32263156879132e-05, + "loss": 0.1622, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07199066132307053, + "step": 4585, + "valid_targets_mean": 6731.1, + "valid_targets_min": 5089 + }, + { + "epoch": 2.4044002095337875, + "grad_norm": 0.3830574411711552, + "learning_rate": 3.320670909605328e-05, + "loss": 0.1822, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08338411152362823, + "step": 4590, + "valid_targets_mean": 6523.9, + "valid_targets_min": 4509 + }, + { + "epoch": 2.4070193818753274, + "grad_norm": 0.3766898876673147, + "learning_rate": 3.318707997259998e-05, + "loss": 0.1688, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10137352347373962, + "step": 4595, + "valid_targets_mean": 7736.0, + "valid_targets_min": 5193 + }, + { + "epoch": 2.4096385542168672, + "grad_norm": 0.35915128351202785, + "learning_rate": 3.3167428351042e-05, + "loss": 0.1706, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0861617922782898, + "step": 4600, + "valid_targets_mean": 6165.9, + "valid_targets_min": 4343 + }, + { + "epoch": 2.4122577265584075, + "grad_norm": 0.36197540903740943, + "learning_rate": 3.31477542649064e-05, + "loss": 0.1758, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0850772112607956, + "step": 4605, + "valid_targets_mean": 6185.9, + "valid_targets_min": 4815 + }, + { + "epoch": 2.414876898899948, + "grad_norm": 0.33820687033900637, + "learning_rate": 3.31280577477586e-05, + "loss": 0.1796, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07993307709693909, + "step": 4610, + "valid_targets_mean": 7682.5, + "valid_targets_min": 5751 + }, + { + "epoch": 2.4174960712414877, + "grad_norm": 0.34784080140637824, + "learning_rate": 3.310833883320227e-05, + "loss": 0.1711, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08610358089208603, + "step": 4615, + "valid_targets_mean": 6375.6, + "valid_targets_min": 3977 + }, + { + "epoch": 2.4201152435830275, + "grad_norm": 0.39648090166834754, + "learning_rate": 3.3088597554879275e-05, + "loss": 0.1823, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09887340664863586, + "step": 4620, + "valid_targets_mean": 6607.8, + "valid_targets_min": 5098 + }, + { + "epoch": 2.422734415924568, + "grad_norm": 0.44055110866968583, + "learning_rate": 3.3068833946469677e-05, + "loss": 0.1876, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10944779962301254, + "step": 4625, + "valid_targets_mean": 5749.6, + "valid_targets_min": 4550 + }, + { + "epoch": 2.425353588266108, + "grad_norm": 0.4129639305919711, + "learning_rate": 3.30490480416916e-05, + "loss": 0.189, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09889828413724899, + "step": 4630, + "valid_targets_mean": 5552.6, + "valid_targets_min": 3619 + }, + { + "epoch": 2.427972760607648, + "grad_norm": 0.6992836949420002, + "learning_rate": 3.302923987430121e-05, + "loss": 0.2792, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1501704752445221, + "step": 4635, + "valid_targets_mean": 3486.5, + "valid_targets_min": 770 + }, + { + "epoch": 2.430591932949188, + "grad_norm": 0.49681113723633175, + "learning_rate": 3.3009409478092664e-05, + "loss": 0.2761, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12776651978492737, + "step": 4640, + "valid_targets_mean": 4703.8, + "valid_targets_min": 1799 + }, + { + "epoch": 2.433211105290728, + "grad_norm": 0.483795517262897, + "learning_rate": 3.298955688689805e-05, + "loss": 0.2688, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13452821969985962, + "step": 4645, + "valid_targets_mean": 5730.6, + "valid_targets_min": 3015 + }, + { + "epoch": 2.4358302776322684, + "grad_norm": 0.4451395934905341, + "learning_rate": 3.296968213458731e-05, + "loss": 0.2657, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12698446214199066, + "step": 4650, + "valid_targets_mean": 5475.6, + "valid_targets_min": 1841 + }, + { + "epoch": 2.4384494499738083, + "grad_norm": 0.568085783596915, + "learning_rate": 3.294978525506819e-05, + "loss": 0.2793, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16987842321395874, + "step": 4655, + "valid_targets_mean": 4238.2, + "valid_targets_min": 1374 + }, + { + "epoch": 2.441068622315348, + "grad_norm": 0.5399690888229732, + "learning_rate": 3.29298662822862e-05, + "loss": 0.275, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14218473434448242, + "step": 4660, + "valid_targets_mean": 4297.9, + "valid_targets_min": 1951 + }, + { + "epoch": 2.4436877946568885, + "grad_norm": 0.4665755676585302, + "learning_rate": 3.290992525022455e-05, + "loss": 0.2651, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10295194387435913, + "step": 4665, + "valid_targets_mean": 3986.4, + "valid_targets_min": 967 + }, + { + "epoch": 2.4463069669984283, + "grad_norm": 0.4810606992303234, + "learning_rate": 3.288996219290405e-05, + "loss": 0.272, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14516176283359528, + "step": 4670, + "valid_targets_mean": 5266.1, + "valid_targets_min": 1831 + }, + { + "epoch": 2.4489261393399686, + "grad_norm": 0.5548954720725366, + "learning_rate": 3.2869977144383114e-05, + "loss": 0.2805, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13955682516098022, + "step": 4675, + "valid_targets_mean": 3626.9, + "valid_targets_min": 2077 + }, + { + "epoch": 2.4515453116815085, + "grad_norm": 0.4881601822284099, + "learning_rate": 3.2849970138757675e-05, + "loss": 0.2732, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12774524092674255, + "step": 4680, + "valid_targets_mean": 4431.5, + "valid_targets_min": 2834 + }, + { + "epoch": 2.4541644840230488, + "grad_norm": 0.5286262928112249, + "learning_rate": 3.2829941210161106e-05, + "loss": 0.2765, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14698627591133118, + "step": 4685, + "valid_targets_mean": 4406.6, + "valid_targets_min": 1873 + }, + { + "epoch": 2.4567836563645886, + "grad_norm": 0.4622668282561899, + "learning_rate": 3.2809890392764216e-05, + "loss": 0.2653, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12009242177009583, + "step": 4690, + "valid_targets_mean": 3873.5, + "valid_targets_min": 1013 + }, + { + "epoch": 2.459402828706129, + "grad_norm": 0.5705828101329861, + "learning_rate": 3.2789817720775126e-05, + "loss": 0.2747, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14647673070430756, + "step": 4695, + "valid_targets_mean": 4464.8, + "valid_targets_min": 1939 + }, + { + "epoch": 2.4620220010476688, + "grad_norm": 0.58339715082754, + "learning_rate": 3.2769723228439265e-05, + "loss": 0.2698, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16818226873874664, + "step": 4700, + "valid_targets_mean": 4397.6, + "valid_targets_min": 2391 + }, + { + "epoch": 2.464641173389209, + "grad_norm": 0.6181542558710681, + "learning_rate": 3.274960695003927e-05, + "loss": 0.2812, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18955881893634796, + "step": 4705, + "valid_targets_mean": 4258.1, + "valid_targets_min": 1589 + }, + { + "epoch": 2.467260345730749, + "grad_norm": 0.521980103704629, + "learning_rate": 3.272946891989495e-05, + "loss": 0.2645, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12609046697616577, + "step": 4710, + "valid_targets_mean": 4111.2, + "valid_targets_min": 1840 + }, + { + "epoch": 2.4698795180722892, + "grad_norm": 0.5491561012683551, + "learning_rate": 3.2709309172363236e-05, + "loss": 0.2735, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13917270302772522, + "step": 4715, + "valid_targets_mean": 3903.1, + "valid_targets_min": 1269 + }, + { + "epoch": 2.472498690413829, + "grad_norm": 0.5919069763103967, + "learning_rate": 3.268912774183811e-05, + "loss": 0.2854, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13042256236076355, + "step": 4720, + "valid_targets_mean": 3429.4, + "valid_targets_min": 1695 + }, + { + "epoch": 2.4751178627553694, + "grad_norm": 0.5622471486979514, + "learning_rate": 3.2668924662750535e-05, + "loss": 0.2826, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16786539554595947, + "step": 4725, + "valid_targets_mean": 4396.5, + "valid_targets_min": 1542 + }, + { + "epoch": 2.4777370350969092, + "grad_norm": 0.599374258150151, + "learning_rate": 3.2648699969568415e-05, + "loss": 0.2677, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1258111596107483, + "step": 4730, + "valid_targets_mean": 3763.1, + "valid_targets_min": 1438 + }, + { + "epoch": 2.4803562074384495, + "grad_norm": 0.5574771684252116, + "learning_rate": 3.262845369679652e-05, + "loss": 0.2798, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14597754180431366, + "step": 4735, + "valid_targets_mean": 4322.0, + "valid_targets_min": 2080 + }, + { + "epoch": 2.4829753797799894, + "grad_norm": 0.5335917055886615, + "learning_rate": 3.260818587897646e-05, + "loss": 0.2668, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11487531661987305, + "step": 4740, + "valid_targets_mean": 3656.5, + "valid_targets_min": 1026 + }, + { + "epoch": 2.4855945521215297, + "grad_norm": 0.6647589643530221, + "learning_rate": 3.258789655068657e-05, + "loss": 0.2549, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14061737060546875, + "step": 4745, + "valid_targets_mean": 3275.9, + "valid_targets_min": 1772 + }, + { + "epoch": 2.4882137244630695, + "grad_norm": 0.5828423175607111, + "learning_rate": 3.256758574654191e-05, + "loss": 0.2731, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14968352019786835, + "step": 4750, + "valid_targets_mean": 3340.6, + "valid_targets_min": 1588 + }, + { + "epoch": 2.49083289680461, + "grad_norm": 0.6068833100306307, + "learning_rate": 3.254725350119416e-05, + "loss": 0.2738, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12587854266166687, + "step": 4755, + "valid_targets_mean": 3175.5, + "valid_targets_min": 1276 + }, + { + "epoch": 2.4934520691461497, + "grad_norm": 0.4952352072659673, + "learning_rate": 3.2526899849331604e-05, + "loss": 0.2669, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11407821625471115, + "step": 4760, + "valid_targets_mean": 4294.9, + "valid_targets_min": 1631 + }, + { + "epoch": 2.49607124148769, + "grad_norm": 0.5488663596585718, + "learning_rate": 3.250652482567902e-05, + "loss": 0.2759, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16853857040405273, + "step": 4765, + "valid_targets_mean": 5289.8, + "valid_targets_min": 3090 + }, + { + "epoch": 2.49869041382923, + "grad_norm": 0.6661768035799297, + "learning_rate": 3.248612846499767e-05, + "loss": 0.2595, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13370314240455627, + "step": 4770, + "valid_targets_mean": 3234.0, + "valid_targets_min": 1446 + }, + { + "epoch": 2.50130958617077, + "grad_norm": 0.6239150762558955, + "learning_rate": 3.24657108020852e-05, + "loss": 0.2749, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13287469744682312, + "step": 4775, + "valid_targets_mean": 3117.9, + "valid_targets_min": 1685 + }, + { + "epoch": 2.50392875851231, + "grad_norm": 0.5235567064263872, + "learning_rate": 3.244527187177561e-05, + "loss": 0.2598, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12638260424137115, + "step": 4780, + "valid_targets_mean": 3541.6, + "valid_targets_min": 1596 + }, + { + "epoch": 2.5065479308538503, + "grad_norm": 0.6633883278924252, + "learning_rate": 3.2424811708939186e-05, + "loss": 0.2637, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14612677693367004, + "step": 4785, + "valid_targets_mean": 5101.5, + "valid_targets_min": 2251 + }, + { + "epoch": 2.50916710319539, + "grad_norm": 0.650243258812906, + "learning_rate": 3.240433034848243e-05, + "loss": 0.2641, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1239681988954544, + "step": 4790, + "valid_targets_mean": 2717.9, + "valid_targets_min": 1458 + }, + { + "epoch": 2.5117862755369305, + "grad_norm": 0.6162560405529081, + "learning_rate": 3.238382782534802e-05, + "loss": 0.2714, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11557632684707642, + "step": 4795, + "valid_targets_mean": 3202.1, + "valid_targets_min": 1162 + }, + { + "epoch": 2.5144054478784703, + "grad_norm": 0.6153507368134533, + "learning_rate": 3.236330417451472e-05, + "loss": 0.2622, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1267622411251068, + "step": 4800, + "valid_targets_mean": 3012.8, + "valid_targets_min": 1480 + }, + { + "epoch": 2.5170246202200106, + "grad_norm": 0.5956133163742262, + "learning_rate": 3.234275943099736e-05, + "loss": 0.2721, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14925609529018402, + "step": 4805, + "valid_targets_mean": 3682.4, + "valid_targets_min": 1229 + }, + { + "epoch": 2.5196437925615505, + "grad_norm": 0.6351685164908751, + "learning_rate": 3.232219362984674e-05, + "loss": 0.2691, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14006267488002777, + "step": 4810, + "valid_targets_mean": 3763.1, + "valid_targets_min": 1276 + }, + { + "epoch": 2.5222629649030908, + "grad_norm": 0.6162058804285464, + "learning_rate": 3.23016068061496e-05, + "loss": 0.2617, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11890268325805664, + "step": 4815, + "valid_targets_mean": 3172.8, + "valid_targets_min": 1208 + }, + { + "epoch": 2.5248821372446306, + "grad_norm": 0.5749928458656193, + "learning_rate": 3.228099899502853e-05, + "loss": 0.2603, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12680307030677795, + "step": 4820, + "valid_targets_mean": 3354.0, + "valid_targets_min": 924 + }, + { + "epoch": 2.527501309586171, + "grad_norm": 0.5724131019946627, + "learning_rate": 3.226037023164194e-05, + "loss": 0.267, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13974511623382568, + "step": 4825, + "valid_targets_mean": 4218.9, + "valid_targets_min": 1531 + }, + { + "epoch": 2.5301204819277108, + "grad_norm": 0.5910025466904364, + "learning_rate": 3.223972055118398e-05, + "loss": 0.2672, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13048329949378967, + "step": 4830, + "valid_targets_mean": 3040.9, + "valid_targets_min": 1643 + }, + { + "epoch": 2.532739654269251, + "grad_norm": 0.567667815004245, + "learning_rate": 3.221904998888448e-05, + "loss": 0.2596, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15320153534412384, + "step": 4835, + "valid_targets_mean": 4129.6, + "valid_targets_min": 1244 + }, + { + "epoch": 2.535358826610791, + "grad_norm": 0.5616875504141101, + "learning_rate": 3.219835858000892e-05, + "loss": 0.2719, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11181098222732544, + "step": 4840, + "valid_targets_mean": 3491.1, + "valid_targets_min": 730 + }, + { + "epoch": 2.5379779989523312, + "grad_norm": 0.6548795772657205, + "learning_rate": 3.217764635985831e-05, + "loss": 0.2657, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11994566023349762, + "step": 4845, + "valid_targets_mean": 3085.4, + "valid_targets_min": 977 + }, + { + "epoch": 2.540597171293871, + "grad_norm": 0.5326832519042694, + "learning_rate": 3.215691336376919e-05, + "loss": 0.2576, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13010746240615845, + "step": 4850, + "valid_targets_mean": 4896.9, + "valid_targets_min": 2091 + }, + { + "epoch": 2.543216343635411, + "grad_norm": 0.5801183408858036, + "learning_rate": 3.213615962711354e-05, + "loss": 0.2525, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1055474579334259, + "step": 4855, + "valid_targets_mean": 3125.9, + "valid_targets_min": 1654 + }, + { + "epoch": 2.5458355159769512, + "grad_norm": 0.5219430315952756, + "learning_rate": 3.211538518529872e-05, + "loss": 0.2731, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12499532848596573, + "step": 4860, + "valid_targets_mean": 4228.1, + "valid_targets_min": 1432 + }, + { + "epoch": 2.5484546883184915, + "grad_norm": 0.5512349112170226, + "learning_rate": 3.209459007376744e-05, + "loss": 0.2596, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1550905406475067, + "step": 4865, + "valid_targets_mean": 4512.6, + "valid_targets_min": 2422 + }, + { + "epoch": 2.5510738606600314, + "grad_norm": 0.6283528677051325, + "learning_rate": 3.207377432799762e-05, + "loss": 0.2697, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1240365281701088, + "step": 4870, + "valid_targets_mean": 3584.2, + "valid_targets_min": 1124 + }, + { + "epoch": 2.5536930330015712, + "grad_norm": 0.5565275234233498, + "learning_rate": 3.205293798350243e-05, + "loss": 0.2647, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13041697442531586, + "step": 4875, + "valid_targets_mean": 3950.6, + "valid_targets_min": 1219 + }, + { + "epoch": 2.5563122053431115, + "grad_norm": 0.5639979123752346, + "learning_rate": 3.203208107583017e-05, + "loss": 0.2721, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14429600536823273, + "step": 4880, + "valid_targets_mean": 3843.0, + "valid_targets_min": 1328 + }, + { + "epoch": 2.558931377684652, + "grad_norm": 0.6039266296646495, + "learning_rate": 3.201120364056422e-05, + "loss": 0.2547, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11220163851976395, + "step": 4885, + "valid_targets_mean": 2625.0, + "valid_targets_min": 916 + }, + { + "epoch": 2.5615505500261917, + "grad_norm": 0.5575623583731243, + "learning_rate": 3.199030571332299e-05, + "loss": 0.2734, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08969323337078094, + "step": 4890, + "valid_targets_mean": 3081.5, + "valid_targets_min": 1302 + }, + { + "epoch": 2.5641697223677316, + "grad_norm": 0.5863420722239778, + "learning_rate": 3.1969387329759823e-05, + "loss": 0.2594, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.172468364238739, + "step": 4895, + "valid_targets_mean": 4390.5, + "valid_targets_min": 1500 + }, + { + "epoch": 2.566788894709272, + "grad_norm": 0.5419491414286708, + "learning_rate": 3.194844852556301e-05, + "loss": 0.249, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14079037308692932, + "step": 4900, + "valid_targets_mean": 4516.0, + "valid_targets_min": 1909 + }, + { + "epoch": 2.569408067050812, + "grad_norm": 0.5742549479956544, + "learning_rate": 3.1927489336455634e-05, + "loss": 0.2446, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11546041071414948, + "step": 4905, + "valid_targets_mean": 3179.0, + "valid_targets_min": 809 + }, + { + "epoch": 2.572027239392352, + "grad_norm": 0.6280354658180206, + "learning_rate": 3.190650979819558e-05, + "loss": 0.2755, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13638462126255035, + "step": 4910, + "valid_targets_mean": 3833.9, + "valid_targets_min": 2662 + }, + { + "epoch": 2.574646411733892, + "grad_norm": 0.518374228157193, + "learning_rate": 3.188550994657544e-05, + "loss": 0.2596, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1271933913230896, + "step": 4915, + "valid_targets_mean": 4343.4, + "valid_targets_min": 1460 + }, + { + "epoch": 2.577265584075432, + "grad_norm": 0.5180685671704083, + "learning_rate": 3.186448981742249e-05, + "loss": 0.263, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14760158956050873, + "step": 4920, + "valid_targets_mean": 5864.5, + "valid_targets_min": 3945 + }, + { + "epoch": 2.5798847564169725, + "grad_norm": 0.574567284867831, + "learning_rate": 3.184344944659855e-05, + "loss": 0.2623, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.156520813703537, + "step": 4925, + "valid_targets_mean": 4052.5, + "valid_targets_min": 2504 + }, + { + "epoch": 2.5825039287585123, + "grad_norm": 0.5578714284179954, + "learning_rate": 3.182238887000002e-05, + "loss": 0.2681, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1554621011018753, + "step": 4930, + "valid_targets_mean": 5593.9, + "valid_targets_min": 3596 + }, + { + "epoch": 2.585123101100052, + "grad_norm": 0.6046078395960688, + "learning_rate": 3.180130812355775e-05, + "loss": 0.2702, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12882524728775024, + "step": 4935, + "valid_targets_mean": 3224.1, + "valid_targets_min": 1352 + }, + { + "epoch": 2.5877422734415925, + "grad_norm": 0.5122085684412675, + "learning_rate": 3.1780207243237e-05, + "loss": 0.2553, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12836720049381256, + "step": 4940, + "valid_targets_mean": 5189.8, + "valid_targets_min": 1722 + }, + { + "epoch": 2.5903614457831328, + "grad_norm": 0.5459458711195225, + "learning_rate": 3.17590862650374e-05, + "loss": 0.2531, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1324058324098587, + "step": 4945, + "valid_targets_mean": 4270.8, + "valid_targets_min": 2090 + }, + { + "epoch": 2.5929806181246726, + "grad_norm": 0.6004641655982031, + "learning_rate": 3.173794522499284e-05, + "loss": 0.2529, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13428449630737305, + "step": 4950, + "valid_targets_mean": 3596.2, + "valid_targets_min": 1731 + }, + { + "epoch": 2.5955997904662125, + "grad_norm": 0.6172992051651541, + "learning_rate": 3.171678415917146e-05, + "loss": 0.2545, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13604748249053955, + "step": 4955, + "valid_targets_mean": 3311.6, + "valid_targets_min": 1460 + }, + { + "epoch": 2.5982189628077528, + "grad_norm": 0.572741597250024, + "learning_rate": 3.169560310367556e-05, + "loss": 0.2431, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1529918611049652, + "step": 4960, + "valid_targets_mean": 4707.2, + "valid_targets_min": 2357 + }, + { + "epoch": 2.600838135149293, + "grad_norm": 0.5831300386644992, + "learning_rate": 3.1674402094641534e-05, + "loss": 0.2444, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12589526176452637, + "step": 4965, + "valid_targets_mean": 3636.2, + "valid_targets_min": 1511 + }, + { + "epoch": 2.603457307490833, + "grad_norm": 0.5927490633887448, + "learning_rate": 3.1653181168239824e-05, + "loss": 0.2478, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14207634329795837, + "step": 4970, + "valid_targets_mean": 4583.0, + "valid_targets_min": 1764 + }, + { + "epoch": 2.606076479832373, + "grad_norm": 0.6305783971358412, + "learning_rate": 3.163194036067485e-05, + "loss": 0.2689, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14542587101459503, + "step": 4975, + "valid_targets_mean": 3437.5, + "valid_targets_min": 1175 + }, + { + "epoch": 2.608695652173913, + "grad_norm": 0.4970617621017961, + "learning_rate": 3.161067970818496e-05, + "loss": 0.2616, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09945046156644821, + "step": 4980, + "valid_targets_mean": 3982.1, + "valid_targets_min": 2546 + }, + { + "epoch": 2.6113148245154534, + "grad_norm": 0.5949517503873936, + "learning_rate": 3.158939924704236e-05, + "loss": 0.2625, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.146941676735878, + "step": 4985, + "valid_targets_mean": 4124.0, + "valid_targets_min": 1244 + }, + { + "epoch": 2.6139339968569932, + "grad_norm": 0.525319801845006, + "learning_rate": 3.156809901355303e-05, + "loss": 0.2543, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13219237327575684, + "step": 4990, + "valid_targets_mean": 5047.1, + "valid_targets_min": 1856 + }, + { + "epoch": 2.616553169198533, + "grad_norm": 0.5590760328022601, + "learning_rate": 3.154677904405671e-05, + "loss": 0.2533, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14278973639011383, + "step": 4995, + "valid_targets_mean": 3927.4, + "valid_targets_min": 1948 + }, + { + "epoch": 2.6191723415400734, + "grad_norm": 0.5511814734502197, + "learning_rate": 3.152543937492678e-05, + "loss": 0.2481, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12088270485401154, + "step": 5000, + "valid_targets_mean": 3516.5, + "valid_targets_min": 1248 + }, + { + "epoch": 2.6217915138816132, + "grad_norm": 0.5009950800692684, + "learning_rate": 3.150408004257026e-05, + "loss": 0.2514, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12171660363674164, + "step": 5005, + "valid_targets_mean": 4611.0, + "valid_targets_min": 1145 + }, + { + "epoch": 2.6244106862231535, + "grad_norm": 0.6747271785946586, + "learning_rate": 3.1482701083427696e-05, + "loss": 0.2541, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1250152587890625, + "step": 5010, + "valid_targets_mean": 3262.6, + "valid_targets_min": 2058 + }, + { + "epoch": 2.6270298585646934, + "grad_norm": 0.5540119181488308, + "learning_rate": 3.1461302533973136e-05, + "loss": 0.2537, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1475522816181183, + "step": 5015, + "valid_targets_mean": 4546.5, + "valid_targets_min": 1708 + }, + { + "epoch": 2.6296490309062337, + "grad_norm": 0.581373530694527, + "learning_rate": 3.143988443071403e-05, + "loss": 0.2536, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11121198534965515, + "step": 5020, + "valid_targets_mean": 3555.8, + "valid_targets_min": 1301 + }, + { + "epoch": 2.6322682032477736, + "grad_norm": 0.5712205243857897, + "learning_rate": 3.141844681019121e-05, + "loss": 0.2699, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09923257678747177, + "step": 5025, + "valid_targets_mean": 3068.1, + "valid_targets_min": 1971 + }, + { + "epoch": 2.634887375589314, + "grad_norm": 0.5980222178924863, + "learning_rate": 3.139698970897879e-05, + "loss": 0.2651, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15571749210357666, + "step": 5030, + "valid_targets_mean": 5172.4, + "valid_targets_min": 1054 + }, + { + "epoch": 2.6375065479308537, + "grad_norm": 0.609268242830208, + "learning_rate": 3.1375513163684116e-05, + "loss": 0.2603, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14475512504577637, + "step": 5035, + "valid_targets_mean": 3143.4, + "valid_targets_min": 1612 + }, + { + "epoch": 2.640125720272394, + "grad_norm": 0.573022933412219, + "learning_rate": 3.135401721094773e-05, + "loss": 0.2704, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12014967203140259, + "step": 5040, + "valid_targets_mean": 3499.6, + "valid_targets_min": 1274 + }, + { + "epoch": 2.642744892613934, + "grad_norm": 0.6055266043189158, + "learning_rate": 3.1332501887443264e-05, + "loss": 0.2611, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13370947539806366, + "step": 5045, + "valid_targets_mean": 3628.4, + "valid_targets_min": 1625 + }, + { + "epoch": 2.645364064955474, + "grad_norm": 0.5638328015687015, + "learning_rate": 3.13109672298774e-05, + "loss": 0.2685, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14932434260845184, + "step": 5050, + "valid_targets_mean": 4642.5, + "valid_targets_min": 1381 + }, + { + "epoch": 2.647983237297014, + "grad_norm": 0.6375225173023469, + "learning_rate": 3.128941327498982e-05, + "loss": 0.2739, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15590864419937134, + "step": 5055, + "valid_targets_mean": 3540.1, + "valid_targets_min": 1591 + }, + { + "epoch": 2.6506024096385543, + "grad_norm": 0.5701764304397182, + "learning_rate": 3.12678400595531e-05, + "loss": 0.2544, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11090701818466187, + "step": 5060, + "valid_targets_mean": 3714.9, + "valid_targets_min": 1227 + }, + { + "epoch": 2.653221581980094, + "grad_norm": 0.5933349445025315, + "learning_rate": 3.1246247620372705e-05, + "loss": 0.2598, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1708788275718689, + "step": 5065, + "valid_targets_mean": 4004.1, + "valid_targets_min": 1409 + }, + { + "epoch": 2.6558407543216345, + "grad_norm": 0.6464940498552127, + "learning_rate": 3.122463599428688e-05, + "loss": 0.2613, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1424185037612915, + "step": 5070, + "valid_targets_mean": 2940.8, + "valid_targets_min": 885 + }, + { + "epoch": 2.6584599266631743, + "grad_norm": 0.6196882426891219, + "learning_rate": 3.120300521816662e-05, + "loss": 0.2632, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12973468005657196, + "step": 5075, + "valid_targets_mean": 3441.9, + "valid_targets_min": 814 + }, + { + "epoch": 2.6610790990047146, + "grad_norm": 0.5928158810880748, + "learning_rate": 3.118135532891557e-05, + "loss": 0.2605, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12601789832115173, + "step": 5080, + "valid_targets_mean": 4079.0, + "valid_targets_min": 2331 + }, + { + "epoch": 2.6636982713462545, + "grad_norm": 0.5101825477237227, + "learning_rate": 3.1159686363470004e-05, + "loss": 0.2421, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13512998819351196, + "step": 5085, + "valid_targets_mean": 5371.5, + "valid_targets_min": 2618 + }, + { + "epoch": 2.6663174436877948, + "grad_norm": 0.607352602278322, + "learning_rate": 3.1137998358798725e-05, + "loss": 0.2551, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12532103061676025, + "step": 5090, + "valid_targets_mean": 3675.1, + "valid_targets_min": 1434 + }, + { + "epoch": 2.6689366160293346, + "grad_norm": 0.627662258246156, + "learning_rate": 3.1116291351903024e-05, + "loss": 0.2482, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13801538944244385, + "step": 5095, + "valid_targets_mean": 3813.4, + "valid_targets_min": 1074 + }, + { + "epoch": 2.671555788370875, + "grad_norm": 0.6024155475347305, + "learning_rate": 3.109456537981662e-05, + "loss": 0.26, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12260854989290237, + "step": 5100, + "valid_targets_mean": 3690.8, + "valid_targets_min": 980 + }, + { + "epoch": 2.674174960712415, + "grad_norm": 0.604902604391588, + "learning_rate": 3.107282047960557e-05, + "loss": 0.2535, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14585041999816895, + "step": 5105, + "valid_targets_mean": 4903.5, + "valid_targets_min": 2366 + }, + { + "epoch": 2.676794133053955, + "grad_norm": 0.5585577080282759, + "learning_rate": 3.1051056688368245e-05, + "loss": 0.2641, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1398429274559021, + "step": 5110, + "valid_targets_mean": 4654.6, + "valid_targets_min": 1460 + }, + { + "epoch": 2.679413305395495, + "grad_norm": 0.6854350057724503, + "learning_rate": 3.102927404323524e-05, + "loss": 0.2512, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13275103271007538, + "step": 5115, + "valid_targets_mean": 3612.0, + "valid_targets_min": 1351 + }, + { + "epoch": 2.6820324777370352, + "grad_norm": 0.5979776717379521, + "learning_rate": 3.1007472581369284e-05, + "loss": 0.2538, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13742196559906006, + "step": 5120, + "valid_targets_mean": 3632.5, + "valid_targets_min": 2014 + }, + { + "epoch": 2.684651650078575, + "grad_norm": 0.5899005881509998, + "learning_rate": 3.098565233996525e-05, + "loss": 0.2575, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11421630531549454, + "step": 5125, + "valid_targets_mean": 3135.9, + "valid_targets_min": 1084 + }, + { + "epoch": 2.6872708224201154, + "grad_norm": 0.6249029388850529, + "learning_rate": 3.096381335625005e-05, + "loss": 0.2455, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13513506948947906, + "step": 5130, + "valid_targets_mean": 3479.2, + "valid_targets_min": 1618 + }, + { + "epoch": 2.6898899947616552, + "grad_norm": 0.6100810280728409, + "learning_rate": 3.094195566748254e-05, + "loss": 0.2398, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13206806778907776, + "step": 5135, + "valid_targets_mean": 3399.5, + "valid_targets_min": 1747 + }, + { + "epoch": 2.6925091671031955, + "grad_norm": 0.5283575842317508, + "learning_rate": 3.092007931095351e-05, + "loss": 0.2493, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14287996292114258, + "step": 5140, + "valid_targets_mean": 5037.9, + "valid_targets_min": 2092 + }, + { + "epoch": 2.6951283394447354, + "grad_norm": 0.5752611882581933, + "learning_rate": 3.0898184323985594e-05, + "loss": 0.2483, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13903933763504028, + "step": 5145, + "valid_targets_mean": 3843.4, + "valid_targets_min": 2786 + }, + { + "epoch": 2.6977475117862757, + "grad_norm": 0.535866848835118, + "learning_rate": 3.0876270743933214e-05, + "loss": 0.2368, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10054393112659454, + "step": 5150, + "valid_targets_mean": 4153.8, + "valid_targets_min": 1246 + }, + { + "epoch": 2.7003666841278156, + "grad_norm": 0.5746289328777828, + "learning_rate": 3.08543386081825e-05, + "loss": 0.2421, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10839236527681351, + "step": 5155, + "valid_targets_mean": 3389.8, + "valid_targets_min": 1484 + }, + { + "epoch": 2.702985856469356, + "grad_norm": 0.578449089828753, + "learning_rate": 3.083238795415126e-05, + "loss": 0.2481, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1460162103176117, + "step": 5160, + "valid_targets_mean": 4818.0, + "valid_targets_min": 3185 + }, + { + "epoch": 2.7056050288108957, + "grad_norm": 0.6219474109360055, + "learning_rate": 3.0810418819288886e-05, + "loss": 0.2471, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11964847147464752, + "step": 5165, + "valid_targets_mean": 3818.9, + "valid_targets_min": 1530 + }, + { + "epoch": 2.7082242011524356, + "grad_norm": 0.6404418781897823, + "learning_rate": 3.0788431241076286e-05, + "loss": 0.2719, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.148534893989563, + "step": 5170, + "valid_targets_mean": 3010.2, + "valid_targets_min": 887 + }, + { + "epoch": 2.710843373493976, + "grad_norm": 0.5670251738122322, + "learning_rate": 3.076642525702586e-05, + "loss": 0.2432, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12288151681423187, + "step": 5175, + "valid_targets_mean": 4294.1, + "valid_targets_min": 2525 + }, + { + "epoch": 2.713462545835516, + "grad_norm": 0.5556573831730579, + "learning_rate": 3.074440090468138e-05, + "loss": 0.2472, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1274084895849228, + "step": 5180, + "valid_targets_mean": 4256.4, + "valid_targets_min": 1759 + }, + { + "epoch": 2.716081718177056, + "grad_norm": 0.5237360238484792, + "learning_rate": 3.072235822161799e-05, + "loss": 0.2408, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12600873410701752, + "step": 5185, + "valid_targets_mean": 4883.9, + "valid_targets_min": 2155 + }, + { + "epoch": 2.718700890518596, + "grad_norm": 0.6052618076285045, + "learning_rate": 3.070029724544208e-05, + "loss": 0.2558, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12613743543624878, + "step": 5190, + "valid_targets_mean": 3758.9, + "valid_targets_min": 2048 + }, + { + "epoch": 2.721320062860136, + "grad_norm": 0.6131391571695859, + "learning_rate": 3.067821801379125e-05, + "loss": 0.2521, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10715790092945099, + "step": 5195, + "valid_targets_mean": 2550.0, + "valid_targets_min": 1233 + }, + { + "epoch": 2.7239392352016765, + "grad_norm": 0.5511481275343706, + "learning_rate": 3.0656120564334265e-05, + "loss": 0.2559, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09842834621667862, + "step": 5200, + "valid_targets_mean": 2796.5, + "valid_targets_min": 732 + }, + { + "epoch": 2.7265584075432163, + "grad_norm": 0.5393218879075641, + "learning_rate": 3.063400493477097e-05, + "loss": 0.251, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1217995434999466, + "step": 5205, + "valid_targets_mean": 4085.5, + "valid_targets_min": 1800 + }, + { + "epoch": 2.729177579884756, + "grad_norm": 0.5974752377112322, + "learning_rate": 3.061187116283219e-05, + "loss": 0.2528, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12144285440444946, + "step": 5210, + "valid_targets_mean": 3429.1, + "valid_targets_min": 2327 + }, + { + "epoch": 2.7317967522262965, + "grad_norm": 0.5971786736186465, + "learning_rate": 3.0589719286279736e-05, + "loss": 0.2499, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12138991802930832, + "step": 5215, + "valid_targets_mean": 3262.4, + "valid_targets_min": 1597 + }, + { + "epoch": 2.7344159245678368, + "grad_norm": 0.43442958150724836, + "learning_rate": 3.056754934290631e-05, + "loss": 0.168, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07654788345098495, + "step": 5220, + "valid_targets_mean": 3631.8, + "valid_targets_min": 2342 + }, + { + "epoch": 2.7370350969093766, + "grad_norm": 0.4518304418024818, + "learning_rate": 3.054536137053542e-05, + "loss": 0.1062, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.039826858788728714, + "step": 5225, + "valid_targets_mean": 3542.6, + "valid_targets_min": 2731 + }, + { + "epoch": 2.7396542692509165, + "grad_norm": 0.3723356923704959, + "learning_rate": 3.0523155407021343e-05, + "loss": 0.0993, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03338192030787468, + "step": 5230, + "valid_targets_mean": 3569.4, + "valid_targets_min": 2927 + }, + { + "epoch": 2.742273441592457, + "grad_norm": 0.4012919897718542, + "learning_rate": 3.0500931490249032e-05, + "loss": 0.1141, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06943926960229874, + "step": 5235, + "valid_targets_mean": 3426.9, + "valid_targets_min": 2213 + }, + { + "epoch": 2.744892613933997, + "grad_norm": 0.46765799501116584, + "learning_rate": 3.04786896581341e-05, + "loss": 0.0949, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.055836021900177, + "step": 5240, + "valid_targets_mean": 2539.8, + "valid_targets_min": 560 + }, + { + "epoch": 2.747511786275537, + "grad_norm": 0.4050166095909045, + "learning_rate": 3.0456429948622702e-05, + "loss": 0.1012, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05261792242527008, + "step": 5245, + "valid_targets_mean": 2907.5, + "valid_targets_min": 1002 + }, + { + "epoch": 2.750130958617077, + "grad_norm": 0.6799795998400201, + "learning_rate": 3.04341523996915e-05, + "loss": 0.1633, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08086485415697098, + "step": 5250, + "valid_targets_mean": 1458.6, + "valid_targets_min": 650 + }, + { + "epoch": 2.752750130958617, + "grad_norm": 0.37334798666819397, + "learning_rate": 3.041185704934759e-05, + "loss": 0.0989, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04849667102098465, + "step": 5255, + "valid_targets_mean": 3396.1, + "valid_targets_min": 1037 + }, + { + "epoch": 2.7553693033001574, + "grad_norm": 0.5441076998623068, + "learning_rate": 3.0389543935628438e-05, + "loss": 0.1245, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1124047264456749, + "step": 5260, + "valid_targets_mean": 2438.9, + "valid_targets_min": 883 + }, + { + "epoch": 2.7579884756416972, + "grad_norm": 0.24267328190315704, + "learning_rate": 3.0367213096601822e-05, + "loss": 0.1197, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03160983324050903, + "step": 5265, + "valid_targets_mean": 4958.4, + "valid_targets_min": 3285 + }, + { + "epoch": 2.760607647983237, + "grad_norm": 0.3283148739817792, + "learning_rate": 3.0344864570365752e-05, + "loss": 0.0927, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.039658188819885254, + "step": 5270, + "valid_targets_mean": 4092.4, + "valid_targets_min": 764 + }, + { + "epoch": 2.7632268203247774, + "grad_norm": 0.3607218133338841, + "learning_rate": 3.0322498395048422e-05, + "loss": 0.0983, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.050965845584869385, + "step": 5275, + "valid_targets_mean": 3804.9, + "valid_targets_min": 1290 + }, + { + "epoch": 2.7658459926663177, + "grad_norm": 0.4909546931767392, + "learning_rate": 3.030011460880812e-05, + "loss": 0.0981, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06120920181274414, + "step": 5280, + "valid_targets_mean": 2547.8, + "valid_targets_min": 729 + }, + { + "epoch": 2.7684651650078576, + "grad_norm": 0.3042317920249153, + "learning_rate": 3.027771324983321e-05, + "loss": 0.137, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.043728526681661606, + "step": 5285, + "valid_targets_mean": 4258.8, + "valid_targets_min": 1961 + }, + { + "epoch": 2.7710843373493974, + "grad_norm": 0.31391062046456664, + "learning_rate": 3.0255294356342e-05, + "loss": 0.0924, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04248586297035217, + "step": 5290, + "valid_targets_mean": 3557.5, + "valid_targets_min": 1822 + }, + { + "epoch": 2.7737035096909377, + "grad_norm": 0.4130453023231338, + "learning_rate": 3.0232857966582746e-05, + "loss": 0.1085, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05159539356827736, + "step": 5295, + "valid_targets_mean": 2159.6, + "valid_targets_min": 841 + }, + { + "epoch": 2.776322682032478, + "grad_norm": 0.37793693540997453, + "learning_rate": 3.0210404118833527e-05, + "loss": 0.085, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.045104995369911194, + "step": 5300, + "valid_targets_mean": 2735.1, + "valid_targets_min": 732 + }, + { + "epoch": 2.778941854374018, + "grad_norm": 0.7126770459670307, + "learning_rate": 3.0187932851402225e-05, + "loss": 0.1075, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0645991638302803, + "step": 5305, + "valid_targets_mean": 1669.0, + "valid_targets_min": 770 + }, + { + "epoch": 2.7815610267155577, + "grad_norm": 0.39540853200518833, + "learning_rate": 3.0165444202626433e-05, + "loss": 0.1099, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.041591890156269073, + "step": 5310, + "valid_targets_mean": 2415.0, + "valid_targets_min": 847 + }, + { + "epoch": 2.784180199057098, + "grad_norm": 0.43367018565424464, + "learning_rate": 3.01429382108734e-05, + "loss": 0.1149, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05857367068529129, + "step": 5315, + "valid_targets_mean": 3279.4, + "valid_targets_min": 2224 + }, + { + "epoch": 2.786799371398638, + "grad_norm": 0.4122107227346459, + "learning_rate": 3.012041491453996e-05, + "loss": 0.1146, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05071114003658295, + "step": 5320, + "valid_targets_mean": 2944.5, + "valid_targets_min": 1341 + }, + { + "epoch": 2.789418543740178, + "grad_norm": 0.3863943077409809, + "learning_rate": 3.0097874352052477e-05, + "loss": 0.1475, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05821670591831207, + "step": 5325, + "valid_targets_mean": 3912.9, + "valid_targets_min": 3005 + }, + { + "epoch": 2.792037716081718, + "grad_norm": 0.363574384955353, + "learning_rate": 3.0075316561866766e-05, + "loss": 0.0925, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04231640696525574, + "step": 5330, + "valid_targets_mean": 2799.0, + "valid_targets_min": 669 + }, + { + "epoch": 2.7946568884232583, + "grad_norm": 0.6689930239576413, + "learning_rate": 3.0052741582468034e-05, + "loss": 0.1149, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07634914666414261, + "step": 5335, + "valid_targets_mean": 1381.5, + "valid_targets_min": 702 + }, + { + "epoch": 2.797276060764798, + "grad_norm": 0.6259194767422449, + "learning_rate": 3.003014945237082e-05, + "loss": 0.1297, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04922054335474968, + "step": 5340, + "valid_targets_mean": 869.9, + "valid_targets_min": 15 + }, + { + "epoch": 2.7998952331063385, + "grad_norm": 0.35584135567152586, + "learning_rate": 3.0007540210118916e-05, + "loss": 0.1145, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05319155752658844, + "step": 5345, + "valid_targets_mean": 3761.5, + "valid_targets_min": 2827 + }, + { + "epoch": 2.8025144054478783, + "grad_norm": 0.46814357476427576, + "learning_rate": 2.998491389428531e-05, + "loss": 0.1648, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10782517492771149, + "step": 5350, + "valid_targets_mean": 3383.4, + "valid_targets_min": 2079 + }, + { + "epoch": 2.8051335777894186, + "grad_norm": 0.3933848920767778, + "learning_rate": 2.9962270543472125e-05, + "loss": 0.2572, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.051113810390233994, + "step": 5355, + "valid_targets_mean": 3586.4, + "valid_targets_min": 1932 + }, + { + "epoch": 2.8077527501309585, + "grad_norm": 0.5260067132659276, + "learning_rate": 2.993961019631054e-05, + "loss": 0.1201, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05595569685101509, + "step": 5360, + "valid_targets_mean": 1462.1, + "valid_targets_min": 820 + }, + { + "epoch": 2.810371922472499, + "grad_norm": 0.4903945335004159, + "learning_rate": 2.9916932891460732e-05, + "loss": 0.1173, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10142762213945389, + "step": 5365, + "valid_targets_mean": 2709.1, + "valid_targets_min": 965 + }, + { + "epoch": 2.8129910948140386, + "grad_norm": 0.3286219206131438, + "learning_rate": 2.9894238667611816e-05, + "loss": 0.1924, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04985406622290611, + "step": 5370, + "valid_targets_mean": 4498.0, + "valid_targets_min": 2262 + }, + { + "epoch": 2.815610267155579, + "grad_norm": 0.413834999480805, + "learning_rate": 2.987152756348176e-05, + "loss": 0.0962, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08123902976512909, + "step": 5375, + "valid_targets_mean": 4270.9, + "valid_targets_min": 2733 + }, + { + "epoch": 2.818229439497119, + "grad_norm": 0.38853493422731167, + "learning_rate": 2.9848799617817336e-05, + "loss": 0.1036, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07313060760498047, + "step": 5380, + "valid_targets_mean": 4916.5, + "valid_targets_min": 3028 + }, + { + "epoch": 2.820848611838659, + "grad_norm": 0.3180382314400335, + "learning_rate": 2.9826054869394054e-05, + "loss": 0.1041, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03528398275375366, + "step": 5385, + "valid_targets_mean": 4158.5, + "valid_targets_min": 3317 + }, + { + "epoch": 2.823467784180199, + "grad_norm": 0.3309466292419488, + "learning_rate": 2.9803293357016087e-05, + "loss": 0.0954, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.041354067623615265, + "step": 5390, + "valid_targets_mean": 4017.0, + "valid_targets_min": 748 + }, + { + "epoch": 2.8260869565217392, + "grad_norm": 0.39593819578991357, + "learning_rate": 2.9780515119516208e-05, + "loss": 0.0951, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.059333547949790955, + "step": 5395, + "valid_targets_mean": 3627.6, + "valid_targets_min": 2904 + }, + { + "epoch": 2.828706128863279, + "grad_norm": 0.4648870637564455, + "learning_rate": 2.975772019575572e-05, + "loss": 0.1002, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05297884717583656, + "step": 5400, + "valid_targets_mean": 2574.8, + "valid_targets_min": 1939 + }, + { + "epoch": 2.8313253012048194, + "grad_norm": 0.402889325989699, + "learning_rate": 2.9734908624624407e-05, + "loss": 0.084, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04135642200708389, + "step": 5405, + "valid_targets_mean": 2599.0, + "valid_targets_min": 772 + }, + { + "epoch": 2.8339444735463593, + "grad_norm": 0.5410229605482512, + "learning_rate": 2.971208044504044e-05, + "loss": 0.1508, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09342281520366669, + "step": 5410, + "valid_targets_mean": 2805.9, + "valid_targets_min": 1289 + }, + { + "epoch": 2.8365636458878996, + "grad_norm": 0.3768403055787591, + "learning_rate": 2.968923569595034e-05, + "loss": 0.0774, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04221757873892784, + "step": 5415, + "valid_targets_mean": 3667.9, + "valid_targets_min": 2730 + }, + { + "epoch": 2.8391828182294394, + "grad_norm": 0.38783078033593726, + "learning_rate": 2.9666374416328874e-05, + "loss": 0.0912, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0400664359331131, + "step": 5420, + "valid_targets_mean": 2270.9, + "valid_targets_min": 616 + }, + { + "epoch": 2.8418019905709797, + "grad_norm": 0.33047465013092353, + "learning_rate": 2.9643496645179034e-05, + "loss": 0.0862, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04919986054301262, + "step": 5425, + "valid_targets_mean": 4381.4, + "valid_targets_min": 3979 + }, + { + "epoch": 2.8444211629125196, + "grad_norm": 0.4061462618944902, + "learning_rate": 2.9620602421531944e-05, + "loss": 0.1029, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0646735206246376, + "step": 5430, + "valid_targets_mean": 2635.8, + "valid_targets_min": 795 + }, + { + "epoch": 2.84704033525406, + "grad_norm": 0.3296198223401941, + "learning_rate": 2.959769178444678e-05, + "loss": 0.1302, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04333513230085373, + "step": 5435, + "valid_targets_mean": 3182.4, + "valid_targets_min": 729 + }, + { + "epoch": 2.8496595075955997, + "grad_norm": 0.5134410202466364, + "learning_rate": 2.9574764773010743e-05, + "loss": 0.1258, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05219130218029022, + "step": 5440, + "valid_targets_mean": 1878.5, + "valid_targets_min": 745 + }, + { + "epoch": 2.85227867993714, + "grad_norm": 0.603936272047619, + "learning_rate": 2.9551821426338958e-05, + "loss": 0.1134, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09199359267950058, + "step": 5445, + "valid_targets_mean": 2249.8, + "valid_targets_min": 664 + }, + { + "epoch": 2.85489785227868, + "grad_norm": 0.4318924619202293, + "learning_rate": 2.9528861783574416e-05, + "loss": 0.1215, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.043887414038181305, + "step": 5450, + "valid_targets_mean": 2284.8, + "valid_targets_min": 890 + }, + { + "epoch": 2.85751702462022, + "grad_norm": 0.34140930648182255, + "learning_rate": 2.950588588388792e-05, + "loss": 0.1407, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.045628830790519714, + "step": 5455, + "valid_targets_mean": 3838.2, + "valid_targets_min": 2440 + }, + { + "epoch": 2.86013619696176, + "grad_norm": 0.400531024076249, + "learning_rate": 2.9482893766478e-05, + "loss": 0.1043, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.041745901107788086, + "step": 5460, + "valid_targets_mean": 3074.5, + "valid_targets_min": 840 + }, + { + "epoch": 2.8627553693033003, + "grad_norm": 0.4452066763835879, + "learning_rate": 2.9459885470570856e-05, + "loss": 0.1263, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05026886984705925, + "step": 5465, + "valid_targets_mean": 3609.8, + "valid_targets_min": 1014 + }, + { + "epoch": 2.86537454164484, + "grad_norm": 0.42926121252820065, + "learning_rate": 2.9436861035420298e-05, + "loss": 0.1082, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.044806621968746185, + "step": 5470, + "valid_targets_mean": 1142.9, + "valid_targets_min": 485 + }, + { + "epoch": 2.8679937139863805, + "grad_norm": 0.4386900241651716, + "learning_rate": 2.9413820500307665e-05, + "loss": 0.0971, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04453166574239731, + "step": 5475, + "valid_targets_mean": 2665.6, + "valid_targets_min": 605 + }, + { + "epoch": 2.8706128863279203, + "grad_norm": 0.28254308805117223, + "learning_rate": 2.939076390454176e-05, + "loss": 0.0934, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03537259250879288, + "step": 5480, + "valid_targets_mean": 4443.1, + "valid_targets_min": 848 + }, + { + "epoch": 2.87323205866946, + "grad_norm": 0.3871232976277066, + "learning_rate": 2.9367691287458786e-05, + "loss": 0.093, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05675549805164337, + "step": 5485, + "valid_targets_mean": 4255.2, + "valid_targets_min": 884 + }, + { + "epoch": 2.8758512310110005, + "grad_norm": 0.3994867830249035, + "learning_rate": 2.9344602688422286e-05, + "loss": 0.0936, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.048137348145246506, + "step": 5490, + "valid_targets_mean": 3826.2, + "valid_targets_min": 1992 + }, + { + "epoch": 2.878470403352541, + "grad_norm": 0.37453332633288844, + "learning_rate": 2.932149814682308e-05, + "loss": 0.107, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06611055880784988, + "step": 5495, + "valid_targets_mean": 3189.2, + "valid_targets_min": 808 + }, + { + "epoch": 2.8810895756940806, + "grad_norm": 0.42821727671187865, + "learning_rate": 2.929837770207915e-05, + "loss": 0.1058, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05029541254043579, + "step": 5500, + "valid_targets_mean": 3188.5, + "valid_targets_min": 1814 + }, + { + "epoch": 2.8837087480356205, + "grad_norm": 0.42426030057120456, + "learning_rate": 2.927524139363565e-05, + "loss": 0.1118, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05611751228570938, + "step": 5505, + "valid_targets_mean": 2962.6, + "valid_targets_min": 931 + }, + { + "epoch": 2.886327920377161, + "grad_norm": 0.3289453216560865, + "learning_rate": 2.925208926096478e-05, + "loss": 0.0852, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04311997443437576, + "step": 5510, + "valid_targets_mean": 4098.5, + "valid_targets_min": 3848 + }, + { + "epoch": 2.888947092718701, + "grad_norm": 0.48169193309453806, + "learning_rate": 2.9228921343565733e-05, + "loss": 0.1014, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.052452776581048965, + "step": 5515, + "valid_targets_mean": 1851.2, + "valid_targets_min": 664 + }, + { + "epoch": 2.891566265060241, + "grad_norm": 0.37235486925460154, + "learning_rate": 2.9205737680964645e-05, + "loss": 0.1038, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05145837739109993, + "step": 5520, + "valid_targets_mean": 3527.9, + "valid_targets_min": 2309 + }, + { + "epoch": 2.894185437401781, + "grad_norm": 0.39994110176146797, + "learning_rate": 2.9182538312714506e-05, + "loss": 0.0827, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.041609033942222595, + "step": 5525, + "valid_targets_mean": 2707.0, + "valid_targets_min": 1003 + }, + { + "epoch": 2.896804609743321, + "grad_norm": 0.3375712957693352, + "learning_rate": 2.91593232783951e-05, + "loss": 0.1022, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03793808072805405, + "step": 5530, + "valid_targets_mean": 3107.2, + "valid_targets_min": 531 + }, + { + "epoch": 2.8994237820848614, + "grad_norm": 0.35215830014753513, + "learning_rate": 2.913609261761295e-05, + "loss": 0.102, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.046030208468437195, + "step": 5535, + "valid_targets_mean": 2845.9, + "valid_targets_min": 1003 + }, + { + "epoch": 2.9020429544264013, + "grad_norm": 0.4671244222007615, + "learning_rate": 2.9112846370001223e-05, + "loss": 0.1221, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03913413733243942, + "step": 5540, + "valid_targets_mean": 1568.5, + "valid_targets_min": 597 + }, + { + "epoch": 2.904662126767941, + "grad_norm": 0.40153476187632986, + "learning_rate": 2.9089584575219688e-05, + "loss": 0.1006, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03844350203871727, + "step": 5545, + "valid_targets_mean": 1980.2, + "valid_targets_min": 665 + }, + { + "epoch": 2.9072812991094814, + "grad_norm": 0.49738924762354936, + "learning_rate": 2.906630727295463e-05, + "loss": 0.1192, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04668961465358734, + "step": 5550, + "valid_targets_mean": 1768.5, + "valid_targets_min": 853 + }, + { + "epoch": 2.9099004714510217, + "grad_norm": 0.44675384756678116, + "learning_rate": 2.9043014502918807e-05, + "loss": 0.1068, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07055791467428207, + "step": 5555, + "valid_targets_mean": 2583.2, + "valid_targets_min": 997 + }, + { + "epoch": 2.9125196437925616, + "grad_norm": 0.5219035167189274, + "learning_rate": 2.9019706304851348e-05, + "loss": 0.1136, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06573070585727692, + "step": 5560, + "valid_targets_mean": 2746.6, + "valid_targets_min": 740 + }, + { + "epoch": 2.9151388161341014, + "grad_norm": 0.31231730341467273, + "learning_rate": 2.8996382718517724e-05, + "loss": 0.0937, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03759889677166939, + "step": 5565, + "valid_targets_mean": 3555.2, + "valid_targets_min": 2887 + }, + { + "epoch": 2.9177579884756417, + "grad_norm": 0.33964128112886155, + "learning_rate": 2.8973043783709628e-05, + "loss": 0.0946, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03595292568206787, + "step": 5570, + "valid_targets_mean": 3754.2, + "valid_targets_min": 2543 + }, + { + "epoch": 2.920377160817182, + "grad_norm": 0.48461253619580297, + "learning_rate": 2.894968954024497e-05, + "loss": 0.126, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05458501726388931, + "step": 5575, + "valid_targets_mean": 1742.1, + "valid_targets_min": 446 + }, + { + "epoch": 2.922996333158722, + "grad_norm": 0.36508330284009327, + "learning_rate": 2.8926320027967763e-05, + "loss": 0.0872, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03947306424379349, + "step": 5580, + "valid_targets_mean": 2742.4, + "valid_targets_min": 681 + }, + { + "epoch": 2.9256155055002617, + "grad_norm": 0.39691509130909497, + "learning_rate": 2.8902935286748066e-05, + "loss": 0.0964, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07151953876018524, + "step": 5585, + "valid_targets_mean": 3844.6, + "valid_targets_min": 799 + }, + { + "epoch": 2.928234677841802, + "grad_norm": 0.37319668001393097, + "learning_rate": 2.8879535356481933e-05, + "loss": 0.0942, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04579343646764755, + "step": 5590, + "valid_targets_mean": 3546.4, + "valid_targets_min": 940 + }, + { + "epoch": 2.9308538501833423, + "grad_norm": 0.3072038585673081, + "learning_rate": 2.8856120277091326e-05, + "loss": 0.0829, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.034740135073661804, + "step": 5595, + "valid_targets_mean": 3592.6, + "valid_targets_min": 861 + }, + { + "epoch": 2.933473022524882, + "grad_norm": 0.4037290376400598, + "learning_rate": 2.8832690088524045e-05, + "loss": 0.0924, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06839783489704132, + "step": 5600, + "valid_targets_mean": 4078.1, + "valid_targets_min": 3024 + }, + { + "epoch": 2.936092194866422, + "grad_norm": 0.3119248430637808, + "learning_rate": 2.8809244830753667e-05, + "loss": 0.0974, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05406394228339195, + "step": 5605, + "valid_targets_mean": 3932.1, + "valid_targets_min": 3175 + }, + { + "epoch": 2.9387113672079623, + "grad_norm": 0.3498723220699873, + "learning_rate": 2.8785784543779497e-05, + "loss": 0.1182, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04904625564813614, + "step": 5610, + "valid_targets_mean": 3798.4, + "valid_targets_min": 2652 + }, + { + "epoch": 2.9413305395495026, + "grad_norm": 0.4385505136502549, + "learning_rate": 2.8762309267626465e-05, + "loss": 0.121, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11120840162038803, + "step": 5615, + "valid_targets_mean": 2981.9, + "valid_targets_min": 764 + }, + { + "epoch": 2.9439497118910425, + "grad_norm": 0.4153393952520855, + "learning_rate": 2.8738819042345073e-05, + "loss": 0.0793, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05048034340143204, + "step": 5620, + "valid_targets_mean": 1483.8, + "valid_targets_min": 815 + }, + { + "epoch": 2.9465688842325823, + "grad_norm": 0.37736301208032946, + "learning_rate": 2.8715313908011332e-05, + "loss": 0.1187, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05640570446848869, + "step": 5625, + "valid_targets_mean": 3776.4, + "valid_targets_min": 2447 + }, + { + "epoch": 2.9491880565741226, + "grad_norm": 0.41033167104265644, + "learning_rate": 2.8691793904726685e-05, + "loss": 0.0941, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.053387630730867386, + "step": 5630, + "valid_targets_mean": 3455.1, + "valid_targets_min": 854 + }, + { + "epoch": 2.9518072289156625, + "grad_norm": 0.33174583059520024, + "learning_rate": 2.8668259072617946e-05, + "loss": 0.1028, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03358113765716553, + "step": 5635, + "valid_targets_mean": 3706.0, + "valid_targets_min": 743 + }, + { + "epoch": 2.954426401257203, + "grad_norm": 0.5185327579576747, + "learning_rate": 2.864470945183724e-05, + "loss": 0.1167, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09212501347064972, + "step": 5640, + "valid_targets_mean": 2587.1, + "valid_targets_min": 706 + }, + { + "epoch": 2.9570455735987426, + "grad_norm": 0.4414609757950001, + "learning_rate": 2.8621145082561886e-05, + "loss": 0.1415, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09895250201225281, + "step": 5645, + "valid_targets_mean": 3028.0, + "valid_targets_min": 2457 + }, + { + "epoch": 2.959664745940283, + "grad_norm": 0.41969596363187245, + "learning_rate": 2.8597566004994407e-05, + "loss": 0.1081, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0406753309071064, + "step": 5650, + "valid_targets_mean": 2147.2, + "valid_targets_min": 663 + }, + { + "epoch": 2.962283918281823, + "grad_norm": 0.4634764618622666, + "learning_rate": 2.8573972259362405e-05, + "loss": 0.1002, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.049560319632291794, + "step": 5655, + "valid_targets_mean": 1507.4, + "valid_targets_min": 716 + }, + { + "epoch": 2.964903090623363, + "grad_norm": 0.3753956288776308, + "learning_rate": 2.855036388591848e-05, + "loss": 0.0942, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.057809121906757355, + "step": 5660, + "valid_targets_mean": 3088.1, + "valid_targets_min": 760 + }, + { + "epoch": 2.967522262964903, + "grad_norm": 0.3927551212565586, + "learning_rate": 2.8526740924940234e-05, + "loss": 0.0959, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.052389007061719894, + "step": 5665, + "valid_targets_mean": 3074.9, + "valid_targets_min": 920 + }, + { + "epoch": 2.9701414353064433, + "grad_norm": 0.3920311639286199, + "learning_rate": 2.8503103416730123e-05, + "loss": 0.0845, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.032711006700992584, + "step": 5670, + "valid_targets_mean": 997.5, + "valid_targets_min": 635 + }, + { + "epoch": 2.972760607647983, + "grad_norm": 0.34637553831989293, + "learning_rate": 2.8479451401615434e-05, + "loss": 0.1191, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04361840337514877, + "step": 5675, + "valid_targets_mean": 2942.0, + "valid_targets_min": 920 + }, + { + "epoch": 2.9753797799895234, + "grad_norm": 0.39651341139648016, + "learning_rate": 2.8455784919948206e-05, + "loss": 0.0857, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.042224809527397156, + "step": 5680, + "valid_targets_mean": 1271.1, + "valid_targets_min": 704 + }, + { + "epoch": 2.9779989523310633, + "grad_norm": 0.38317061342586256, + "learning_rate": 2.8432104012105144e-05, + "loss": 0.0943, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.034398600459098816, + "step": 5685, + "valid_targets_mean": 2149.4, + "valid_targets_min": 529 + }, + { + "epoch": 2.9806181246726036, + "grad_norm": 0.3884152721470461, + "learning_rate": 2.8408408718487582e-05, + "loss": 0.1029, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05746208131313324, + "step": 5690, + "valid_targets_mean": 3471.9, + "valid_targets_min": 2017 + }, + { + "epoch": 2.9832372970141434, + "grad_norm": 0.30370806170817466, + "learning_rate": 2.8384699079521398e-05, + "loss": 0.0931, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0494544580578804, + "step": 5695, + "valid_targets_mean": 4240.2, + "valid_targets_min": 516 + }, + { + "epoch": 2.9858564693556837, + "grad_norm": 0.30344571122795916, + "learning_rate": 2.836097513565693e-05, + "loss": 0.086, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04066718369722366, + "step": 5700, + "valid_targets_mean": 2583.9, + "valid_targets_min": 775 + }, + { + "epoch": 2.9884756416972236, + "grad_norm": 0.29743190177468465, + "learning_rate": 2.833723692736893e-05, + "loss": 0.0896, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04501290246844292, + "step": 5705, + "valid_targets_mean": 3741.6, + "valid_targets_min": 605 + }, + { + "epoch": 2.991094814038764, + "grad_norm": 0.47781571969317105, + "learning_rate": 2.8313484495156486e-05, + "loss": 0.1701, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16558252274990082, + "step": 5710, + "valid_targets_mean": 2971.0, + "valid_targets_min": 1907 + }, + { + "epoch": 2.9937139863803037, + "grad_norm": 0.3470372996331737, + "learning_rate": 2.828971787954295e-05, + "loss": 0.1148, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.044766783714294434, + "step": 5715, + "valid_targets_mean": 3138.5, + "valid_targets_min": 1235 + }, + { + "epoch": 2.996333158721844, + "grad_norm": 0.3702526905954634, + "learning_rate": 2.8265937121075873e-05, + "loss": 0.1012, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04486331343650818, + "step": 5720, + "valid_targets_mean": 2935.4, + "valid_targets_min": 759 + }, + { + "epoch": 2.998952331063384, + "grad_norm": 0.41766615047107897, + "learning_rate": 2.8242142260326937e-05, + "loss": 0.0931, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06796953827142715, + "step": 5725, + "valid_targets_mean": 2050.0, + "valid_targets_min": 927 + }, + { + "epoch": 3.001571503404924, + "grad_norm": 0.7981101464361773, + "learning_rate": 2.8218333337891882e-05, + "loss": 0.1914, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0790286436676979, + "step": 5730, + "valid_targets_mean": 1270.1, + "valid_targets_min": 788 + }, + { + "epoch": 3.004190675746464, + "grad_norm": 0.7560583152250143, + "learning_rate": 2.8194510394390443e-05, + "loss": 0.1857, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08779201656579971, + "step": 5735, + "valid_targets_mean": 1545.5, + "valid_targets_min": 957 + }, + { + "epoch": 3.0068098480880043, + "grad_norm": 0.7348656221096983, + "learning_rate": 2.817067347046626e-05, + "loss": 0.1755, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08141259104013443, + "step": 5740, + "valid_targets_mean": 1351.6, + "valid_targets_min": 796 + }, + { + "epoch": 3.009429020429544, + "grad_norm": 0.7448213958029152, + "learning_rate": 2.814682260678684e-05, + "loss": 0.1734, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09365697205066681, + "step": 5745, + "valid_targets_mean": 1480.6, + "valid_targets_min": 839 + }, + { + "epoch": 3.0120481927710845, + "grad_norm": 0.7348628545274174, + "learning_rate": 2.8122957844043474e-05, + "loss": 0.1744, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07291596382856369, + "step": 5750, + "valid_targets_mean": 1344.9, + "valid_targets_min": 638 + }, + { + "epoch": 3.0146673651126243, + "grad_norm": 0.6685850834334908, + "learning_rate": 2.809907922295115e-05, + "loss": 0.1729, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08419374376535416, + "step": 5755, + "valid_targets_mean": 1538.4, + "valid_targets_min": 727 + }, + { + "epoch": 3.0172865374541646, + "grad_norm": 0.6793100238003746, + "learning_rate": 2.8075186784248517e-05, + "loss": 0.1767, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07691366970539093, + "step": 5760, + "valid_targets_mean": 1195.4, + "valid_targets_min": 761 + }, + { + "epoch": 3.0199057097957045, + "grad_norm": 0.7629492371583007, + "learning_rate": 2.805128056869779e-05, + "loss": 0.1641, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08975130319595337, + "step": 5765, + "valid_targets_mean": 1309.1, + "valid_targets_min": 714 + }, + { + "epoch": 3.022524882137245, + "grad_norm": 0.8394951597437683, + "learning_rate": 2.8027360617084684e-05, + "loss": 0.1846, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08716186136007309, + "step": 5770, + "valid_targets_mean": 1417.9, + "valid_targets_min": 741 + }, + { + "epoch": 3.0251440544787846, + "grad_norm": 0.7196217010538367, + "learning_rate": 2.800342697021835e-05, + "loss": 0.1758, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10522545874118805, + "step": 5775, + "valid_targets_mean": 2031.6, + "valid_targets_min": 663 + }, + { + "epoch": 3.027763226820325, + "grad_norm": 0.6603324262189301, + "learning_rate": 2.797947966893131e-05, + "loss": 0.1673, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07629004120826721, + "step": 5780, + "valid_targets_mean": 1393.6, + "valid_targets_min": 696 + }, + { + "epoch": 3.030382399161865, + "grad_norm": 0.6645598545760699, + "learning_rate": 2.7955518754079382e-05, + "loss": 0.1785, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09426233172416687, + "step": 5785, + "valid_targets_mean": 1895.8, + "valid_targets_min": 1009 + }, + { + "epoch": 3.033001571503405, + "grad_norm": 0.6434178337672452, + "learning_rate": 2.7931544266541596e-05, + "loss": 0.1687, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07660476118326187, + "step": 5790, + "valid_targets_mean": 1525.5, + "valid_targets_min": 717 + }, + { + "epoch": 3.035620743844945, + "grad_norm": 0.7319443766974159, + "learning_rate": 2.7907556247220166e-05, + "loss": 0.1608, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08354084193706512, + "step": 5795, + "valid_targets_mean": 1484.6, + "valid_targets_min": 659 + }, + { + "epoch": 3.0382399161864853, + "grad_norm": 0.6469303704614396, + "learning_rate": 2.788355473704036e-05, + "loss": 0.1608, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.064138263463974, + "step": 5800, + "valid_targets_mean": 1206.5, + "valid_targets_min": 642 + }, + { + "epoch": 3.040859088528025, + "grad_norm": 0.6479047117986019, + "learning_rate": 2.7859539776950478e-05, + "loss": 0.1673, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.059673525393009186, + "step": 5805, + "valid_targets_mean": 1201.8, + "valid_targets_min": 765 + }, + { + "epoch": 3.0434782608695654, + "grad_norm": 0.7345623554093044, + "learning_rate": 2.7835511407921765e-05, + "loss": 0.1776, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07721047103404999, + "step": 5810, + "valid_targets_mean": 1359.4, + "valid_targets_min": 631 + }, + { + "epoch": 3.0460974332111053, + "grad_norm": 0.7742188256489263, + "learning_rate": 2.7811469670948348e-05, + "loss": 0.1755, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09204640984535217, + "step": 5815, + "valid_targets_mean": 1498.5, + "valid_targets_min": 623 + }, + { + "epoch": 3.0487166055526456, + "grad_norm": 0.7153340181131183, + "learning_rate": 2.778741460704715e-05, + "loss": 0.1711, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11384181678295135, + "step": 5820, + "valid_targets_mean": 2016.6, + "valid_targets_min": 973 + }, + { + "epoch": 3.0513357778941854, + "grad_norm": 0.6562771495413292, + "learning_rate": 2.7763346257257843e-05, + "loss": 0.171, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07798384130001068, + "step": 5825, + "valid_targets_mean": 1504.4, + "valid_targets_min": 776 + }, + { + "epoch": 3.0539549502357257, + "grad_norm": 0.7155882622011773, + "learning_rate": 2.7739264662642754e-05, + "loss": 0.1696, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10642405599355698, + "step": 5830, + "valid_targets_mean": 1658.8, + "valid_targets_min": 623 + }, + { + "epoch": 3.0565741225772656, + "grad_norm": 0.7226093969321024, + "learning_rate": 2.771516986428681e-05, + "loss": 0.173, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09716735780239105, + "step": 5835, + "valid_targets_mean": 1586.8, + "valid_targets_min": 1243 + }, + { + "epoch": 3.059193294918806, + "grad_norm": 0.7236637463167985, + "learning_rate": 2.7691061903297466e-05, + "loss": 0.17, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.058030158281326294, + "step": 5840, + "valid_targets_mean": 1026.9, + "valid_targets_min": 611 + }, + { + "epoch": 3.0618124672603457, + "grad_norm": 0.7376730852977844, + "learning_rate": 2.7666940820804633e-05, + "loss": 0.1619, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0830594152212143, + "step": 5845, + "valid_targets_mean": 1498.2, + "valid_targets_min": 793 + }, + { + "epoch": 3.064431639601886, + "grad_norm": 0.6609142339695006, + "learning_rate": 2.7642806657960613e-05, + "loss": 0.1658, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.091240793466568, + "step": 5850, + "valid_targets_mean": 1812.6, + "valid_targets_min": 886 + }, + { + "epoch": 3.067050811943426, + "grad_norm": 0.7051693250614872, + "learning_rate": 2.761865945594002e-05, + "loss": 0.164, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08153796195983887, + "step": 5855, + "valid_targets_mean": 1643.8, + "valid_targets_min": 991 + }, + { + "epoch": 3.0696699842849657, + "grad_norm": 0.9082944258312199, + "learning_rate": 2.759449925593971e-05, + "loss": 0.1678, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10334397107362747, + "step": 5860, + "valid_targets_mean": 1784.2, + "valid_targets_min": 1107 + }, + { + "epoch": 3.072289156626506, + "grad_norm": 0.7095035432530095, + "learning_rate": 2.7570326099178716e-05, + "loss": 0.1761, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0884983241558075, + "step": 5865, + "valid_targets_mean": 1524.6, + "valid_targets_min": 680 + }, + { + "epoch": 3.074908328968046, + "grad_norm": 0.6555581714051659, + "learning_rate": 2.754614002689818e-05, + "loss": 0.1599, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1063360646367073, + "step": 5870, + "valid_targets_mean": 1774.9, + "valid_targets_min": 981 + }, + { + "epoch": 3.077527501309586, + "grad_norm": 0.735815034221504, + "learning_rate": 2.7521941080361275e-05, + "loss": 0.1689, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09698130190372467, + "step": 5875, + "valid_targets_mean": 1748.0, + "valid_targets_min": 937 + }, + { + "epoch": 3.080146673651126, + "grad_norm": 0.7125484974425914, + "learning_rate": 2.749772930085315e-05, + "loss": 0.1692, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09398886561393738, + "step": 5880, + "valid_targets_mean": 1739.2, + "valid_targets_min": 804 + }, + { + "epoch": 3.0827658459926663, + "grad_norm": 0.9696180961709159, + "learning_rate": 2.7473504729680823e-05, + "loss": 0.1715, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06936175376176834, + "step": 5885, + "valid_targets_mean": 1306.5, + "valid_targets_min": 675 + }, + { + "epoch": 3.085385018334206, + "grad_norm": 0.7256259095947776, + "learning_rate": 2.744926740817316e-05, + "loss": 0.1635, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07942957431077957, + "step": 5890, + "valid_targets_mean": 1250.9, + "valid_targets_min": 882 + }, + { + "epoch": 3.0880041906757465, + "grad_norm": 0.6750034166270854, + "learning_rate": 2.742501737768077e-05, + "loss": 0.1632, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08731904625892639, + "step": 5895, + "valid_targets_mean": 1721.5, + "valid_targets_min": 1116 + }, + { + "epoch": 3.0906233630172864, + "grad_norm": 0.7339452739226756, + "learning_rate": 2.7400754679575948e-05, + "loss": 0.1528, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06412196904420853, + "step": 5900, + "valid_targets_mean": 1218.5, + "valid_targets_min": 678 + }, + { + "epoch": 3.0932425353588267, + "grad_norm": 0.7104961468611212, + "learning_rate": 2.7376479355252588e-05, + "loss": 0.1689, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06227774918079376, + "step": 5905, + "valid_targets_mean": 1085.4, + "valid_targets_min": 676 + }, + { + "epoch": 3.0958617077003665, + "grad_norm": 0.6733244215312041, + "learning_rate": 2.7352191446126145e-05, + "loss": 0.1653, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07951797544956207, + "step": 5910, + "valid_targets_mean": 1521.0, + "valid_targets_min": 849 + }, + { + "epoch": 3.098480880041907, + "grad_norm": 0.6663067364300812, + "learning_rate": 2.732789099363353e-05, + "loss": 0.1643, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08559563755989075, + "step": 5915, + "valid_targets_mean": 1485.2, + "valid_targets_min": 742 + }, + { + "epoch": 3.1011000523834467, + "grad_norm": 0.709938600907913, + "learning_rate": 2.7303578039233055e-05, + "loss": 0.1636, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10190951079130173, + "step": 5920, + "valid_targets_mean": 1642.5, + "valid_targets_min": 1077 + }, + { + "epoch": 3.103719224724987, + "grad_norm": 0.7754935357002035, + "learning_rate": 2.7279252624404374e-05, + "loss": 0.1727, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1033768430352211, + "step": 5925, + "valid_targets_mean": 1766.6, + "valid_targets_min": 858 + }, + { + "epoch": 3.106338397066527, + "grad_norm": 0.7090344892805982, + "learning_rate": 2.7254914790648387e-05, + "loss": 0.1547, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08158548176288605, + "step": 5930, + "valid_targets_mean": 1349.6, + "valid_targets_min": 689 + }, + { + "epoch": 3.108957569408067, + "grad_norm": 0.7331205271019855, + "learning_rate": 2.723056457948718e-05, + "loss": 0.1735, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08869096636772156, + "step": 5935, + "valid_targets_mean": 1466.2, + "valid_targets_min": 768 + }, + { + "epoch": 3.111576741749607, + "grad_norm": 0.7026004684688643, + "learning_rate": 2.7206202032463963e-05, + "loss": 0.1669, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07913877815008163, + "step": 5940, + "valid_targets_mean": 1471.5, + "valid_targets_min": 1058 + }, + { + "epoch": 3.1141959140911473, + "grad_norm": 0.6928949635881819, + "learning_rate": 2.7181827191142988e-05, + "loss": 0.1778, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08693772554397583, + "step": 5945, + "valid_targets_mean": 1477.9, + "valid_targets_min": 618 + }, + { + "epoch": 3.116815086432687, + "grad_norm": 0.7072944606587698, + "learning_rate": 2.7157440097109496e-05, + "loss": 0.1586, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08366671204566956, + "step": 5950, + "valid_targets_mean": 1510.1, + "valid_targets_min": 629 + }, + { + "epoch": 3.1194342587742274, + "grad_norm": 0.7155777290977046, + "learning_rate": 2.7133040791969597e-05, + "loss": 0.165, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0935017466545105, + "step": 5955, + "valid_targets_mean": 1804.2, + "valid_targets_min": 1167 + }, + { + "epoch": 3.1220534311157673, + "grad_norm": 0.677362020785958, + "learning_rate": 2.7108629317350278e-05, + "loss": 0.1669, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08500826358795166, + "step": 5960, + "valid_targets_mean": 1497.8, + "valid_targets_min": 699 + }, + { + "epoch": 3.1246726034573076, + "grad_norm": 0.7286002740634437, + "learning_rate": 2.7084205714899247e-05, + "loss": 0.1582, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06782686710357666, + "step": 5965, + "valid_targets_mean": 1328.5, + "valid_targets_min": 679 + }, + { + "epoch": 3.1272917757988474, + "grad_norm": 0.7021339243865264, + "learning_rate": 2.705977002628494e-05, + "loss": 0.1596, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08048438280820847, + "step": 5970, + "valid_targets_mean": 1501.8, + "valid_targets_min": 504 + }, + { + "epoch": 3.1299109481403877, + "grad_norm": 0.6830143227137973, + "learning_rate": 2.703532229319638e-05, + "loss": 0.1643, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0930556207895279, + "step": 5975, + "valid_targets_mean": 1900.4, + "valid_targets_min": 1331 + }, + { + "epoch": 3.1325301204819276, + "grad_norm": 0.6861135630337549, + "learning_rate": 2.7010862557343168e-05, + "loss": 0.1643, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04893141984939575, + "step": 5980, + "valid_targets_mean": 1172.0, + "valid_targets_min": 661 + }, + { + "epoch": 3.135149292823468, + "grad_norm": 0.6776084061989935, + "learning_rate": 2.698639086045536e-05, + "loss": 0.1694, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06864239275455475, + "step": 5985, + "valid_targets_mean": 1402.1, + "valid_targets_min": 958 + }, + { + "epoch": 3.1377684651650077, + "grad_norm": 0.6443724306278145, + "learning_rate": 2.6961907244283424e-05, + "loss": 0.1564, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09214092791080475, + "step": 5990, + "valid_targets_mean": 1866.2, + "valid_targets_min": 963 + }, + { + "epoch": 3.140387637506548, + "grad_norm": 0.6757253945114164, + "learning_rate": 2.6937411750598172e-05, + "loss": 0.1657, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06545227020978928, + "step": 5995, + "valid_targets_mean": 1191.1, + "valid_targets_min": 793 + }, + { + "epoch": 3.143006809848088, + "grad_norm": 0.7973697455117805, + "learning_rate": 2.6912904421190672e-05, + "loss": 0.1669, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11898652464151382, + "step": 6000, + "valid_targets_mean": 1563.2, + "valid_targets_min": 917 + }, + { + "epoch": 3.145625982189628, + "grad_norm": 0.722464004593059, + "learning_rate": 2.6888385297872194e-05, + "loss": 0.1629, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06986261904239655, + "step": 6005, + "valid_targets_mean": 1274.4, + "valid_targets_min": 752 + }, + { + "epoch": 3.148245154531168, + "grad_norm": 0.6946891567070904, + "learning_rate": 2.6863854422474108e-05, + "loss": 0.1647, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10306160897016525, + "step": 6010, + "valid_targets_mean": 1790.4, + "valid_targets_min": 1220 + }, + { + "epoch": 3.1508643268727083, + "grad_norm": 0.6969095258678409, + "learning_rate": 2.6839311836847856e-05, + "loss": 0.1516, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09284568578004837, + "step": 6015, + "valid_targets_mean": 1727.0, + "valid_targets_min": 953 + }, + { + "epoch": 3.153483499214248, + "grad_norm": 0.7707142300486267, + "learning_rate": 2.6814757582864847e-05, + "loss": 0.1582, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08388621360063553, + "step": 6020, + "valid_targets_mean": 1370.0, + "valid_targets_min": 639 + }, + { + "epoch": 3.1561026715557885, + "grad_norm": 0.666834244973884, + "learning_rate": 2.6790191702416405e-05, + "loss": 0.1704, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08771908283233643, + "step": 6025, + "valid_targets_mean": 1918.8, + "valid_targets_min": 746 + }, + { + "epoch": 3.1587218438973284, + "grad_norm": 0.7102588320192474, + "learning_rate": 2.676561423741368e-05, + "loss": 0.1574, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07976895570755005, + "step": 6030, + "valid_targets_mean": 1233.9, + "valid_targets_min": 781 + }, + { + "epoch": 3.1613410162388687, + "grad_norm": 0.6906103632403421, + "learning_rate": 2.6741025229787596e-05, + "loss": 0.1664, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08830182254314423, + "step": 6035, + "valid_targets_mean": 1608.4, + "valid_targets_min": 936 + }, + { + "epoch": 3.1639601885804085, + "grad_norm": 0.6967305793043933, + "learning_rate": 2.6716424721488752e-05, + "loss": 0.1628, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06965943425893784, + "step": 6040, + "valid_targets_mean": 1455.1, + "valid_targets_min": 902 + }, + { + "epoch": 3.166579360921949, + "grad_norm": 0.7506317658861008, + "learning_rate": 2.6691812754487395e-05, + "loss": 0.1675, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07598876953125, + "step": 6045, + "valid_targets_mean": 1266.8, + "valid_targets_min": 986 + }, + { + "epoch": 3.1691985332634887, + "grad_norm": 0.7362679513515235, + "learning_rate": 2.6667189370773302e-05, + "loss": 0.1637, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08343760669231415, + "step": 6050, + "valid_targets_mean": 1488.4, + "valid_targets_min": 1079 + }, + { + "epoch": 3.171817705605029, + "grad_norm": 0.6744924339491063, + "learning_rate": 2.664255461235573e-05, + "loss": 0.1608, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07914218306541443, + "step": 6055, + "valid_targets_mean": 1512.0, + "valid_targets_min": 1290 + }, + { + "epoch": 3.174436877946569, + "grad_norm": 0.7327687496774006, + "learning_rate": 2.6617908521263344e-05, + "loss": 0.1675, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08062729239463806, + "step": 6060, + "valid_targets_mean": 1439.5, + "valid_targets_min": 655 + }, + { + "epoch": 3.177056050288109, + "grad_norm": 0.7418671205008001, + "learning_rate": 2.659325113954415e-05, + "loss": 0.163, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06643374264240265, + "step": 6065, + "valid_targets_mean": 1297.6, + "valid_targets_min": 667 + }, + { + "epoch": 3.179675222629649, + "grad_norm": 0.7196932247817096, + "learning_rate": 2.6568582509265403e-05, + "loss": 0.1712, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0984589010477066, + "step": 6070, + "valid_targets_mean": 1918.1, + "valid_targets_min": 1041 + }, + { + "epoch": 3.1822943949711893, + "grad_norm": 0.7471858549275774, + "learning_rate": 2.6543902672513562e-05, + "loss": 0.1682, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.062356751412153244, + "step": 6075, + "valid_targets_mean": 1216.2, + "valid_targets_min": 684 + }, + { + "epoch": 3.184913567312729, + "grad_norm": 0.6739018916560132, + "learning_rate": 2.6519211671394196e-05, + "loss": 0.1662, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08063490688800812, + "step": 6080, + "valid_targets_mean": 1757.2, + "valid_targets_min": 821 + }, + { + "epoch": 3.1875327396542694, + "grad_norm": 0.7460699909826294, + "learning_rate": 2.6494509548031926e-05, + "loss": 0.1579, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0652986541390419, + "step": 6085, + "valid_targets_mean": 1021.8, + "valid_targets_min": 620 + }, + { + "epoch": 3.1901519119958093, + "grad_norm": 0.691870261331958, + "learning_rate": 2.6469796344570348e-05, + "loss": 0.1616, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09676294028759003, + "step": 6090, + "valid_targets_mean": 1853.4, + "valid_targets_min": 656 + }, + { + "epoch": 3.1927710843373496, + "grad_norm": 0.7070404191392444, + "learning_rate": 2.6445072103171952e-05, + "loss": 0.1657, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06507851183414459, + "step": 6095, + "valid_targets_mean": 1437.9, + "valid_targets_min": 697 + }, + { + "epoch": 3.1953902566788894, + "grad_norm": 0.7294314865976155, + "learning_rate": 2.6420336866018087e-05, + "loss": 0.1599, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08893925696611404, + "step": 6100, + "valid_targets_mean": 1716.4, + "valid_targets_min": 816 + }, + { + "epoch": 3.1980094290204297, + "grad_norm": 0.6705758424773739, + "learning_rate": 2.6395590675308826e-05, + "loss": 0.1553, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07986105233430862, + "step": 6105, + "valid_targets_mean": 1542.0, + "valid_targets_min": 959 + }, + { + "epoch": 3.2006286013619696, + "grad_norm": 0.7027299991646958, + "learning_rate": 2.6370833573262946e-05, + "loss": 0.1536, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06690247356891632, + "step": 6110, + "valid_targets_mean": 1193.2, + "valid_targets_min": 747 + }, + { + "epoch": 3.20324777370351, + "grad_norm": 0.7354964208411295, + "learning_rate": 2.634606560211785e-05, + "loss": 0.172, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07954400777816772, + "step": 6115, + "valid_targets_mean": 1542.4, + "valid_targets_min": 933 + }, + { + "epoch": 3.2058669460450497, + "grad_norm": 0.7110894716658694, + "learning_rate": 2.6321286804129465e-05, + "loss": 0.161, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08626635372638702, + "step": 6120, + "valid_targets_mean": 1575.0, + "valid_targets_min": 827 + }, + { + "epoch": 3.20848611838659, + "grad_norm": 0.6549484866958899, + "learning_rate": 2.62964972215722e-05, + "loss": 0.155, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06384006142616272, + "step": 6125, + "valid_targets_mean": 1332.8, + "valid_targets_min": 741 + }, + { + "epoch": 3.21110529072813, + "grad_norm": 0.6375353110419558, + "learning_rate": 2.6271696896738874e-05, + "loss": 0.1563, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06473011523485184, + "step": 6130, + "valid_targets_mean": 1391.2, + "valid_targets_min": 639 + }, + { + "epoch": 3.21372446306967, + "grad_norm": 0.7257128878637935, + "learning_rate": 2.62468858719406e-05, + "loss": 0.1481, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06425201892852783, + "step": 6135, + "valid_targets_mean": 1068.9, + "valid_targets_min": 743 + }, + { + "epoch": 3.21634363541121, + "grad_norm": 0.6736038952728773, + "learning_rate": 2.6222064189506782e-05, + "loss": 0.163, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06724032014608383, + "step": 6140, + "valid_targets_mean": 1378.8, + "valid_targets_min": 610 + }, + { + "epoch": 3.2189628077527503, + "grad_norm": 0.6862167359194624, + "learning_rate": 2.619723189178498e-05, + "loss": 0.1582, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07766151428222656, + "step": 6145, + "valid_targets_mean": 1417.6, + "valid_targets_min": 695 + }, + { + "epoch": 3.22158198009429, + "grad_norm": 0.6667822521852074, + "learning_rate": 2.6172389021140886e-05, + "loss": 0.1645, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10055532306432724, + "step": 6150, + "valid_targets_mean": 1966.2, + "valid_targets_min": 874 + }, + { + "epoch": 3.22420115243583, + "grad_norm": 0.6843734767884763, + "learning_rate": 2.6147535619958216e-05, + "loss": 0.1602, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07212713360786438, + "step": 6155, + "valid_targets_mean": 1374.0, + "valid_targets_min": 765 + }, + { + "epoch": 3.2268203247773704, + "grad_norm": 0.7478392776507355, + "learning_rate": 2.6122671730638657e-05, + "loss": 0.1606, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08449780195951462, + "step": 6160, + "valid_targets_mean": 1407.0, + "valid_targets_min": 816 + }, + { + "epoch": 3.2294394971189107, + "grad_norm": 0.6873028289484555, + "learning_rate": 2.6097797395601782e-05, + "loss": 0.1631, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07395478338003159, + "step": 6165, + "valid_targets_mean": 1474.1, + "valid_targets_min": 1054 + }, + { + "epoch": 3.2320586694604505, + "grad_norm": 0.4776467763544407, + "learning_rate": 2.6072912657285002e-05, + "loss": 0.1818, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0907076895236969, + "step": 6170, + "valid_targets_mean": 5532.4, + "valid_targets_min": 4247 + }, + { + "epoch": 3.2346778418019904, + "grad_norm": 0.3732618307241714, + "learning_rate": 2.6048017558143462e-05, + "loss": 0.1792, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09417170286178589, + "step": 6175, + "valid_targets_mean": 6763.9, + "valid_targets_min": 4329 + }, + { + "epoch": 3.2372970141435307, + "grad_norm": 0.38289420746438846, + "learning_rate": 2.602311214064998e-05, + "loss": 0.1681, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09114161133766174, + "step": 6180, + "valid_targets_mean": 5724.6, + "valid_targets_min": 4480 + }, + { + "epoch": 3.2399161864850705, + "grad_norm": 0.3836635906229439, + "learning_rate": 2.5998196447294996e-05, + "loss": 0.1735, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0969650000333786, + "step": 6185, + "valid_targets_mean": 5883.4, + "valid_targets_min": 4826 + }, + { + "epoch": 3.242535358826611, + "grad_norm": 0.3975060540969869, + "learning_rate": 2.5973270520586465e-05, + "loss": 0.1781, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09373161196708679, + "step": 6190, + "valid_targets_mean": 5766.0, + "valid_targets_min": 3983 + }, + { + "epoch": 3.2451545311681507, + "grad_norm": 0.37385141092856894, + "learning_rate": 2.5948334403049806e-05, + "loss": 0.1756, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08556351065635681, + "step": 6195, + "valid_targets_mean": 5980.8, + "valid_targets_min": 4998 + }, + { + "epoch": 3.247773703509691, + "grad_norm": 0.37349177636254594, + "learning_rate": 2.5923388137227825e-05, + "loss": 0.1826, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08874762803316116, + "step": 6200, + "valid_targets_mean": 5429.8, + "valid_targets_min": 4907 + }, + { + "epoch": 3.250392875851231, + "grad_norm": 0.4114694801622512, + "learning_rate": 2.5898431765680644e-05, + "loss": 0.1681, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11268821358680725, + "step": 6205, + "valid_targets_mean": 6900.6, + "valid_targets_min": 5066 + }, + { + "epoch": 3.253012048192771, + "grad_norm": 0.3587170860139122, + "learning_rate": 2.5873465330985625e-05, + "loss": 0.1901, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08456286787986755, + "step": 6210, + "valid_targets_mean": 7580.8, + "valid_targets_min": 4500 + }, + { + "epoch": 3.255631220534311, + "grad_norm": 0.35279536697085795, + "learning_rate": 2.5848488875737293e-05, + "loss": 0.1711, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08426110446453094, + "step": 6215, + "valid_targets_mean": 7422.6, + "valid_targets_min": 5455 + }, + { + "epoch": 3.2582503928758513, + "grad_norm": 0.35830411133344736, + "learning_rate": 2.582350244254728e-05, + "loss": 0.1814, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08689013123512268, + "step": 6220, + "valid_targets_mean": 7564.4, + "valid_targets_min": 4236 + }, + { + "epoch": 3.260869565217391, + "grad_norm": 0.34967856809357584, + "learning_rate": 2.5798506074044225e-05, + "loss": 0.1622, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08358441293239594, + "step": 6225, + "valid_targets_mean": 6671.9, + "valid_targets_min": 5315 + }, + { + "epoch": 3.2634887375589314, + "grad_norm": 0.35882018746504213, + "learning_rate": 2.577349981287373e-05, + "loss": 0.177, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08513113856315613, + "step": 6230, + "valid_targets_mean": 6717.1, + "valid_targets_min": 4353 + }, + { + "epoch": 3.2661079099004713, + "grad_norm": 0.35269541833504336, + "learning_rate": 2.5748483701698268e-05, + "loss": 0.1558, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0673292949795723, + "step": 6235, + "valid_targets_mean": 5959.0, + "valid_targets_min": 4890 + }, + { + "epoch": 3.2687270822420116, + "grad_norm": 0.3991951759169992, + "learning_rate": 2.5723457783197123e-05, + "loss": 0.1583, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06948716938495636, + "step": 6240, + "valid_targets_mean": 5842.4, + "valid_targets_min": 4526 + }, + { + "epoch": 3.2713462545835514, + "grad_norm": 0.3992626001867334, + "learning_rate": 2.569842210006631e-05, + "loss": 0.1743, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09178012609481812, + "step": 6245, + "valid_targets_mean": 5798.9, + "valid_targets_min": 4793 + }, + { + "epoch": 3.2739654269250917, + "grad_norm": 0.4381857179992536, + "learning_rate": 2.56733766950185e-05, + "loss": 0.1749, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08497138321399689, + "step": 6250, + "valid_targets_mean": 6176.4, + "valid_targets_min": 3967 + }, + { + "epoch": 3.2765845992666316, + "grad_norm": 0.38177694056915856, + "learning_rate": 2.5648321610782943e-05, + "loss": 0.1518, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08642652630805969, + "step": 6255, + "valid_targets_mean": 6440.4, + "valid_targets_min": 5009 + }, + { + "epoch": 3.279203771608172, + "grad_norm": 0.385214253629684, + "learning_rate": 2.5623256890105422e-05, + "loss": 0.1568, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07483935356140137, + "step": 6260, + "valid_targets_mean": 5954.2, + "valid_targets_min": 4703 + }, + { + "epoch": 3.2818229439497117, + "grad_norm": 0.41522487533898733, + "learning_rate": 2.559818257574814e-05, + "loss": 0.1597, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07940084487199783, + "step": 6265, + "valid_targets_mean": 5829.8, + "valid_targets_min": 4385 + }, + { + "epoch": 3.284442116291252, + "grad_norm": 0.3264798440861103, + "learning_rate": 2.5573098710489683e-05, + "loss": 0.1849, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08041777461767197, + "step": 6270, + "valid_targets_mean": 7655.0, + "valid_targets_min": 5133 + }, + { + "epoch": 3.287061288632792, + "grad_norm": 0.35577133900676294, + "learning_rate": 2.5548005337124924e-05, + "loss": 0.1673, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08044205605983734, + "step": 6275, + "valid_targets_mean": 6274.6, + "valid_targets_min": 4792 + }, + { + "epoch": 3.289680460974332, + "grad_norm": 0.3676349884831182, + "learning_rate": 2.552290249846496e-05, + "loss": 0.1662, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07401085644960403, + "step": 6280, + "valid_targets_mean": 6152.8, + "valid_targets_min": 3742 + }, + { + "epoch": 3.292299633315872, + "grad_norm": 0.367132421344028, + "learning_rate": 2.5497790237337024e-05, + "loss": 0.1776, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09174760431051254, + "step": 6285, + "valid_targets_mean": 7111.8, + "valid_targets_min": 4062 + }, + { + "epoch": 3.2949188056574124, + "grad_norm": 0.3723449977990775, + "learning_rate": 2.5472668596584448e-05, + "loss": 0.1928, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10043409466743469, + "step": 6290, + "valid_targets_mean": 6711.2, + "valid_targets_min": 4743 + }, + { + "epoch": 3.297537977998952, + "grad_norm": 0.37632408759519975, + "learning_rate": 2.5447537619066543e-05, + "loss": 0.2007, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10895048826932907, + "step": 6295, + "valid_targets_mean": 7476.6, + "valid_targets_min": 5764 + }, + { + "epoch": 3.3001571503404925, + "grad_norm": 0.3641846475597183, + "learning_rate": 2.5422397347658575e-05, + "loss": 0.1763, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08448459208011627, + "step": 6300, + "valid_targets_mean": 6018.8, + "valid_targets_min": 4789 + }, + { + "epoch": 3.3027763226820324, + "grad_norm": 0.3750578971526196, + "learning_rate": 2.539724782525164e-05, + "loss": 0.1751, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08280646055936813, + "step": 6305, + "valid_targets_mean": 6307.5, + "valid_targets_min": 4828 + }, + { + "epoch": 3.3053954950235727, + "grad_norm": 0.3903161585255933, + "learning_rate": 2.537208909475263e-05, + "loss": 0.1715, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0846589058637619, + "step": 6310, + "valid_targets_mean": 6349.4, + "valid_targets_min": 4671 + }, + { + "epoch": 3.3080146673651125, + "grad_norm": 0.363785247862675, + "learning_rate": 2.534692119908414e-05, + "loss": 0.1805, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10132154822349548, + "step": 6315, + "valid_targets_mean": 7190.0, + "valid_targets_min": 3850 + }, + { + "epoch": 3.310633839706653, + "grad_norm": 0.3708807504191291, + "learning_rate": 2.532174418118442e-05, + "loss": 0.1691, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09385242313146591, + "step": 6320, + "valid_targets_mean": 6765.5, + "valid_targets_min": 4951 + }, + { + "epoch": 3.3132530120481927, + "grad_norm": 0.3752398723516199, + "learning_rate": 2.5296558084007253e-05, + "loss": 0.1778, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09168010950088501, + "step": 6325, + "valid_targets_mean": 8050.8, + "valid_targets_min": 4794 + }, + { + "epoch": 3.315872184389733, + "grad_norm": 0.42307307827222046, + "learning_rate": 2.5271362950521935e-05, + "loss": 0.178, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09137772023677826, + "step": 6330, + "valid_targets_mean": 5186.9, + "valid_targets_min": 593 + }, + { + "epoch": 3.318491356731273, + "grad_norm": 0.3322795500595901, + "learning_rate": 2.5246158823713176e-05, + "loss": 0.1707, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07264706492424011, + "step": 6335, + "valid_targets_mean": 7296.5, + "valid_targets_min": 4633 + }, + { + "epoch": 3.321110529072813, + "grad_norm": 0.38299965795851554, + "learning_rate": 2.5220945746581014e-05, + "loss": 0.1528, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07251882553100586, + "step": 6340, + "valid_targets_mean": 6049.0, + "valid_targets_min": 5031 + }, + { + "epoch": 3.323729701414353, + "grad_norm": 0.41932734607392075, + "learning_rate": 2.5195723762140777e-05, + "loss": 0.1661, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08227471262216568, + "step": 6345, + "valid_targets_mean": 6290.0, + "valid_targets_min": 3987 + }, + { + "epoch": 3.3263488737558933, + "grad_norm": 0.404682250819354, + "learning_rate": 2.5170492913422973e-05, + "loss": 0.1794, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08566948771476746, + "step": 6350, + "valid_targets_mean": 6865.1, + "valid_targets_min": 5568 + }, + { + "epoch": 3.328968046097433, + "grad_norm": 0.4011956473179966, + "learning_rate": 2.514525324347325e-05, + "loss": 0.1775, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09244292974472046, + "step": 6355, + "valid_targets_mean": 6699.5, + "valid_targets_min": 4839 + }, + { + "epoch": 3.3315872184389734, + "grad_norm": 0.4092538401932468, + "learning_rate": 2.5120004795352287e-05, + "loss": 0.163, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07024848461151123, + "step": 6360, + "valid_targets_mean": 4793.9, + "valid_targets_min": 3517 + }, + { + "epoch": 3.3342063907805133, + "grad_norm": 0.3919155985895916, + "learning_rate": 2.509474761213576e-05, + "loss": 0.1621, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08399725705385208, + "step": 6365, + "valid_targets_mean": 6496.4, + "valid_targets_min": 4150 + }, + { + "epoch": 3.3368255631220536, + "grad_norm": 0.3956119853167681, + "learning_rate": 2.5069481736914218e-05, + "loss": 0.1712, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07363933324813843, + "step": 6370, + "valid_targets_mean": 5308.6, + "valid_targets_min": 4497 + }, + { + "epoch": 3.3394447354635934, + "grad_norm": 0.3820452027487794, + "learning_rate": 2.5044207212793073e-05, + "loss": 0.1754, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09037287533283234, + "step": 6375, + "valid_targets_mean": 7091.4, + "valid_targets_min": 6151 + }, + { + "epoch": 3.3420639078051337, + "grad_norm": 0.3997129999370939, + "learning_rate": 2.5018924082892465e-05, + "loss": 0.1641, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08182957768440247, + "step": 6380, + "valid_targets_mean": 5894.9, + "valid_targets_min": 4661 + }, + { + "epoch": 3.3446830801466736, + "grad_norm": 0.4120300525624395, + "learning_rate": 2.4993632390347234e-05, + "loss": 0.1639, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07934527844190598, + "step": 6385, + "valid_targets_mean": 5986.8, + "valid_targets_min": 4634 + }, + { + "epoch": 3.347302252488214, + "grad_norm": 0.3614429555300503, + "learning_rate": 2.4968332178306826e-05, + "loss": 0.181, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06840213388204575, + "step": 6390, + "valid_targets_mean": 5988.5, + "valid_targets_min": 4711 + }, + { + "epoch": 3.3499214248297537, + "grad_norm": 0.3601445269199851, + "learning_rate": 2.4943023489935215e-05, + "loss": 0.1499, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0641680657863617, + "step": 6395, + "valid_targets_mean": 5294.5, + "valid_targets_min": 4430 + }, + { + "epoch": 3.352540597171294, + "grad_norm": 0.3443049477813852, + "learning_rate": 2.4917706368410838e-05, + "loss": 0.1473, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07176784425973892, + "step": 6400, + "valid_targets_mean": 5903.9, + "valid_targets_min": 4701 + }, + { + "epoch": 3.355159769512834, + "grad_norm": 0.3638713448262528, + "learning_rate": 2.4892380856926517e-05, + "loss": 0.1559, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.084088534116745, + "step": 6405, + "valid_targets_mean": 6680.9, + "valid_targets_min": 4501 + }, + { + "epoch": 3.357778941854374, + "grad_norm": 0.3849187164924035, + "learning_rate": 2.48670469986894e-05, + "loss": 0.1594, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07608664035797119, + "step": 6410, + "valid_targets_mean": 5788.4, + "valid_targets_min": 3287 + }, + { + "epoch": 3.360398114195914, + "grad_norm": 0.3772639442062634, + "learning_rate": 2.4841704836920862e-05, + "loss": 0.1769, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08706492185592651, + "step": 6415, + "valid_targets_mean": 6215.6, + "valid_targets_min": 4881 + }, + { + "epoch": 3.3630172865374544, + "grad_norm": 0.41983338681278204, + "learning_rate": 2.481635441485645e-05, + "loss": 0.2065, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10334602743387222, + "step": 6420, + "valid_targets_mean": 7103.5, + "valid_targets_min": 4715 + }, + { + "epoch": 3.365636458878994, + "grad_norm": 0.3910223540701964, + "learning_rate": 2.479099577574581e-05, + "loss": 0.1692, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07273611426353455, + "step": 6425, + "valid_targets_mean": 5771.0, + "valid_targets_min": 4403 + }, + { + "epoch": 3.368255631220534, + "grad_norm": 0.41699640553441875, + "learning_rate": 2.4765628962852586e-05, + "loss": 0.1684, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08446206897497177, + "step": 6430, + "valid_targets_mean": 5611.8, + "valid_targets_min": 4657 + }, + { + "epoch": 3.3708748035620744, + "grad_norm": 0.36893431404927785, + "learning_rate": 2.474025401945439e-05, + "loss": 0.1673, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07603064179420471, + "step": 6435, + "valid_targets_mean": 6171.8, + "valid_targets_min": 4293 + }, + { + "epoch": 3.3734939759036147, + "grad_norm": 0.35851489921835866, + "learning_rate": 2.4714870988842696e-05, + "loss": 0.1805, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1075579822063446, + "step": 6440, + "valid_targets_mean": 6910.0, + "valid_targets_min": 6043 + }, + { + "epoch": 3.3761131482451545, + "grad_norm": 0.3877951110234821, + "learning_rate": 2.4689479914322777e-05, + "loss": 0.1807, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09149368107318878, + "step": 6445, + "valid_targets_mean": 7532.6, + "valid_targets_min": 4876 + }, + { + "epoch": 3.3787323205866944, + "grad_norm": 0.3565687477905426, + "learning_rate": 2.466408083921363e-05, + "loss": 0.1714, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07170824706554413, + "step": 6450, + "valid_targets_mean": 5248.0, + "valid_targets_min": 2545 + }, + { + "epoch": 3.3813514929282347, + "grad_norm": 0.38380382136855723, + "learning_rate": 2.4638673806847883e-05, + "loss": 0.1782, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08993254601955414, + "step": 6455, + "valid_targets_mean": 6254.9, + "valid_targets_min": 4800 + }, + { + "epoch": 3.383970665269775, + "grad_norm": 0.34414237325334873, + "learning_rate": 2.4613258860571782e-05, + "loss": 0.1533, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07681073248386383, + "step": 6460, + "valid_targets_mean": 6607.8, + "valid_targets_min": 4228 + }, + { + "epoch": 3.386589837611315, + "grad_norm": 0.3908809599404283, + "learning_rate": 2.4587836043745027e-05, + "loss": 0.1657, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07173924148082733, + "step": 6465, + "valid_targets_mean": 5782.5, + "valid_targets_min": 5099 + }, + { + "epoch": 3.3892090099528547, + "grad_norm": 0.37696518161027326, + "learning_rate": 2.4562405399740778e-05, + "loss": 0.2121, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06864018738269806, + "step": 6470, + "valid_targets_mean": 5704.1, + "valid_targets_min": 4157 + }, + { + "epoch": 3.391828182294395, + "grad_norm": 0.3668486070721226, + "learning_rate": 2.4536966971945536e-05, + "loss": 0.162, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07351751625537872, + "step": 6475, + "valid_targets_mean": 5938.6, + "valid_targets_min": 3930 + }, + { + "epoch": 3.3944473546359353, + "grad_norm": 0.44902743122082356, + "learning_rate": 2.4511520803759083e-05, + "loss": 0.1692, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08883160352706909, + "step": 6480, + "valid_targets_mean": 5714.6, + "valid_targets_min": 4876 + }, + { + "epoch": 3.397066526977475, + "grad_norm": 0.35888992094307914, + "learning_rate": 2.448606693859442e-05, + "loss": 0.1701, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08407334983348846, + "step": 6485, + "valid_targets_mean": 6711.4, + "valid_targets_min": 3054 + }, + { + "epoch": 3.399685699319015, + "grad_norm": 0.3671497425717947, + "learning_rate": 2.4460605419877652e-05, + "loss": 0.1675, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07031820714473724, + "step": 6490, + "valid_targets_mean": 6126.9, + "valid_targets_min": 4670 + }, + { + "epoch": 3.4023048716605553, + "grad_norm": 0.37887286091801736, + "learning_rate": 2.443513629104796e-05, + "loss": 0.1521, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08363084495067596, + "step": 6495, + "valid_targets_mean": 7143.2, + "valid_targets_min": 4806 + }, + { + "epoch": 3.4049240440020956, + "grad_norm": 0.3911340464093035, + "learning_rate": 2.4409659595557507e-05, + "loss": 0.1633, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07207661122083664, + "step": 6500, + "valid_targets_mean": 5455.6, + "valid_targets_min": 4453 + }, + { + "epoch": 3.4075432163436354, + "grad_norm": 0.3721682476509893, + "learning_rate": 2.4384175376871366e-05, + "loss": 0.1597, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08851202577352524, + "step": 6505, + "valid_targets_mean": 7124.2, + "valid_targets_min": 4935 + }, + { + "epoch": 3.4101623886851753, + "grad_norm": 0.39766714127910935, + "learning_rate": 2.4358683678467442e-05, + "loss": 0.1544, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07665763795375824, + "step": 6510, + "valid_targets_mean": 7344.5, + "valid_targets_min": 4964 + }, + { + "epoch": 3.4127815610267156, + "grad_norm": 0.3385291733527547, + "learning_rate": 2.43331845438364e-05, + "loss": 0.1649, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08365072309970856, + "step": 6515, + "valid_targets_mean": 7247.2, + "valid_targets_min": 5625 + }, + { + "epoch": 3.4154007333682554, + "grad_norm": 0.35181977929673425, + "learning_rate": 2.4307678016481595e-05, + "loss": 0.1668, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.087459996342659, + "step": 6520, + "valid_targets_mean": 7612.6, + "valid_targets_min": 5389 + }, + { + "epoch": 3.4180199057097957, + "grad_norm": 0.3599454329463783, + "learning_rate": 2.428216413991899e-05, + "loss": 0.1545, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07323252409696579, + "step": 6525, + "valid_targets_mean": 6254.5, + "valid_targets_min": 4220 + }, + { + "epoch": 3.4206390780513356, + "grad_norm": 0.3638509969197595, + "learning_rate": 2.4256642957677096e-05, + "loss": 0.1704, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09068848192691803, + "step": 6530, + "valid_targets_mean": 7109.0, + "valid_targets_min": 5071 + }, + { + "epoch": 3.423258250392876, + "grad_norm": 0.39786519172694557, + "learning_rate": 2.4231114513296868e-05, + "loss": 0.1699, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0803876668214798, + "step": 6535, + "valid_targets_mean": 5811.4, + "valid_targets_min": 2560 + }, + { + "epoch": 3.4258774227344158, + "grad_norm": 0.5287233305230999, + "learning_rate": 2.420557885033168e-05, + "loss": 0.1821, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.106256864964962, + "step": 6540, + "valid_targets_mean": 4137.9, + "valid_targets_min": 1320 + }, + { + "epoch": 3.428496595075956, + "grad_norm": 0.4864357882653739, + "learning_rate": 2.4180036012347197e-05, + "loss": 0.2588, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08376993238925934, + "step": 6545, + "valid_targets_mean": 3768.8, + "valid_targets_min": 746 + }, + { + "epoch": 3.431115767417496, + "grad_norm": 0.4495192508104731, + "learning_rate": 2.415448604292133e-05, + "loss": 0.2463, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11839775741100311, + "step": 6550, + "valid_targets_mean": 5086.6, + "valid_targets_min": 1846 + }, + { + "epoch": 3.433734939759036, + "grad_norm": 0.45948985894295946, + "learning_rate": 2.4128928985644165e-05, + "loss": 0.2382, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0898493304848671, + "step": 6555, + "valid_targets_mean": 3826.8, + "valid_targets_min": 1321 + }, + { + "epoch": 3.436354112100576, + "grad_norm": 0.47832825522476635, + "learning_rate": 2.4103364884117878e-05, + "loss": 0.2433, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13066086173057556, + "step": 6560, + "valid_targets_mean": 6475.0, + "valid_targets_min": 3049 + }, + { + "epoch": 3.4389732844421164, + "grad_norm": 0.5336403968678465, + "learning_rate": 2.4077793781956652e-05, + "loss": 0.2531, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12808701395988464, + "step": 6565, + "valid_targets_mean": 4328.6, + "valid_targets_min": 2075 + }, + { + "epoch": 3.441592456783656, + "grad_norm": 0.4749600720867551, + "learning_rate": 2.4052215722786635e-05, + "loss": 0.2466, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12571166455745697, + "step": 6570, + "valid_targets_mean": 5135.4, + "valid_targets_min": 1991 + }, + { + "epoch": 3.4442116291251965, + "grad_norm": 0.5402532183284965, + "learning_rate": 2.4026630750245823e-05, + "loss": 0.239, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11091949045658112, + "step": 6575, + "valid_targets_mean": 3699.0, + "valid_targets_min": 1665 + }, + { + "epoch": 3.4468308014667364, + "grad_norm": 0.49991999722513, + "learning_rate": 2.4001038907984015e-05, + "loss": 0.2452, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11975577473640442, + "step": 6580, + "valid_targets_mean": 4666.8, + "valid_targets_min": 578 + }, + { + "epoch": 3.4494499738082767, + "grad_norm": 0.49919660827363055, + "learning_rate": 2.3975440239662724e-05, + "loss": 0.2529, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11430370062589645, + "step": 6585, + "valid_targets_mean": 4916.1, + "valid_targets_min": 1241 + }, + { + "epoch": 3.4520691461498165, + "grad_norm": 0.5215501546589721, + "learning_rate": 2.3949834788955136e-05, + "loss": 0.2468, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12626492977142334, + "step": 6590, + "valid_targets_mean": 4525.4, + "valid_targets_min": 2726 + }, + { + "epoch": 3.454688318491357, + "grad_norm": 0.4371477610579171, + "learning_rate": 2.3924222599545967e-05, + "loss": 0.2403, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11062407493591309, + "step": 6595, + "valid_targets_mean": 6055.0, + "valid_targets_min": 2639 + }, + { + "epoch": 3.4573074908328967, + "grad_norm": 0.513368675015223, + "learning_rate": 2.3898603715131455e-05, + "loss": 0.2417, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1264042854309082, + "step": 6600, + "valid_targets_mean": 5447.0, + "valid_targets_min": 2244 + }, + { + "epoch": 3.459926663174437, + "grad_norm": 0.49105031757605666, + "learning_rate": 2.387297817941926e-05, + "loss": 0.2469, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1250518560409546, + "step": 6605, + "valid_targets_mean": 5634.1, + "valid_targets_min": 3076 + }, + { + "epoch": 3.462545835515977, + "grad_norm": 0.5547062342359849, + "learning_rate": 2.384734603612838e-05, + "loss": 0.2418, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13765278458595276, + "step": 6610, + "valid_targets_mean": 4215.6, + "valid_targets_min": 1721 + }, + { + "epoch": 3.465165007857517, + "grad_norm": 0.5817376589491438, + "learning_rate": 2.382170732898909e-05, + "loss": 0.2483, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11693128943443298, + "step": 6615, + "valid_targets_mean": 3667.0, + "valid_targets_min": 1705 + }, + { + "epoch": 3.467784180199057, + "grad_norm": 0.658845436501259, + "learning_rate": 2.3796062101742864e-05, + "loss": 0.2313, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10137315094470978, + "step": 6620, + "valid_targets_mean": 3136.5, + "valid_targets_min": 1538 + }, + { + "epoch": 3.4704033525405973, + "grad_norm": 0.5716954504474003, + "learning_rate": 2.3770410398142307e-05, + "loss": 0.2416, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09106269478797913, + "step": 6625, + "valid_targets_mean": 3045.5, + "valid_targets_min": 1451 + }, + { + "epoch": 3.473022524882137, + "grad_norm": 0.560592583138159, + "learning_rate": 2.374475226195106e-05, + "loss": 0.2523, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12927128374576569, + "step": 6630, + "valid_targets_mean": 4635.6, + "valid_targets_min": 2560 + }, + { + "epoch": 3.4756416972236774, + "grad_norm": 0.579320179595869, + "learning_rate": 2.371908773694375e-05, + "loss": 0.2516, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11526928842067719, + "step": 6635, + "valid_targets_mean": 3925.4, + "valid_targets_min": 1612 + }, + { + "epoch": 3.4782608695652173, + "grad_norm": 0.5839141166219242, + "learning_rate": 2.3693416866905885e-05, + "loss": 0.2478, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14135050773620605, + "step": 6640, + "valid_targets_mean": 4462.9, + "valid_targets_min": 1921 + }, + { + "epoch": 3.4808800419067576, + "grad_norm": 0.5435071521477286, + "learning_rate": 2.3667739695633825e-05, + "loss": 0.2324, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11711271107196808, + "step": 6645, + "valid_targets_mean": 4697.6, + "valid_targets_min": 2004 + }, + { + "epoch": 3.4834992142482974, + "grad_norm": 0.5813285853264689, + "learning_rate": 2.364205626693466e-05, + "loss": 0.2436, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09046830236911774, + "step": 6650, + "valid_targets_mean": 3302.0, + "valid_targets_min": 1896 + }, + { + "epoch": 3.4861183865898377, + "grad_norm": 0.6399815223156761, + "learning_rate": 2.3616366624626165e-05, + "loss": 0.2234, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1311061531305313, + "step": 6655, + "valid_targets_mean": 3412.4, + "valid_targets_min": 1846 + }, + { + "epoch": 3.4887375589313776, + "grad_norm": 0.6133645420794462, + "learning_rate": 2.3590670812536713e-05, + "loss": 0.2467, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15300464630126953, + "step": 6660, + "valid_targets_mean": 4289.0, + "valid_targets_min": 3360 + }, + { + "epoch": 3.491356731272918, + "grad_norm": 0.551325447894351, + "learning_rate": 2.3564968874505202e-05, + "loss": 0.2386, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11628319323062897, + "step": 6665, + "valid_targets_mean": 3717.1, + "valid_targets_min": 1475 + }, + { + "epoch": 3.4939759036144578, + "grad_norm": 0.5698229078957439, + "learning_rate": 2.3539260854380982e-05, + "loss": 0.2414, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1304197609424591, + "step": 6670, + "valid_targets_mean": 4400.9, + "valid_targets_min": 2229 + }, + { + "epoch": 3.496595075955998, + "grad_norm": 0.5828878520133568, + "learning_rate": 2.3513546796023783e-05, + "loss": 0.2437, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10436005890369415, + "step": 6675, + "valid_targets_mean": 3238.2, + "valid_targets_min": 1233 + }, + { + "epoch": 3.499214248297538, + "grad_norm": 0.5919028438370402, + "learning_rate": 2.348782674330363e-05, + "loss": 0.2283, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10672833770513535, + "step": 6680, + "valid_targets_mean": 3109.8, + "valid_targets_min": 869 + }, + { + "epoch": 3.501833420639078, + "grad_norm": 0.5296272359340188, + "learning_rate": 2.346210074010078e-05, + "loss": 0.2397, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1168830394744873, + "step": 6685, + "valid_targets_mean": 4352.0, + "valid_targets_min": 1781 + }, + { + "epoch": 3.504452592980618, + "grad_norm": 0.6155343206368286, + "learning_rate": 2.343636883030564e-05, + "loss": 0.2366, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1330322027206421, + "step": 6690, + "valid_targets_mean": 3687.0, + "valid_targets_min": 1108 + }, + { + "epoch": 3.5070717653221584, + "grad_norm": 0.636116669556504, + "learning_rate": 2.3410631057818703e-05, + "loss": 0.2323, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11047638952732086, + "step": 6695, + "valid_targets_mean": 2814.9, + "valid_targets_min": 1913 + }, + { + "epoch": 3.509690937663698, + "grad_norm": 0.5987881246802838, + "learning_rate": 2.338488746655044e-05, + "loss": 0.2361, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13345681130886078, + "step": 6700, + "valid_targets_mean": 4176.2, + "valid_targets_min": 1828 + }, + { + "epoch": 3.512310110005238, + "grad_norm": 0.5727757188547329, + "learning_rate": 2.3359138100421274e-05, + "loss": 0.2405, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10748310387134552, + "step": 6705, + "valid_targets_mean": 3962.1, + "valid_targets_min": 1589 + }, + { + "epoch": 3.5149292823467784, + "grad_norm": 0.6323122660725055, + "learning_rate": 2.333338300336147e-05, + "loss": 0.2282, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11577625572681427, + "step": 6710, + "valid_targets_mean": 3307.2, + "valid_targets_min": 2289 + }, + { + "epoch": 3.5175484546883187, + "grad_norm": 0.605942931678382, + "learning_rate": 2.3307622219311078e-05, + "loss": 0.2331, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08664129674434662, + "step": 6715, + "valid_targets_mean": 2650.5, + "valid_targets_min": 1248 + }, + { + "epoch": 3.5201676270298585, + "grad_norm": 0.5885722207923769, + "learning_rate": 2.3281855792219834e-05, + "loss": 0.2449, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10523630678653717, + "step": 6720, + "valid_targets_mean": 3181.0, + "valid_targets_min": 1727 + }, + { + "epoch": 3.5227867993713984, + "grad_norm": 0.569475051288075, + "learning_rate": 2.3256083766047113e-05, + "loss": 0.2351, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13042029738426208, + "step": 6725, + "valid_targets_mean": 4625.5, + "valid_targets_min": 1965 + }, + { + "epoch": 3.5254059717129387, + "grad_norm": 0.583999831780277, + "learning_rate": 2.3230306184761853e-05, + "loss": 0.2294, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13146890699863434, + "step": 6730, + "valid_targets_mean": 3945.2, + "valid_targets_min": 2018 + }, + { + "epoch": 3.528025144054479, + "grad_norm": 0.565115221902501, + "learning_rate": 2.3204523092342442e-05, + "loss": 0.2331, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11057507246732712, + "step": 6735, + "valid_targets_mean": 4180.6, + "valid_targets_min": 1730 + }, + { + "epoch": 3.530644316396019, + "grad_norm": 0.5907782420435588, + "learning_rate": 2.3178734532776685e-05, + "loss": 0.2432, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12093518674373627, + "step": 6740, + "valid_targets_mean": 3331.2, + "valid_targets_min": 2097 + }, + { + "epoch": 3.5332634887375587, + "grad_norm": 0.6428180267374662, + "learning_rate": 2.3152940550061728e-05, + "loss": 0.2298, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13893792033195496, + "step": 6745, + "valid_targets_mean": 3802.9, + "valid_targets_min": 1648 + }, + { + "epoch": 3.535882661079099, + "grad_norm": 0.5816173407043932, + "learning_rate": 2.3127141188203948e-05, + "loss": 0.2391, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10701972246170044, + "step": 6750, + "valid_targets_mean": 3595.1, + "valid_targets_min": 1421 + }, + { + "epoch": 3.5385018334206393, + "grad_norm": 0.6058804924806588, + "learning_rate": 2.3101336491218916e-05, + "loss": 0.2344, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12693704664707184, + "step": 6755, + "valid_targets_mean": 3734.4, + "valid_targets_min": 2284 + }, + { + "epoch": 3.541121005762179, + "grad_norm": 0.5241777612491162, + "learning_rate": 2.3075526503131283e-05, + "loss": 0.2231, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10609862208366394, + "step": 6760, + "valid_targets_mean": 4147.4, + "valid_targets_min": 2095 + }, + { + "epoch": 3.543740178103719, + "grad_norm": 0.5964242963664286, + "learning_rate": 2.304971126797475e-05, + "loss": 0.2321, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09846395254135132, + "step": 6765, + "valid_targets_mean": 3100.2, + "valid_targets_min": 1673 + }, + { + "epoch": 3.5463593504452593, + "grad_norm": 0.5303796472746766, + "learning_rate": 2.302389082979196e-05, + "loss": 0.24, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13052743673324585, + "step": 6770, + "valid_targets_mean": 4951.2, + "valid_targets_min": 2067 + }, + { + "epoch": 3.5489785227867996, + "grad_norm": 0.5751260888215624, + "learning_rate": 2.2998065232634428e-05, + "loss": 0.2326, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.087217777967453, + "step": 6775, + "valid_targets_mean": 2375.2, + "valid_targets_min": 742 + }, + { + "epoch": 3.5515976951283394, + "grad_norm": 0.5669176050593572, + "learning_rate": 2.2972234520562485e-05, + "loss": 0.2438, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1378200203180313, + "step": 6780, + "valid_targets_mean": 4786.8, + "valid_targets_min": 1766 + }, + { + "epoch": 3.5542168674698793, + "grad_norm": 0.6453716565668436, + "learning_rate": 2.2946398737645173e-05, + "loss": 0.2309, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11073620617389679, + "step": 6785, + "valid_targets_mean": 3331.2, + "valid_targets_min": 1504 + }, + { + "epoch": 3.5568360398114196, + "grad_norm": 0.5577886544254315, + "learning_rate": 2.292055792796019e-05, + "loss": 0.2386, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10144495964050293, + "step": 6790, + "valid_targets_mean": 3742.8, + "valid_targets_min": 1170 + }, + { + "epoch": 3.55945521215296, + "grad_norm": 0.6007736438160111, + "learning_rate": 2.2894712135593816e-05, + "loss": 0.2297, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11968302726745605, + "step": 6795, + "valid_targets_mean": 3477.5, + "valid_targets_min": 2669 + }, + { + "epoch": 3.5620743844944998, + "grad_norm": 0.5852908871471947, + "learning_rate": 2.2868861404640826e-05, + "loss": 0.2415, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11945214867591858, + "step": 6800, + "valid_targets_mean": 3669.4, + "valid_targets_min": 2923 + }, + { + "epoch": 3.5646935568360396, + "grad_norm": 0.527808683195503, + "learning_rate": 2.2843005779204424e-05, + "loss": 0.225, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09395307302474976, + "step": 6805, + "valid_targets_mean": 3643.6, + "valid_targets_min": 2756 + }, + { + "epoch": 3.56731272917758, + "grad_norm": 0.5576057861287207, + "learning_rate": 2.2817145303396155e-05, + "loss": 0.2229, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11294896900653839, + "step": 6810, + "valid_targets_mean": 4241.8, + "valid_targets_min": 2526 + }, + { + "epoch": 3.56993190151912, + "grad_norm": 0.5501081807405083, + "learning_rate": 2.279128002133586e-05, + "loss": 0.2163, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12715858221054077, + "step": 6815, + "valid_targets_mean": 5317.1, + "valid_targets_min": 464 + }, + { + "epoch": 3.57255107386066, + "grad_norm": 0.5597244011271181, + "learning_rate": 2.276540997715155e-05, + "loss": 0.2481, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1311587691307068, + "step": 6820, + "valid_targets_mean": 4387.4, + "valid_targets_min": 1003 + }, + { + "epoch": 3.5751702462022, + "grad_norm": 0.5704061903557548, + "learning_rate": 2.273953521497938e-05, + "loss": 0.231, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12439266592264175, + "step": 6825, + "valid_targets_mean": 3934.6, + "valid_targets_min": 1632 + }, + { + "epoch": 3.57778941854374, + "grad_norm": 0.5752906314810322, + "learning_rate": 2.2713655778963563e-05, + "loss": 0.2361, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1213194727897644, + "step": 6830, + "valid_targets_mean": 3808.1, + "valid_targets_min": 1969 + }, + { + "epoch": 3.5804085908852805, + "grad_norm": 0.559386966041707, + "learning_rate": 2.268777171325626e-05, + "loss": 0.2282, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09403820335865021, + "step": 6835, + "valid_targets_mean": 3318.8, + "valid_targets_min": 1491 + }, + { + "epoch": 3.5830277632268204, + "grad_norm": 0.6160088400557124, + "learning_rate": 2.2661883062017558e-05, + "loss": 0.247, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13603980839252472, + "step": 6840, + "valid_targets_mean": 4169.9, + "valid_targets_min": 1637 + }, + { + "epoch": 3.5856469355683602, + "grad_norm": 0.522822036080833, + "learning_rate": 2.263598986941534e-05, + "loss": 0.2344, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10942547023296356, + "step": 6845, + "valid_targets_mean": 3640.1, + "valid_targets_min": 1818 + }, + { + "epoch": 3.5882661079099005, + "grad_norm": 0.5866234190352576, + "learning_rate": 2.261009217962526e-05, + "loss": 0.2264, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12125527113676071, + "step": 6850, + "valid_targets_mean": 3803.0, + "valid_targets_min": 1523 + }, + { + "epoch": 3.5908852802514404, + "grad_norm": 0.5786354258156285, + "learning_rate": 2.2584190036830635e-05, + "loss": 0.2248, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1317993700504303, + "step": 6855, + "valid_targets_mean": 4696.1, + "valid_targets_min": 1814 + }, + { + "epoch": 3.5935044525929807, + "grad_norm": 0.6453915038756044, + "learning_rate": 2.2558283485222367e-05, + "loss": 0.2222, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12326325476169586, + "step": 6860, + "valid_targets_mean": 3022.9, + "valid_targets_min": 1073 + }, + { + "epoch": 3.5961236249345205, + "grad_norm": 0.5588512120546468, + "learning_rate": 2.2532372568998903e-05, + "loss": 0.2207, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10281728953123093, + "step": 6865, + "valid_targets_mean": 3355.5, + "valid_targets_min": 1654 + }, + { + "epoch": 3.598742797276061, + "grad_norm": 0.6307951883780548, + "learning_rate": 2.2506457332366124e-05, + "loss": 0.2149, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1167975515127182, + "step": 6870, + "valid_targets_mean": 3669.1, + "valid_targets_min": 1079 + }, + { + "epoch": 3.6013619696176007, + "grad_norm": 0.6086990493021137, + "learning_rate": 2.2480537819537293e-05, + "loss": 0.2127, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08841513097286224, + "step": 6875, + "valid_targets_mean": 3073.5, + "valid_targets_min": 1143 + }, + { + "epoch": 3.603981141959141, + "grad_norm": 0.581842629892961, + "learning_rate": 2.2454614074732936e-05, + "loss": 0.2208, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0971125066280365, + "step": 6880, + "valid_targets_mean": 3300.2, + "valid_targets_min": 1853 + }, + { + "epoch": 3.606600314300681, + "grad_norm": 0.6784781899860668, + "learning_rate": 2.242868614218084e-05, + "loss": 0.2494, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1171766147017479, + "step": 6885, + "valid_targets_mean": 3122.8, + "valid_targets_min": 1410 + }, + { + "epoch": 3.609219486642221, + "grad_norm": 0.6675489122087376, + "learning_rate": 2.2402754066115905e-05, + "loss": 0.2223, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09704920649528503, + "step": 6890, + "valid_targets_mean": 2564.8, + "valid_targets_min": 1566 + }, + { + "epoch": 3.611838658983761, + "grad_norm": 0.603871032055132, + "learning_rate": 2.2376817890780128e-05, + "loss": 0.2345, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11461576819419861, + "step": 6895, + "valid_targets_mean": 3865.4, + "valid_targets_min": 2335 + }, + { + "epoch": 3.6144578313253013, + "grad_norm": 0.5921554960682128, + "learning_rate": 2.2350877660422475e-05, + "loss": 0.2244, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11522124707698822, + "step": 6900, + "valid_targets_mean": 3269.5, + "valid_targets_min": 1255 + }, + { + "epoch": 3.617077003666841, + "grad_norm": 0.6134455521032701, + "learning_rate": 2.232493341929885e-05, + "loss": 0.2233, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12292369455099106, + "step": 6905, + "valid_targets_mean": 3915.5, + "valid_targets_min": 2355 + }, + { + "epoch": 3.6196961760083814, + "grad_norm": 0.5872835124432654, + "learning_rate": 2.2298985211671975e-05, + "loss": 0.222, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09926629066467285, + "step": 6910, + "valid_targets_mean": 3704.9, + "valid_targets_min": 1281 + }, + { + "epoch": 3.6223153483499213, + "grad_norm": 0.8559885474385842, + "learning_rate": 2.2273033081811367e-05, + "loss": 0.2233, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12465713173151016, + "step": 6915, + "valid_targets_mean": 3788.6, + "valid_targets_min": 1836 + }, + { + "epoch": 3.6249345206914616, + "grad_norm": 0.5607531279508331, + "learning_rate": 2.2247077073993217e-05, + "loss": 0.2284, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15465277433395386, + "step": 6920, + "valid_targets_mean": 5778.1, + "valid_targets_min": 4218 + }, + { + "epoch": 3.6275536930330015, + "grad_norm": 0.5709923678031399, + "learning_rate": 2.222111723250034e-05, + "loss": 0.2229, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11252649128437042, + "step": 6925, + "valid_targets_mean": 3982.6, + "valid_targets_min": 2717 + }, + { + "epoch": 3.6301728653745418, + "grad_norm": 0.6328013307602074, + "learning_rate": 2.219515360162208e-05, + "loss": 0.2268, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11584963649511337, + "step": 6930, + "valid_targets_mean": 2804.9, + "valid_targets_min": 1171 + }, + { + "epoch": 3.6327920377160816, + "grad_norm": 0.5784454533017686, + "learning_rate": 2.2169186225654266e-05, + "loss": 0.2368, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12169316411018372, + "step": 6935, + "valid_targets_mean": 4265.1, + "valid_targets_min": 2177 + }, + { + "epoch": 3.635411210057622, + "grad_norm": 0.5440171631544455, + "learning_rate": 2.2143215148899094e-05, + "loss": 0.2311, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11516569554805756, + "step": 6940, + "valid_targets_mean": 4090.0, + "valid_targets_min": 2368 + }, + { + "epoch": 3.6380303823991618, + "grad_norm": 0.5768498905763396, + "learning_rate": 2.2117240415665093e-05, + "loss": 0.2383, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10153605788946152, + "step": 6945, + "valid_targets_mean": 4149.6, + "valid_targets_min": 2294 + }, + { + "epoch": 3.640649554740702, + "grad_norm": 0.6149359693531732, + "learning_rate": 2.2091262070267017e-05, + "loss": 0.2373, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13069310784339905, + "step": 6950, + "valid_targets_mean": 3977.1, + "valid_targets_min": 1135 + }, + { + "epoch": 3.643268727082242, + "grad_norm": 0.5984225983630644, + "learning_rate": 2.2065280157025786e-05, + "loss": 0.233, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12294389307498932, + "step": 6955, + "valid_targets_mean": 4319.0, + "valid_targets_min": 1449 + }, + { + "epoch": 3.645887899423782, + "grad_norm": 0.6470752148570302, + "learning_rate": 2.2039294720268413e-05, + "loss": 0.2417, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13006079196929932, + "step": 6960, + "valid_targets_mean": 3227.5, + "valid_targets_min": 1400 + }, + { + "epoch": 3.648507071765322, + "grad_norm": 0.5732468220240098, + "learning_rate": 2.2013305804327923e-05, + "loss": 0.2405, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0939599871635437, + "step": 6965, + "valid_targets_mean": 3268.4, + "valid_targets_min": 1433 + }, + { + "epoch": 3.6511262441068624, + "grad_norm": 0.6066086118447095, + "learning_rate": 2.1987313453543254e-05, + "loss": 0.2222, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08269931375980377, + "step": 6970, + "valid_targets_mean": 2946.5, + "valid_targets_min": 614 + }, + { + "epoch": 3.6537454164484022, + "grad_norm": 0.6271052804557808, + "learning_rate": 2.1961317712259237e-05, + "loss": 0.2292, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09952224791049957, + "step": 6975, + "valid_targets_mean": 3125.0, + "valid_targets_min": 2041 + }, + { + "epoch": 3.6563645887899425, + "grad_norm": 0.6305679688576481, + "learning_rate": 2.193531862482646e-05, + "loss": 0.2385, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12361295521259308, + "step": 6980, + "valid_targets_mean": 3852.9, + "valid_targets_min": 1333 + }, + { + "epoch": 3.6589837611314824, + "grad_norm": 0.5632433130439336, + "learning_rate": 2.1909316235601246e-05, + "loss": 0.2278, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09937632083892822, + "step": 6985, + "valid_targets_mean": 3973.2, + "valid_targets_min": 1325 + }, + { + "epoch": 3.6616029334730227, + "grad_norm": 0.5264059565376541, + "learning_rate": 2.1883310588945523e-05, + "loss": 0.2266, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08674407750368118, + "step": 6990, + "valid_targets_mean": 3510.1, + "valid_targets_min": 2439 + }, + { + "epoch": 3.6642221058145625, + "grad_norm": 0.5763460513999769, + "learning_rate": 2.18573017292268e-05, + "loss": 0.2196, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11072199046611786, + "step": 6995, + "valid_targets_mean": 3699.4, + "valid_targets_min": 2651 + }, + { + "epoch": 3.666841278156103, + "grad_norm": 0.6203362612539552, + "learning_rate": 2.1831289700818058e-05, + "loss": 0.2313, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1367991864681244, + "step": 7000, + "valid_targets_mean": 4253.4, + "valid_targets_min": 1076 + }, + { + "epoch": 3.6694604504976427, + "grad_norm": 0.5640191516108097, + "learning_rate": 2.1805274548097675e-05, + "loss": 0.2136, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12644751369953156, + "step": 7005, + "valid_targets_mean": 5076.9, + "valid_targets_min": 2127 + }, + { + "epoch": 3.672079622839183, + "grad_norm": 0.5677460744297587, + "learning_rate": 2.177925631544937e-05, + "loss": 0.2324, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11261679232120514, + "step": 7010, + "valid_targets_mean": 4415.2, + "valid_targets_min": 3904 + }, + { + "epoch": 3.674698795180723, + "grad_norm": 0.6044780997676237, + "learning_rate": 2.1753235047262124e-05, + "loss": 0.2288, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08222821354866028, + "step": 7015, + "valid_targets_mean": 2814.0, + "valid_targets_min": 793 + }, + { + "epoch": 3.6773179675222627, + "grad_norm": 0.5698177819651197, + "learning_rate": 2.172721078793008e-05, + "loss": 0.2298, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11177408695220947, + "step": 7020, + "valid_targets_mean": 4488.0, + "valid_targets_min": 1777 + }, + { + "epoch": 3.679937139863803, + "grad_norm": 0.5685644784817925, + "learning_rate": 2.1701183581852497e-05, + "loss": 0.2233, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10050319135189056, + "step": 7025, + "valid_targets_mean": 3447.1, + "valid_targets_min": 1965 + }, + { + "epoch": 3.6825563122053433, + "grad_norm": 0.5914313903231709, + "learning_rate": 2.1675153473433653e-05, + "loss": 0.2323, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1289793699979782, + "step": 7030, + "valid_targets_mean": 4516.6, + "valid_targets_min": 1206 + }, + { + "epoch": 3.685175484546883, + "grad_norm": 0.5416343694362858, + "learning_rate": 2.1649120507082776e-05, + "loss": 0.2272, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1228301003575325, + "step": 7035, + "valid_targets_mean": 5388.2, + "valid_targets_min": 3599 + }, + { + "epoch": 3.687794656888423, + "grad_norm": 0.5824407282519591, + "learning_rate": 2.162308472721398e-05, + "loss": 0.2155, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10571618378162384, + "step": 7040, + "valid_targets_mean": 3637.1, + "valid_targets_min": 1250 + }, + { + "epoch": 3.6904138292299633, + "grad_norm": 0.5941806822380946, + "learning_rate": 2.1597046178246174e-05, + "loss": 0.2169, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11149287968873978, + "step": 7045, + "valid_targets_mean": 4201.2, + "valid_targets_min": 1876 + }, + { + "epoch": 3.6930330015715036, + "grad_norm": 0.5393176593744349, + "learning_rate": 2.1571004904602993e-05, + "loss": 0.2183, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11081297695636749, + "step": 7050, + "valid_targets_mean": 4462.0, + "valid_targets_min": 2487 + }, + { + "epoch": 3.6956521739130435, + "grad_norm": 0.5873772296357762, + "learning_rate": 2.154496095071272e-05, + "loss": 0.2192, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09898903965950012, + "step": 7055, + "valid_targets_mean": 3380.9, + "valid_targets_min": 1360 + }, + { + "epoch": 3.6982713462545833, + "grad_norm": 0.589105360240938, + "learning_rate": 2.1518914361008197e-05, + "loss": 0.2138, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11599930375814438, + "step": 7060, + "valid_targets_mean": 4094.6, + "valid_targets_min": 1496 + }, + { + "epoch": 3.7008905185961236, + "grad_norm": 0.6242763783101974, + "learning_rate": 2.1492865179926786e-05, + "loss": 0.2138, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12099158763885498, + "step": 7065, + "valid_targets_mean": 3533.5, + "valid_targets_min": 2059 + }, + { + "epoch": 3.703509690937664, + "grad_norm": 0.579993260527459, + "learning_rate": 2.1466813451910253e-05, + "loss": 0.217, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11872360855340958, + "step": 7070, + "valid_targets_mean": 4585.9, + "valid_targets_min": 2890 + }, + { + "epoch": 3.7061288632792038, + "grad_norm": 0.5772907462842918, + "learning_rate": 2.144075922140472e-05, + "loss": 0.224, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08896462619304657, + "step": 7075, + "valid_targets_mean": 3349.1, + "valid_targets_min": 1598 + }, + { + "epoch": 3.7087480356207436, + "grad_norm": 0.5543791887751796, + "learning_rate": 2.1414702532860576e-05, + "loss": 0.2366, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09576257318258286, + "step": 7080, + "valid_targets_mean": 3761.4, + "valid_targets_min": 2267 + }, + { + "epoch": 3.711367207962284, + "grad_norm": 0.6546215629725258, + "learning_rate": 2.1388643430732396e-05, + "loss": 0.2152, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1018991619348526, + "step": 7085, + "valid_targets_mean": 2590.0, + "valid_targets_min": 1279 + }, + { + "epoch": 3.713986380303824, + "grad_norm": 0.6337142610145704, + "learning_rate": 2.1362581959478877e-05, + "loss": 0.2172, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11606380343437195, + "step": 7090, + "valid_targets_mean": 3247.0, + "valid_targets_min": 1730 + }, + { + "epoch": 3.716605552645364, + "grad_norm": 0.6550756025812633, + "learning_rate": 2.133651816356276e-05, + "loss": 0.2171, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11128291487693787, + "step": 7095, + "valid_targets_mean": 3144.8, + "valid_targets_min": 1664 + }, + { + "epoch": 3.719224724986904, + "grad_norm": 0.6749025831860757, + "learning_rate": 2.1310452087450755e-05, + "loss": 0.2175, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08359639346599579, + "step": 7100, + "valid_targets_mean": 3659.5, + "valid_targets_min": 1945 + }, + { + "epoch": 3.7218438973284442, + "grad_norm": 0.5907450396294541, + "learning_rate": 2.1284383775613456e-05, + "loss": 0.2306, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12242050468921661, + "step": 7105, + "valid_targets_mean": 4016.2, + "valid_targets_min": 2418 + }, + { + "epoch": 3.7244630696699845, + "grad_norm": 0.5766563890693965, + "learning_rate": 2.1258313272525277e-05, + "loss": 0.2248, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11721499264240265, + "step": 7110, + "valid_targets_mean": 4044.8, + "valid_targets_min": 2100 + }, + { + "epoch": 3.7270822420115244, + "grad_norm": 0.5765636261546505, + "learning_rate": 2.123224062266436e-05, + "loss": 0.2209, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1124374270439148, + "step": 7115, + "valid_targets_mean": 3743.8, + "valid_targets_min": 1365 + }, + { + "epoch": 3.7297014143530642, + "grad_norm": 0.554981450703291, + "learning_rate": 2.1206165870512522e-05, + "loss": 0.2239, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10184729099273682, + "step": 7120, + "valid_targets_mean": 4017.1, + "valid_targets_min": 1572 + }, + { + "epoch": 3.7323205866946045, + "grad_norm": 0.6135910413795018, + "learning_rate": 2.1180089060555162e-05, + "loss": 0.2292, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10245160758495331, + "step": 7125, + "valid_targets_mean": 3171.4, + "valid_targets_min": 876 + }, + { + "epoch": 3.734939759036145, + "grad_norm": 0.4202717422025161, + "learning_rate": 2.115401023728118e-05, + "loss": 0.1219, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.049300335347652435, + "step": 7130, + "valid_targets_mean": 2722.6, + "valid_targets_min": 458 + }, + { + "epoch": 3.7375589313776847, + "grad_norm": 0.42149866016405785, + "learning_rate": 2.112792944518293e-05, + "loss": 0.0921, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0460713729262352, + "step": 7135, + "valid_targets_mean": 3113.1, + "valid_targets_min": 2461 + }, + { + "epoch": 3.7401781037192245, + "grad_norm": 0.375211518708931, + "learning_rate": 2.1101846728756107e-05, + "loss": 0.0844, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04961033910512924, + "step": 7140, + "valid_targets_mean": 3648.1, + "valid_targets_min": 2068 + }, + { + "epoch": 3.742797276060765, + "grad_norm": 0.43357057509450503, + "learning_rate": 2.1075762132499702e-05, + "loss": 0.1057, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.049306970089673996, + "step": 7145, + "valid_targets_mean": 3423.6, + "valid_targets_min": 2425 + }, + { + "epoch": 3.745416448402305, + "grad_norm": 0.46401565751483315, + "learning_rate": 2.104967570091591e-05, + "loss": 0.085, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0431523360311985, + "step": 7150, + "valid_targets_mean": 2724.1, + "valid_targets_min": 1198 + }, + { + "epoch": 3.748035620743845, + "grad_norm": 0.7317628730767393, + "learning_rate": 2.1023587478510045e-05, + "loss": 0.1008, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07258038967847824, + "step": 7155, + "valid_targets_mean": 1232.5, + "valid_targets_min": 807 + }, + { + "epoch": 3.750654793085385, + "grad_norm": 0.4452913466256158, + "learning_rate": 2.0997497509790498e-05, + "loss": 0.1387, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05453608185052872, + "step": 7160, + "valid_targets_mean": 3487.4, + "valid_targets_min": 2351 + }, + { + "epoch": 3.753273965426925, + "grad_norm": 0.47561872194048394, + "learning_rate": 2.097140583926862e-05, + "loss": 0.0938, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07181800901889801, + "step": 7165, + "valid_targets_mean": 3126.4, + "valid_targets_min": 781 + }, + { + "epoch": 3.755893137768465, + "grad_norm": 0.34047866543595, + "learning_rate": 2.094531251145868e-05, + "loss": 0.1044, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.046262361109256744, + "step": 7170, + "valid_targets_mean": 3474.8, + "valid_targets_min": 799 + }, + { + "epoch": 3.7585123101100053, + "grad_norm": 0.3093023961260679, + "learning_rate": 2.0919217570877758e-05, + "loss": 0.1091, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04107516258955002, + "step": 7175, + "valid_targets_mean": 5026.1, + "valid_targets_min": 2802 + }, + { + "epoch": 3.761131482451545, + "grad_norm": 0.33879537081383754, + "learning_rate": 2.0893121062045708e-05, + "loss": 0.0827, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.032565630972385406, + "step": 7180, + "valid_targets_mean": 2611.0, + "valid_targets_min": 574 + }, + { + "epoch": 3.7637506547930855, + "grad_norm": 0.34388373179864956, + "learning_rate": 2.0867023029485032e-05, + "loss": 0.0901, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.042953215539455414, + "step": 7185, + "valid_targets_mean": 4036.5, + "valid_targets_min": 2642 + }, + { + "epoch": 3.7663698271346253, + "grad_norm": 0.5253315597352873, + "learning_rate": 2.0840923517720854e-05, + "loss": 0.0936, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06158360466361046, + "step": 7190, + "valid_targets_mean": 1960.5, + "valid_targets_min": 593 + }, + { + "epoch": 3.7689889994761656, + "grad_norm": 0.3903639599020791, + "learning_rate": 2.081482257128082e-05, + "loss": 0.1187, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03658132255077362, + "step": 7195, + "valid_targets_mean": 3354.2, + "valid_targets_min": 1353 + }, + { + "epoch": 3.7716081718177055, + "grad_norm": 0.4866331067485609, + "learning_rate": 2.078872023469501e-05, + "loss": 0.0865, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05128805711865425, + "step": 7200, + "valid_targets_mean": 2300.9, + "valid_targets_min": 818 + }, + { + "epoch": 3.7742273441592458, + "grad_norm": 0.3786582391494195, + "learning_rate": 2.076261655249588e-05, + "loss": 0.086, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.030418336391448975, + "step": 7205, + "valid_targets_mean": 2295.8, + "valid_targets_min": 934 + }, + { + "epoch": 3.7768465165007856, + "grad_norm": 0.34771139894436154, + "learning_rate": 2.0736511569218186e-05, + "loss": 0.0787, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04290395230054855, + "step": 7210, + "valid_targets_mean": 3524.4, + "valid_targets_min": 2798 + }, + { + "epoch": 3.779465688842326, + "grad_norm": 0.4755408422218981, + "learning_rate": 2.071040532939891e-05, + "loss": 0.099, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03995596989989281, + "step": 7215, + "valid_targets_mean": 2810.1, + "valid_targets_min": 471 + }, + { + "epoch": 3.7820848611838658, + "grad_norm": 0.4321925357201202, + "learning_rate": 2.0684297877577165e-05, + "loss": 0.1004, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06376747786998749, + "step": 7220, + "valid_targets_mean": 3042.8, + "valid_targets_min": 903 + }, + { + "epoch": 3.784704033525406, + "grad_norm": 0.4072510935049014, + "learning_rate": 2.0658189258294144e-05, + "loss": 0.0996, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04013584181666374, + "step": 7225, + "valid_targets_mean": 3081.6, + "valid_targets_min": 474 + }, + { + "epoch": 3.787323205866946, + "grad_norm": 0.3969728795752201, + "learning_rate": 2.0632079516093015e-05, + "loss": 0.0999, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04627121612429619, + "step": 7230, + "valid_targets_mean": 3468.0, + "valid_targets_min": 640 + }, + { + "epoch": 3.7899423782084862, + "grad_norm": 0.3400736743267032, + "learning_rate": 2.0605968695518873e-05, + "loss": 0.1339, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03258595988154411, + "step": 7235, + "valid_targets_mean": 3438.4, + "valid_targets_min": 902 + }, + { + "epoch": 3.792561550550026, + "grad_norm": 0.4024576266908952, + "learning_rate": 2.057985684111866e-05, + "loss": 0.0842, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.042630430310964584, + "step": 7240, + "valid_targets_mean": 3212.8, + "valid_targets_min": 1837 + }, + { + "epoch": 3.7951807228915664, + "grad_norm": 0.6884395421314213, + "learning_rate": 2.0553743997441066e-05, + "loss": 0.1157, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08674518764019012, + "step": 7245, + "valid_targets_mean": 1358.8, + "valid_targets_min": 756 + }, + { + "epoch": 3.7977998952331062, + "grad_norm": 0.5349913749235634, + "learning_rate": 2.0527630209036474e-05, + "loss": 0.1116, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08277156949043274, + "step": 7250, + "valid_targets_mean": 2896.2, + "valid_targets_min": 1072 + }, + { + "epoch": 3.8004190675746465, + "grad_norm": 0.38558069149318935, + "learning_rate": 2.0501515520456895e-05, + "loss": 0.0913, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.02911374717950821, + "step": 7255, + "valid_targets_mean": 2908.1, + "valid_targets_min": 895 + }, + { + "epoch": 3.8030382399161864, + "grad_norm": 0.5790567115299913, + "learning_rate": 2.047539997625584e-05, + "loss": 0.2065, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1842120736837387, + "step": 7260, + "valid_targets_mean": 2562.2, + "valid_targets_min": 878 + }, + { + "epoch": 3.8056574122577267, + "grad_norm": 0.4662391343390448, + "learning_rate": 2.0449283620988322e-05, + "loss": 0.1919, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04233997315168381, + "step": 7265, + "valid_targets_mean": 2087.6, + "valid_targets_min": 756 + }, + { + "epoch": 3.8082765845992665, + "grad_norm": 0.34993598136122933, + "learning_rate": 2.04231664992107e-05, + "loss": 0.1022, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.036809686571359634, + "step": 7270, + "valid_targets_mean": 3421.8, + "valid_targets_min": 2963 + }, + { + "epoch": 3.810895756940807, + "grad_norm": 0.7997591185983286, + "learning_rate": 2.039704865548067e-05, + "loss": 0.1721, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22461523115634918, + "step": 7275, + "valid_targets_mean": 2375.2, + "valid_targets_min": 1153 + }, + { + "epoch": 3.8135149292823467, + "grad_norm": 0.3025477416479924, + "learning_rate": 2.0370930134357142e-05, + "loss": 0.1111, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03618280589580536, + "step": 7280, + "valid_targets_mean": 4886.2, + "valid_targets_min": 1700 + }, + { + "epoch": 3.816134101623887, + "grad_norm": 0.3336682191169776, + "learning_rate": 2.0344810980400185e-05, + "loss": 0.0902, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.02956889010965824, + "step": 7285, + "valid_targets_mean": 3965.1, + "valid_targets_min": 789 + }, + { + "epoch": 3.818753273965427, + "grad_norm": 0.38169150485491554, + "learning_rate": 2.031869123817096e-05, + "loss": 0.0977, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.050395525991916656, + "step": 7290, + "valid_targets_mean": 3771.5, + "valid_targets_min": 995 + }, + { + "epoch": 3.821372446306967, + "grad_norm": 0.3567381546882948, + "learning_rate": 2.029257095223161e-05, + "loss": 0.087, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.030895696952939034, + "step": 7295, + "valid_targets_mean": 2220.8, + "valid_targets_min": 488 + }, + { + "epoch": 3.823991618648507, + "grad_norm": 0.45080057733047246, + "learning_rate": 2.026645016714522e-05, + "loss": 0.0887, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05217716470360756, + "step": 7300, + "valid_targets_mean": 3635.4, + "valid_targets_min": 2437 + }, + { + "epoch": 3.8266107909900473, + "grad_norm": 0.48102035649069846, + "learning_rate": 2.024032892747573e-05, + "loss": 0.0846, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03712937980890274, + "step": 7305, + "valid_targets_mean": 1752.1, + "valid_targets_min": 712 + }, + { + "epoch": 3.829229963331587, + "grad_norm": 0.39783111724258796, + "learning_rate": 2.021420727778784e-05, + "loss": 0.0868, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04353148490190506, + "step": 7310, + "valid_targets_mean": 3713.4, + "valid_targets_min": 2422 + }, + { + "epoch": 3.831849135673127, + "grad_norm": 0.3553079012266278, + "learning_rate": 2.018808526264697e-05, + "loss": 0.0761, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04106612503528595, + "step": 7315, + "valid_targets_mean": 3998.5, + "valid_targets_min": 3643 + }, + { + "epoch": 3.8344683080146673, + "grad_norm": 0.3244256257152452, + "learning_rate": 2.0161962926619144e-05, + "loss": 0.1311, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.030028818175196648, + "step": 7320, + "valid_targets_mean": 3319.0, + "valid_targets_min": 772 + }, + { + "epoch": 3.8370874803562076, + "grad_norm": 0.38063110072772477, + "learning_rate": 2.013584031427094e-05, + "loss": 0.0705, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.029718592762947083, + "step": 7325, + "valid_targets_mean": 2934.8, + "valid_targets_min": 722 + }, + { + "epoch": 3.8397066526977475, + "grad_norm": 0.31637284793444953, + "learning_rate": 2.010971747016941e-05, + "loss": 0.079, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.031116031110286713, + "step": 7330, + "valid_targets_mean": 3656.4, + "valid_targets_min": 2788 + }, + { + "epoch": 3.8423258250392873, + "grad_norm": 0.37898954142065566, + "learning_rate": 2.0083594438882006e-05, + "loss": 0.0805, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04169466719031334, + "step": 7335, + "valid_targets_mean": 3202.5, + "valid_targets_min": 948 + }, + { + "epoch": 3.8449449973808276, + "grad_norm": 0.5617243089869247, + "learning_rate": 2.0057471264976493e-05, + "loss": 0.0983, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04837562143802643, + "step": 7340, + "valid_targets_mean": 1002.0, + "valid_targets_min": 490 + }, + { + "epoch": 3.847564169722368, + "grad_norm": 0.34839600190461567, + "learning_rate": 2.0031347993020876e-05, + "loss": 0.1101, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04791203886270523, + "step": 7345, + "valid_targets_mean": 3751.9, + "valid_targets_min": 2800 + }, + { + "epoch": 3.8501833420639078, + "grad_norm": 0.4885743778972602, + "learning_rate": 2.0005224667583337e-05, + "loss": 0.1192, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07227519154548645, + "step": 7350, + "valid_targets_mean": 2641.8, + "valid_targets_min": 896 + }, + { + "epoch": 3.8528025144054476, + "grad_norm": 0.4448499530668694, + "learning_rate": 1.9979101333232136e-05, + "loss": 0.0949, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.052534934133291245, + "step": 7355, + "valid_targets_mean": 3199.0, + "valid_targets_min": 1333 + }, + { + "epoch": 3.855421686746988, + "grad_norm": 0.4615518720521214, + "learning_rate": 1.9952978034535556e-05, + "loss": 0.1093, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04913472756743431, + "step": 7360, + "valid_targets_mean": 2548.1, + "valid_targets_min": 693 + }, + { + "epoch": 3.8580408590885282, + "grad_norm": 0.4005004069162051, + "learning_rate": 1.9926854816061833e-05, + "loss": 0.1243, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03859833627939224, + "step": 7365, + "valid_targets_mean": 2482.9, + "valid_targets_min": 803 + }, + { + "epoch": 3.860660031430068, + "grad_norm": 0.4047788117435986, + "learning_rate": 1.990073172237904e-05, + "loss": 0.0931, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04876485466957092, + "step": 7370, + "valid_targets_mean": 3239.2, + "valid_targets_min": 2525 + }, + { + "epoch": 3.863279203771608, + "grad_norm": 0.5068732170981666, + "learning_rate": 1.9874608798055045e-05, + "loss": 0.1149, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04208771511912346, + "step": 7375, + "valid_targets_mean": 3806.1, + "valid_targets_min": 2393 + }, + { + "epoch": 3.8658983761131482, + "grad_norm": 0.3844447129019727, + "learning_rate": 1.9848486087657447e-05, + "loss": 0.0969, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.042661719024181366, + "step": 7380, + "valid_targets_mean": 2990.9, + "valid_targets_min": 804 + }, + { + "epoch": 3.8685175484546885, + "grad_norm": 0.3774126041995829, + "learning_rate": 1.982236363575345e-05, + "loss": 0.0899, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04523811489343643, + "step": 7385, + "valid_targets_mean": 4885.8, + "valid_targets_min": 3695 + }, + { + "epoch": 3.8711367207962284, + "grad_norm": 0.43172860492708126, + "learning_rate": 1.9796241486909836e-05, + "loss": 0.0805, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04847349226474762, + "step": 7390, + "valid_targets_mean": 3128.8, + "valid_targets_min": 596 + }, + { + "epoch": 3.8737558931377682, + "grad_norm": 0.2801146081181737, + "learning_rate": 1.9770119685692874e-05, + "loss": 0.0786, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03003329038619995, + "step": 7395, + "valid_targets_mean": 4567.8, + "valid_targets_min": 3804 + }, + { + "epoch": 3.8763750654793085, + "grad_norm": 0.35307733798335517, + "learning_rate": 1.974399827666822e-05, + "loss": 0.0861, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03416905924677849, + "step": 7400, + "valid_targets_mean": 3853.1, + "valid_targets_min": 2862 + }, + { + "epoch": 3.878994237820849, + "grad_norm": 0.5552958434920389, + "learning_rate": 1.971787730440087e-05, + "loss": 0.1055, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06091686338186264, + "step": 7405, + "valid_targets_mean": 1072.6, + "valid_targets_min": 497 + }, + { + "epoch": 3.8816134101623887, + "grad_norm": 0.3890583830957186, + "learning_rate": 1.9691756813455084e-05, + "loss": 0.0897, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05139869451522827, + "step": 7410, + "valid_targets_mean": 4191.0, + "valid_targets_min": 3918 + }, + { + "epoch": 3.8842325825039286, + "grad_norm": 0.5350479091654851, + "learning_rate": 1.9665636848394297e-05, + "loss": 0.101, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.045283541083335876, + "step": 7415, + "valid_targets_mean": 2121.9, + "valid_targets_min": 785 + }, + { + "epoch": 3.886851754845469, + "grad_norm": 0.33836036040841005, + "learning_rate": 1.9639517453781032e-05, + "loss": 0.0734, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.036470964550971985, + "step": 7420, + "valid_targets_mean": 3451.6, + "valid_targets_min": 905 + }, + { + "epoch": 3.889470927187009, + "grad_norm": 0.4235972082823505, + "learning_rate": 1.961339867417687e-05, + "loss": 0.0953, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06840990483760834, + "step": 7425, + "valid_targets_mean": 2929.2, + "valid_targets_min": 657 + }, + { + "epoch": 3.892090099528549, + "grad_norm": 0.4199428163888667, + "learning_rate": 1.9587280554142307e-05, + "loss": 0.0887, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04536977410316467, + "step": 7430, + "valid_targets_mean": 3798.9, + "valid_targets_min": 3184 + }, + { + "epoch": 3.894709271870089, + "grad_norm": 0.49563760382145616, + "learning_rate": 1.9561163138236723e-05, + "loss": 0.079, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04851203039288521, + "step": 7435, + "valid_targets_mean": 1463.9, + "valid_targets_min": 627 + }, + { + "epoch": 3.897328444211629, + "grad_norm": 0.46140585434038806, + "learning_rate": 1.9535046471018326e-05, + "loss": 0.0888, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04280813783407211, + "step": 7440, + "valid_targets_mean": 1701.5, + "valid_targets_min": 827 + }, + { + "epoch": 3.8999476165531695, + "grad_norm": 0.4696922128308981, + "learning_rate": 1.9508930597044e-05, + "loss": 0.0917, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04109931364655495, + "step": 7445, + "valid_targets_mean": 1789.9, + "valid_targets_min": 940 + }, + { + "epoch": 3.9025667888947093, + "grad_norm": 0.4046158647857266, + "learning_rate": 1.9482815560869327e-05, + "loss": 0.1068, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.039725400507450104, + "step": 7450, + "valid_targets_mean": 2943.8, + "valid_targets_min": 958 + }, + { + "epoch": 3.905185961236249, + "grad_norm": 0.44635335729054926, + "learning_rate": 1.9456701407048414e-05, + "loss": 0.0879, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03700082004070282, + "step": 7455, + "valid_targets_mean": 1859.2, + "valid_targets_min": 719 + }, + { + "epoch": 3.9078051335777895, + "grad_norm": 0.48368109190536873, + "learning_rate": 1.943058818013388e-05, + "loss": 0.1076, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.034503936767578125, + "step": 7460, + "valid_targets_mean": 1703.9, + "valid_targets_min": 759 + }, + { + "epoch": 3.9104243059193298, + "grad_norm": 0.749090481722063, + "learning_rate": 1.9404475924676777e-05, + "loss": 0.1094, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11215709894895554, + "step": 7465, + "valid_targets_mean": 1556.6, + "valid_targets_min": 521 + }, + { + "epoch": 3.9130434782608696, + "grad_norm": 0.43379214835409946, + "learning_rate": 1.9378364685226468e-05, + "loss": 0.0894, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05452614277601242, + "step": 7470, + "valid_targets_mean": 3267.6, + "valid_targets_min": 1032 + }, + { + "epoch": 3.9156626506024095, + "grad_norm": 0.30781486338337427, + "learning_rate": 1.9352254506330626e-05, + "loss": 0.0755, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03051396831870079, + "step": 7475, + "valid_targets_mean": 3609.0, + "valid_targets_min": 2741 + }, + { + "epoch": 3.9182818229439498, + "grad_norm": 0.409820699570783, + "learning_rate": 1.932614543253506e-05, + "loss": 0.0868, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.036954060196876526, + "step": 7480, + "valid_targets_mean": 2735.8, + "valid_targets_min": 1692 + }, + { + "epoch": 3.9209009952854896, + "grad_norm": 0.3983827381797914, + "learning_rate": 1.9300037508383753e-05, + "loss": 0.1165, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04921487346291542, + "step": 7485, + "valid_targets_mean": 3693.4, + "valid_targets_min": 2215 + }, + { + "epoch": 3.92352016762703, + "grad_norm": 0.34887223837531534, + "learning_rate": 1.9273930778418685e-05, + "loss": 0.0726, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03230620175600052, + "step": 7490, + "valid_targets_mean": 3109.9, + "valid_targets_min": 723 + }, + { + "epoch": 3.92613933996857, + "grad_norm": 0.3142371236980945, + "learning_rate": 1.9247825287179796e-05, + "loss": 0.0883, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03691818192601204, + "step": 7495, + "valid_targets_mean": 4984.2, + "valid_targets_min": 3282 + }, + { + "epoch": 3.92875851231011, + "grad_norm": 0.29035038233260285, + "learning_rate": 1.922172107920495e-05, + "loss": 0.0836, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.035114917904138565, + "step": 7500, + "valid_targets_mean": 3863.4, + "valid_targets_min": 995 + }, + { + "epoch": 3.93137768465165, + "grad_norm": 0.2625531451388003, + "learning_rate": 1.9195618199029783e-05, + "loss": 0.0714, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.033638183027505875, + "step": 7505, + "valid_targets_mean": 4201.0, + "valid_targets_min": 949 + }, + { + "epoch": 3.9339968569931902, + "grad_norm": 0.4064411831354708, + "learning_rate": 1.916951669118769e-05, + "loss": 0.0934, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.058708321303129196, + "step": 7510, + "valid_targets_mean": 4321.6, + "valid_targets_min": 2724 + }, + { + "epoch": 3.93661602933473, + "grad_norm": 0.305752485102919, + "learning_rate": 1.9143416600209716e-05, + "loss": 0.0777, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.02644570730626583, + "step": 7515, + "valid_targets_mean": 3384.5, + "valid_targets_min": 424 + }, + { + "epoch": 3.9392352016762704, + "grad_norm": 0.38059536630926644, + "learning_rate": 1.9117317970624484e-05, + "loss": 0.1106, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0355902835726738, + "step": 7520, + "valid_targets_mean": 2987.2, + "valid_targets_min": 531 + }, + { + "epoch": 3.9418543740178102, + "grad_norm": 0.3175284385746139, + "learning_rate": 1.9091220846958133e-05, + "loss": 0.1078, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03525662422180176, + "step": 7525, + "valid_targets_mean": 3469.5, + "valid_targets_min": 1195 + }, + { + "epoch": 3.9444735463593505, + "grad_norm": 0.36278027512058986, + "learning_rate": 1.9065125273734228e-05, + "loss": 0.0737, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06611423939466476, + "step": 7530, + "valid_targets_mean": 2682.8, + "valid_targets_min": 722 + }, + { + "epoch": 3.9470927187008904, + "grad_norm": 0.36773275928544025, + "learning_rate": 1.903903129547369e-05, + "loss": 0.1036, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.037536874413490295, + "step": 7535, + "valid_targets_mean": 3496.9, + "valid_targets_min": 1251 + }, + { + "epoch": 3.9497118910424307, + "grad_norm": 0.4047648503696616, + "learning_rate": 1.9012938956694714e-05, + "loss": 0.0834, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04590514674782753, + "step": 7540, + "valid_targets_mean": 2912.5, + "valid_targets_min": 970 + }, + { + "epoch": 3.9523310633839706, + "grad_norm": 0.5394327284039387, + "learning_rate": 1.8986848301912707e-05, + "loss": 0.0954, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04667893052101135, + "step": 7545, + "valid_targets_mean": 1423.6, + "valid_targets_min": 634 + }, + { + "epoch": 3.954950235725511, + "grad_norm": 0.5774321003985943, + "learning_rate": 1.8960759375640204e-05, + "loss": 0.109, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07255034148693085, + "step": 7550, + "valid_targets_mean": 1423.9, + "valid_targets_min": 685 + }, + { + "epoch": 3.9575694080670507, + "grad_norm": 0.3963183109928674, + "learning_rate": 1.8934672222386762e-05, + "loss": 0.1191, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03373725712299347, + "step": 7555, + "valid_targets_mean": 2932.5, + "valid_targets_min": 593 + }, + { + "epoch": 3.960188580408591, + "grad_norm": 0.3216521588594565, + "learning_rate": 1.8908586886658967e-05, + "loss": 0.0908, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.033638566732406616, + "step": 7560, + "valid_targets_mean": 3945.8, + "valid_targets_min": 3129 + }, + { + "epoch": 3.962807752750131, + "grad_norm": 0.4168944532648461, + "learning_rate": 1.8882503412960247e-05, + "loss": 0.0939, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05136759579181671, + "step": 7565, + "valid_targets_mean": 3621.1, + "valid_targets_min": 859 + }, + { + "epoch": 3.965426925091671, + "grad_norm": 0.4678632826293506, + "learning_rate": 1.88564218457909e-05, + "loss": 0.0846, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04501301422715187, + "step": 7570, + "valid_targets_mean": 2553.0, + "valid_targets_min": 616 + }, + { + "epoch": 3.968046097433211, + "grad_norm": 0.3954471615047967, + "learning_rate": 1.8830342229647945e-05, + "loss": 0.0826, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03754996508359909, + "step": 7575, + "valid_targets_mean": 2690.5, + "valid_targets_min": 541 + }, + { + "epoch": 3.9706652697747513, + "grad_norm": 0.7106174824045168, + "learning_rate": 1.880426460902507e-05, + "loss": 0.0806, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05315547436475754, + "step": 7580, + "valid_targets_mean": 906.4, + "valid_targets_min": 598 + }, + { + "epoch": 3.973284442116291, + "grad_norm": 0.4165032943697711, + "learning_rate": 1.8778189028412574e-05, + "loss": 0.0972, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04184139892458916, + "step": 7585, + "valid_targets_mean": 3147.2, + "valid_targets_min": 1101 + }, + { + "epoch": 3.9759036144578315, + "grad_norm": 0.4802834714852666, + "learning_rate": 1.8752115532297263e-05, + "loss": 0.0789, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03538201004266739, + "step": 7590, + "valid_targets_mean": 2331.8, + "valid_targets_min": 680 + }, + { + "epoch": 3.9785227867993713, + "grad_norm": 0.393894429443511, + "learning_rate": 1.8726044165162406e-05, + "loss": 0.0813, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04353872686624527, + "step": 7595, + "valid_targets_mean": 2577.0, + "valid_targets_min": 774 + }, + { + "epoch": 3.9811419591409116, + "grad_norm": 0.38984281411916594, + "learning_rate": 1.869997497148761e-05, + "loss": 0.0952, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.050356339663267136, + "step": 7600, + "valid_targets_mean": 4140.1, + "valid_targets_min": 1474 + }, + { + "epoch": 3.9837611314824515, + "grad_norm": 0.2384552263579987, + "learning_rate": 1.8673907995748802e-05, + "loss": 0.0743, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.02689472585916519, + "step": 7605, + "valid_targets_mean": 5498.9, + "valid_targets_min": 3677 + }, + { + "epoch": 3.9863803038239918, + "grad_norm": 0.38140640854743973, + "learning_rate": 1.8647843282418114e-05, + "loss": 0.082, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04897107183933258, + "step": 7610, + "valid_targets_mean": 3352.5, + "valid_targets_min": 675 + }, + { + "epoch": 3.9889994761655316, + "grad_norm": 0.354715669859789, + "learning_rate": 1.86217808759638e-05, + "loss": 0.0788, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03356082737445831, + "step": 7615, + "valid_targets_mean": 3902.5, + "valid_targets_min": 795 + }, + { + "epoch": 3.991618648507072, + "grad_norm": 0.5360196420481077, + "learning_rate": 1.8595720820850214e-05, + "loss": 0.1827, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08176171779632568, + "step": 7620, + "valid_targets_mean": 2495.0, + "valid_targets_min": 605 + }, + { + "epoch": 3.994237820848612, + "grad_norm": 0.3272683951673967, + "learning_rate": 1.8569663161537665e-05, + "loss": 0.0778, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.039716288447380066, + "step": 7625, + "valid_targets_mean": 3298.6, + "valid_targets_min": 985 + }, + { + "epoch": 3.9968569931901516, + "grad_norm": 0.4054114117257748, + "learning_rate": 1.854360794248241e-05, + "loss": 0.0915, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04544153809547424, + "step": 7630, + "valid_targets_mean": 3505.2, + "valid_targets_min": 878 + }, + { + "epoch": 3.999476165531692, + "grad_norm": 0.574865559161945, + "learning_rate": 1.8517555208136508e-05, + "loss": 0.1113, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12018486857414246, + "step": 7635, + "valid_targets_mean": 2289.5, + "valid_targets_min": 1214 + }, + { + "epoch": 4.002095337873232, + "grad_norm": 0.8147505408907869, + "learning_rate": 1.8491505002947784e-05, + "loss": 0.1637, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07107695192098618, + "step": 7640, + "valid_targets_mean": 1391.0, + "valid_targets_min": 722 + }, + { + "epoch": 4.0047145102147725, + "grad_norm": 0.7834448703599444, + "learning_rate": 1.846545737135978e-05, + "loss": 0.1604, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0666496679186821, + "step": 7645, + "valid_targets_mean": 1389.0, + "valid_targets_min": 725 + }, + { + "epoch": 4.007333682556312, + "grad_norm": 0.7176476370684532, + "learning_rate": 1.8439412357811607e-05, + "loss": 0.1542, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07671309262514114, + "step": 7650, + "valid_targets_mean": 1432.1, + "valid_targets_min": 933 + }, + { + "epoch": 4.009952854897852, + "grad_norm": 0.7138731947033008, + "learning_rate": 1.8413370006737934e-05, + "loss": 0.1506, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07407839596271515, + "step": 7655, + "valid_targets_mean": 1396.4, + "valid_targets_min": 615 + }, + { + "epoch": 4.0125720272393925, + "grad_norm": 0.7590080786379892, + "learning_rate": 1.838733036256888e-05, + "loss": 0.1538, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07466895878314972, + "step": 7660, + "valid_targets_mean": 1552.1, + "valid_targets_min": 715 + }, + { + "epoch": 4.015191199580933, + "grad_norm": 0.832969840506494, + "learning_rate": 1.836129346972995e-05, + "loss": 0.1577, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11136734485626221, + "step": 7665, + "valid_targets_mean": 1899.1, + "valid_targets_min": 1090 + }, + { + "epoch": 4.017810371922472, + "grad_norm": 0.7439198656657051, + "learning_rate": 1.8335259372641945e-05, + "loss": 0.146, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06305424869060516, + "step": 7670, + "valid_targets_mean": 1217.5, + "valid_targets_min": 761 + }, + { + "epoch": 4.0204295442640126, + "grad_norm": 0.6686768105488541, + "learning_rate": 1.8309228115720907e-05, + "loss": 0.1609, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06820094585418701, + "step": 7675, + "valid_targets_mean": 1600.6, + "valid_targets_min": 1182 + }, + { + "epoch": 4.023048716605553, + "grad_norm": 0.7986341260316357, + "learning_rate": 1.8283199743378028e-05, + "loss": 0.1496, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07157409191131592, + "step": 7680, + "valid_targets_mean": 1476.8, + "valid_targets_min": 733 + }, + { + "epoch": 4.025667888947093, + "grad_norm": 0.7368932947097813, + "learning_rate": 1.8257174300019565e-05, + "loss": 0.156, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06354066729545593, + "step": 7685, + "valid_targets_mean": 1622.1, + "valid_targets_min": 964 + }, + { + "epoch": 4.028287061288633, + "grad_norm": 0.7356153462819714, + "learning_rate": 1.8231151830046818e-05, + "loss": 0.1427, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08492037653923035, + "step": 7690, + "valid_targets_mean": 1614.6, + "valid_targets_min": 1046 + }, + { + "epoch": 4.030906233630173, + "grad_norm": 0.7331956418545665, + "learning_rate": 1.8205132377855974e-05, + "loss": 0.1558, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08211348950862885, + "step": 7695, + "valid_targets_mean": 1828.8, + "valid_targets_min": 1434 + }, + { + "epoch": 4.033525405971713, + "grad_norm": 0.742440518015762, + "learning_rate": 1.8179115987838078e-05, + "loss": 0.143, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06464903056621552, + "step": 7700, + "valid_targets_mean": 1226.8, + "valid_targets_min": 570 + }, + { + "epoch": 4.036144578313253, + "grad_norm": 0.8092304133955073, + "learning_rate": 1.8153102704378975e-05, + "loss": 0.1421, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05798610299825668, + "step": 7705, + "valid_targets_mean": 1114.1, + "valid_targets_min": 548 + }, + { + "epoch": 4.038763750654793, + "grad_norm": 0.7007036076832147, + "learning_rate": 1.8127092571859173e-05, + "loss": 0.136, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05507735162973404, + "step": 7710, + "valid_targets_mean": 1238.2, + "valid_targets_min": 682 + }, + { + "epoch": 4.041382922996333, + "grad_norm": 0.7570528581637733, + "learning_rate": 1.8101085634653846e-05, + "loss": 0.148, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05682568997144699, + "step": 7715, + "valid_targets_mean": 1509.5, + "valid_targets_min": 968 + }, + { + "epoch": 4.0440020953378735, + "grad_norm": 0.7655927174644584, + "learning_rate": 1.8075081937132676e-05, + "loss": 0.1525, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07743413746356964, + "step": 7720, + "valid_targets_mean": 1428.2, + "valid_targets_min": 597 + }, + { + "epoch": 4.046621267679413, + "grad_norm": 0.7328719613273594, + "learning_rate": 1.8049081523659855e-05, + "loss": 0.1548, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07145942747592926, + "step": 7725, + "valid_targets_mean": 1484.6, + "valid_targets_min": 772 + }, + { + "epoch": 4.049240440020953, + "grad_norm": 0.722312852380765, + "learning_rate": 1.8023084438593945e-05, + "loss": 0.1473, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05349155515432358, + "step": 7730, + "valid_targets_mean": 1381.1, + "valid_targets_min": 978 + }, + { + "epoch": 4.0518596123624935, + "grad_norm": 0.6831881102657719, + "learning_rate": 1.7997090726287828e-05, + "loss": 0.1433, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05978317931294441, + "step": 7735, + "valid_targets_mean": 1295.9, + "valid_targets_min": 785 + }, + { + "epoch": 4.054478784704034, + "grad_norm": 0.7914198620249139, + "learning_rate": 1.797110043108866e-05, + "loss": 0.1497, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05559869110584259, + "step": 7740, + "valid_targets_mean": 1203.9, + "valid_targets_min": 617 + }, + { + "epoch": 4.057097957045573, + "grad_norm": 0.8442139413690831, + "learning_rate": 1.794511359733774e-05, + "loss": 0.1522, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06827697902917862, + "step": 7745, + "valid_targets_mean": 1205.5, + "valid_targets_min": 711 + }, + { + "epoch": 4.0597171293871135, + "grad_norm": 0.7380528812620671, + "learning_rate": 1.791913026937048e-05, + "loss": 0.1439, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07087908685207367, + "step": 7750, + "valid_targets_mean": 1532.2, + "valid_targets_min": 1190 + }, + { + "epoch": 4.062336301728654, + "grad_norm": 0.7754559109397527, + "learning_rate": 1.789315049151629e-05, + "loss": 0.141, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07318627834320068, + "step": 7755, + "valid_targets_mean": 1501.0, + "valid_targets_min": 774 + }, + { + "epoch": 4.064955474070194, + "grad_norm": 0.6970757617812192, + "learning_rate": 1.7867174308098537e-05, + "loss": 0.1424, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08933094888925552, + "step": 7760, + "valid_targets_mean": 2143.0, + "valid_targets_min": 1057 + }, + { + "epoch": 4.0675746464117335, + "grad_norm": 0.8299370161831886, + "learning_rate": 1.7841201763434465e-05, + "loss": 0.143, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06878514587879181, + "step": 7765, + "valid_targets_mean": 1453.0, + "valid_targets_min": 1004 + }, + { + "epoch": 4.070193818753274, + "grad_norm": 0.7525883738507897, + "learning_rate": 1.781523290183508e-05, + "loss": 0.1465, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07721415162086487, + "step": 7770, + "valid_targets_mean": 1736.9, + "valid_targets_min": 803 + }, + { + "epoch": 4.072812991094814, + "grad_norm": 0.6769824810891483, + "learning_rate": 1.7789267767605145e-05, + "loss": 0.1526, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06848867982625961, + "step": 7775, + "valid_targets_mean": 1477.9, + "valid_targets_min": 830 + }, + { + "epoch": 4.075432163436354, + "grad_norm": 0.7061942178506194, + "learning_rate": 1.7763306405043027e-05, + "loss": 0.1415, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.062424588948488235, + "step": 7780, + "valid_targets_mean": 1463.9, + "valid_targets_min": 646 + }, + { + "epoch": 4.078051335777894, + "grad_norm": 0.7614928786964195, + "learning_rate": 1.773734885844068e-05, + "loss": 0.1496, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07690142095088959, + "step": 7785, + "valid_targets_mean": 1431.2, + "valid_targets_min": 591 + }, + { + "epoch": 4.080670508119434, + "grad_norm": 0.7726308989574523, + "learning_rate": 1.7711395172083546e-05, + "loss": 0.1514, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09195318818092346, + "step": 7790, + "valid_targets_mean": 1579.6, + "valid_targets_min": 796 + }, + { + "epoch": 4.083289680460974, + "grad_norm": 0.7709271587907439, + "learning_rate": 1.768544539025046e-05, + "loss": 0.1432, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07206501066684723, + "step": 7795, + "valid_targets_mean": 1642.8, + "valid_targets_min": 903 + }, + { + "epoch": 4.085908852802515, + "grad_norm": 0.7563531244723153, + "learning_rate": 1.7659499557213624e-05, + "loss": 0.1408, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07513036578893661, + "step": 7800, + "valid_targets_mean": 1417.9, + "valid_targets_min": 665 + }, + { + "epoch": 4.088528025144054, + "grad_norm": 0.7261910183527875, + "learning_rate": 1.763355771723849e-05, + "loss": 0.14, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06454315036535263, + "step": 7805, + "valid_targets_mean": 1389.1, + "valid_targets_min": 652 + }, + { + "epoch": 4.091147197485594, + "grad_norm": 0.8458040723209423, + "learning_rate": 1.76076199145837e-05, + "loss": 0.141, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.058387018740177155, + "step": 7810, + "valid_targets_mean": 1289.8, + "valid_targets_min": 662 + }, + { + "epoch": 4.093766369827135, + "grad_norm": 0.7930638210354205, + "learning_rate": 1.7581686193500997e-05, + "loss": 0.1435, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06643882393836975, + "step": 7815, + "valid_targets_mean": 1264.9, + "valid_targets_min": 770 + }, + { + "epoch": 4.096385542168675, + "grad_norm": 0.8133522359187357, + "learning_rate": 1.7555756598235178e-05, + "loss": 0.1398, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08015811443328857, + "step": 7820, + "valid_targets_mean": 1399.9, + "valid_targets_min": 966 + }, + { + "epoch": 4.099004714510214, + "grad_norm": 0.7293726199024233, + "learning_rate": 1.7529831173023994e-05, + "loss": 0.1427, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06379858404397964, + "step": 7825, + "valid_targets_mean": 1443.0, + "valid_targets_min": 773 + }, + { + "epoch": 4.101623886851755, + "grad_norm": 0.7568027073881571, + "learning_rate": 1.7503909962098075e-05, + "loss": 0.1413, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06921360641717911, + "step": 7830, + "valid_targets_mean": 1566.1, + "valid_targets_min": 940 + }, + { + "epoch": 4.104243059193295, + "grad_norm": 0.805512965299132, + "learning_rate": 1.7477993009680874e-05, + "loss": 0.1459, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05086955055594444, + "step": 7835, + "valid_targets_mean": 1089.4, + "valid_targets_min": 801 + }, + { + "epoch": 4.106862231534835, + "grad_norm": 0.7092495943845473, + "learning_rate": 1.745208035998857e-05, + "loss": 0.1381, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08520159125328064, + "step": 7840, + "valid_targets_mean": 1911.8, + "valid_targets_min": 634 + }, + { + "epoch": 4.109481403876375, + "grad_norm": 0.7503348918284387, + "learning_rate": 1.7426172057229987e-05, + "loss": 0.1511, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09396681934595108, + "step": 7845, + "valid_targets_mean": 1958.2, + "valid_targets_min": 919 + }, + { + "epoch": 4.112100576217915, + "grad_norm": 0.705556169148339, + "learning_rate": 1.7400268145606576e-05, + "loss": 0.1431, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08061669766902924, + "step": 7850, + "valid_targets_mean": 1991.5, + "valid_targets_min": 1102 + }, + { + "epoch": 4.114719748559455, + "grad_norm": 0.7455599835269692, + "learning_rate": 1.7374368669312245e-05, + "loss": 0.1481, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05526871606707573, + "step": 7855, + "valid_targets_mean": 1266.5, + "valid_targets_min": 841 + }, + { + "epoch": 4.117338920900996, + "grad_norm": 0.7808324338281639, + "learning_rate": 1.7348473672533377e-05, + "loss": 0.1382, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05895335227251053, + "step": 7860, + "valid_targets_mean": 1280.8, + "valid_targets_min": 956 + }, + { + "epoch": 4.119958093242535, + "grad_norm": 0.8609518643491395, + "learning_rate": 1.732258319944868e-05, + "loss": 0.1439, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06586974114179611, + "step": 7865, + "valid_targets_mean": 1224.2, + "valid_targets_min": 857 + }, + { + "epoch": 4.122577265584075, + "grad_norm": 0.7522490704276529, + "learning_rate": 1.729669729422917e-05, + "loss": 0.1456, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07322436571121216, + "step": 7870, + "valid_targets_mean": 1312.2, + "valid_targets_min": 808 + }, + { + "epoch": 4.125196437925616, + "grad_norm": 0.7868336422863321, + "learning_rate": 1.727081600103806e-05, + "loss": 0.1342, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06527800858020782, + "step": 7875, + "valid_targets_mean": 1253.1, + "valid_targets_min": 817 + }, + { + "epoch": 4.127815610267156, + "grad_norm": 0.7608696113993708, + "learning_rate": 1.7244939364030676e-05, + "loss": 0.1365, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.057997383177280426, + "step": 7880, + "valid_targets_mean": 1261.5, + "valid_targets_min": 727 + }, + { + "epoch": 4.130434782608695, + "grad_norm": 0.746396394408531, + "learning_rate": 1.7219067427354436e-05, + "loss": 0.1426, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0750526711344719, + "step": 7885, + "valid_targets_mean": 1557.1, + "valid_targets_min": 907 + }, + { + "epoch": 4.133053954950236, + "grad_norm": 0.7734343498112959, + "learning_rate": 1.7193200235148706e-05, + "loss": 0.1436, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0678153932094574, + "step": 7890, + "valid_targets_mean": 1369.2, + "valid_targets_min": 669 + }, + { + "epoch": 4.135673127291776, + "grad_norm": 0.688620854608366, + "learning_rate": 1.716733783154479e-05, + "loss": 0.1434, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07749447226524353, + "step": 7895, + "valid_targets_mean": 1794.9, + "valid_targets_min": 750 + }, + { + "epoch": 4.138292299633316, + "grad_norm": 0.7462520237842121, + "learning_rate": 1.7141480260665794e-05, + "loss": 0.1382, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06762084364891052, + "step": 7900, + "valid_targets_mean": 1542.2, + "valid_targets_min": 736 + }, + { + "epoch": 4.140911471974856, + "grad_norm": 0.7705392056294689, + "learning_rate": 1.711562756662658e-05, + "loss": 0.1449, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08405694365501404, + "step": 7905, + "valid_targets_mean": 1618.6, + "valid_targets_min": 694 + }, + { + "epoch": 4.143530644316396, + "grad_norm": 0.7401935877883663, + "learning_rate": 1.7089779793533716e-05, + "loss": 0.1409, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08615291118621826, + "step": 7910, + "valid_targets_mean": 1725.2, + "valid_targets_min": 806 + }, + { + "epoch": 4.146149816657936, + "grad_norm": 0.8661918661157276, + "learning_rate": 1.706393698548534e-05, + "loss": 0.1437, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06610341370105743, + "step": 7915, + "valid_targets_mean": 1304.5, + "valid_targets_min": 809 + }, + { + "epoch": 4.1487689889994765, + "grad_norm": 0.724989948253216, + "learning_rate": 1.703809918657116e-05, + "loss": 0.1404, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04395994916558266, + "step": 7920, + "valid_targets_mean": 1106.8, + "valid_targets_min": 698 + }, + { + "epoch": 4.151388161341016, + "grad_norm": 0.7846331292623914, + "learning_rate": 1.7012266440872294e-05, + "loss": 0.1322, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0646669939160347, + "step": 7925, + "valid_targets_mean": 1276.2, + "valid_targets_min": 750 + }, + { + "epoch": 4.154007333682556, + "grad_norm": 0.822275111676299, + "learning_rate": 1.6986438792461272e-05, + "loss": 0.143, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09048368781805038, + "step": 7930, + "valid_targets_mean": 1869.1, + "valid_targets_min": 1003 + }, + { + "epoch": 4.156626506024097, + "grad_norm": 0.7688287932415243, + "learning_rate": 1.696061628540191e-05, + "loss": 0.1454, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0764274001121521, + "step": 7935, + "valid_targets_mean": 1735.8, + "valid_targets_min": 907 + }, + { + "epoch": 4.159245678365637, + "grad_norm": 0.7603343008442301, + "learning_rate": 1.6934798963749256e-05, + "loss": 0.1375, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0774686336517334, + "step": 7940, + "valid_targets_mean": 1505.4, + "valid_targets_min": 1160 + }, + { + "epoch": 4.161864850707176, + "grad_norm": 0.7324817066259853, + "learning_rate": 1.6908986871549525e-05, + "loss": 0.1445, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07530603557825089, + "step": 7945, + "valid_targets_mean": 1562.1, + "valid_targets_min": 1119 + }, + { + "epoch": 4.164484023048717, + "grad_norm": 0.7355857744107196, + "learning_rate": 1.6883180052839975e-05, + "loss": 0.1443, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08236520737409592, + "step": 7950, + "valid_targets_mean": 1615.5, + "valid_targets_min": 700 + }, + { + "epoch": 4.167103195390257, + "grad_norm": 0.7494770260259638, + "learning_rate": 1.6857378551648918e-05, + "loss": 0.141, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.055171504616737366, + "step": 7955, + "valid_targets_mean": 1330.6, + "valid_targets_min": 859 + }, + { + "epoch": 4.169722367731797, + "grad_norm": 0.8679246068657159, + "learning_rate": 1.6831582411995556e-05, + "loss": 0.1459, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06985874474048615, + "step": 7960, + "valid_targets_mean": 1289.4, + "valid_targets_min": 635 + }, + { + "epoch": 4.172341540073337, + "grad_norm": 0.8015833114321246, + "learning_rate": 1.680579167788994e-05, + "loss": 0.1371, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08213045448064804, + "step": 7965, + "valid_targets_mean": 1576.4, + "valid_targets_min": 673 + }, + { + "epoch": 4.174960712414877, + "grad_norm": 0.8100547386034976, + "learning_rate": 1.6780006393332934e-05, + "loss": 0.1468, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08223119378089905, + "step": 7970, + "valid_targets_mean": 1317.2, + "valid_targets_min": 851 + }, + { + "epoch": 4.177579884756417, + "grad_norm": 0.8021779391612973, + "learning_rate": 1.675422660231607e-05, + "loss": 0.1365, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0749107152223587, + "step": 7975, + "valid_targets_mean": 1581.0, + "valid_targets_min": 870 + }, + { + "epoch": 4.1801990570979575, + "grad_norm": 0.7954715334575904, + "learning_rate": 1.672845234882153e-05, + "loss": 0.1545, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10032214224338531, + "step": 7980, + "valid_targets_mean": 1962.4, + "valid_targets_min": 1156 + }, + { + "epoch": 4.182818229439497, + "grad_norm": 0.7187552218621887, + "learning_rate": 1.6702683676822028e-05, + "loss": 0.1404, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.054006561636924744, + "step": 7985, + "valid_targets_mean": 1244.0, + "valid_targets_min": 657 + }, + { + "epoch": 4.185437401781037, + "grad_norm": 0.7287158136368013, + "learning_rate": 1.6676920630280785e-05, + "loss": 0.144, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07185535877943039, + "step": 7990, + "valid_targets_mean": 1536.6, + "valid_targets_min": 672 + }, + { + "epoch": 4.1880565741225775, + "grad_norm": 0.7539873725776786, + "learning_rate": 1.66511632531514e-05, + "loss": 0.1401, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08302894979715347, + "step": 7995, + "valid_targets_mean": 1686.9, + "valid_targets_min": 1019 + }, + { + "epoch": 4.190675746464118, + "grad_norm": 0.8157626078261773, + "learning_rate": 1.6625411589377795e-05, + "loss": 0.1364, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06138870120048523, + "step": 8000, + "valid_targets_mean": 1172.5, + "valid_targets_min": 732 + }, + { + "epoch": 4.193294918805657, + "grad_norm": 0.8008925323806418, + "learning_rate": 1.659966568289417e-05, + "loss": 0.1448, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05657664313912392, + "step": 8005, + "valid_targets_mean": 1255.4, + "valid_targets_min": 634 + }, + { + "epoch": 4.1959140911471975, + "grad_norm": 0.7236013504321113, + "learning_rate": 1.6573925577624885e-05, + "loss": 0.1345, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07120637595653534, + "step": 8010, + "valid_targets_mean": 1793.1, + "valid_targets_min": 905 + }, + { + "epoch": 4.198533263488738, + "grad_norm": 0.7366915314972589, + "learning_rate": 1.6548191317484405e-05, + "loss": 0.1337, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08546614646911621, + "step": 8015, + "valid_targets_mean": 1636.1, + "valid_targets_min": 596 + }, + { + "epoch": 4.201152435830277, + "grad_norm": 0.7310244741400327, + "learning_rate": 1.6522462946377233e-05, + "loss": 0.1335, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06330102682113647, + "step": 8020, + "valid_targets_mean": 1320.8, + "valid_targets_min": 687 + }, + { + "epoch": 4.2037716081718175, + "grad_norm": 0.7555194632894897, + "learning_rate": 1.6496740508197797e-05, + "loss": 0.1477, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06768176704645157, + "step": 8025, + "valid_targets_mean": 1494.8, + "valid_targets_min": 820 + }, + { + "epoch": 4.206390780513358, + "grad_norm": 0.7265269483373465, + "learning_rate": 1.647102404683044e-05, + "loss": 0.1384, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07998554408550262, + "step": 8030, + "valid_targets_mean": 2009.6, + "valid_targets_min": 1256 + }, + { + "epoch": 4.209009952854898, + "grad_norm": 0.7598587392455949, + "learning_rate": 1.6445313606149278e-05, + "loss": 0.1365, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07028426229953766, + "step": 8035, + "valid_targets_mean": 1477.8, + "valid_targets_min": 1122 + }, + { + "epoch": 4.2116291251964375, + "grad_norm": 0.7664829569108801, + "learning_rate": 1.6419609230018183e-05, + "loss": 0.1348, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06817641854286194, + "step": 8040, + "valid_targets_mean": 1564.5, + "valid_targets_min": 850 + }, + { + "epoch": 4.214248297537978, + "grad_norm": 0.7234625660676817, + "learning_rate": 1.639391096229065e-05, + "loss": 0.1262, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07557559013366699, + "step": 8045, + "valid_targets_mean": 1746.5, + "valid_targets_min": 1389 + }, + { + "epoch": 4.216867469879518, + "grad_norm": 0.7745049628839951, + "learning_rate": 1.6368218846809777e-05, + "loss": 0.1412, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0712113231420517, + "step": 8050, + "valid_targets_mean": 1474.5, + "valid_targets_min": 1196 + }, + { + "epoch": 4.219486642221058, + "grad_norm": 0.7587287795680999, + "learning_rate": 1.6342532927408153e-05, + "loss": 0.1386, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07678717374801636, + "step": 8055, + "valid_targets_mean": 1668.9, + "valid_targets_min": 684 + }, + { + "epoch": 4.222105814562598, + "grad_norm": 0.8432068094692399, + "learning_rate": 1.63168532479078e-05, + "loss": 0.1399, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07342837005853653, + "step": 8060, + "valid_targets_mean": 1506.5, + "valid_targets_min": 847 + }, + { + "epoch": 4.224724986904138, + "grad_norm": 0.6838792512397553, + "learning_rate": 1.6291179852120095e-05, + "loss": 0.1407, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07926402986049652, + "step": 8065, + "valid_targets_mean": 1890.0, + "valid_targets_min": 1399 + }, + { + "epoch": 4.227344159245678, + "grad_norm": 0.7674603399756434, + "learning_rate": 1.626551278384569e-05, + "loss": 0.1387, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07749255001544952, + "step": 8070, + "valid_targets_mean": 1633.8, + "valid_targets_min": 594 + }, + { + "epoch": 4.229963331587219, + "grad_norm": 0.7177674834291355, + "learning_rate": 1.623985208687445e-05, + "loss": 0.141, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0683123916387558, + "step": 8075, + "valid_targets_mean": 1847.6, + "valid_targets_min": 958 + }, + { + "epoch": 4.232582503928758, + "grad_norm": 0.6146871340342175, + "learning_rate": 1.6214197804985364e-05, + "loss": 0.1738, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08079074323177338, + "step": 8080, + "valid_targets_mean": 6074.6, + "valid_targets_min": 4960 + }, + { + "epoch": 4.235201676270298, + "grad_norm": 0.40635000420186906, + "learning_rate": 1.6188549981946475e-05, + "loss": 0.1641, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07531790435314178, + "step": 8085, + "valid_targets_mean": 7117.6, + "valid_targets_min": 4541 + }, + { + "epoch": 4.237820848611839, + "grad_norm": 0.41096452601330413, + "learning_rate": 1.616290866151481e-05, + "loss": 0.1583, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08659469336271286, + "step": 8090, + "valid_targets_mean": 6001.4, + "valid_targets_min": 4245 + }, + { + "epoch": 4.240440020953379, + "grad_norm": 0.35428357067602523, + "learning_rate": 1.6137273887436302e-05, + "loss": 0.1585, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0781104564666748, + "step": 8095, + "valid_targets_mean": 7032.8, + "valid_targets_min": 4108 + }, + { + "epoch": 4.243059193294918, + "grad_norm": 0.37198233829614286, + "learning_rate": 1.611164570344572e-05, + "loss": 0.1656, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09088402986526489, + "step": 8100, + "valid_targets_mean": 7311.5, + "valid_targets_min": 4689 + }, + { + "epoch": 4.245678365636459, + "grad_norm": 0.40630240395512573, + "learning_rate": 1.6086024153266574e-05, + "loss": 0.1666, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09036040306091309, + "step": 8105, + "valid_targets_mean": 6030.6, + "valid_targets_min": 4398 + }, + { + "epoch": 4.248297537977999, + "grad_norm": 0.3658256328381038, + "learning_rate": 1.6060409280611083e-05, + "loss": 0.1634, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07792043685913086, + "step": 8110, + "valid_targets_mean": 6799.2, + "valid_targets_min": 4826 + }, + { + "epoch": 4.250916710319539, + "grad_norm": 0.3865735745584883, + "learning_rate": 1.6034801129180047e-05, + "loss": 0.1613, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08830088376998901, + "step": 8115, + "valid_targets_mean": 6354.9, + "valid_targets_min": 4525 + }, + { + "epoch": 4.253535882661079, + "grad_norm": 0.36501909862798587, + "learning_rate": 1.6009199742662804e-05, + "loss": 0.1724, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07458247244358063, + "step": 8120, + "valid_targets_mean": 7312.4, + "valid_targets_min": 4970 + }, + { + "epoch": 4.256155055002619, + "grad_norm": 0.3527712975682088, + "learning_rate": 1.5983605164737172e-05, + "loss": 0.1558, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06650740653276443, + "step": 8125, + "valid_targets_mean": 6569.9, + "valid_targets_min": 4552 + }, + { + "epoch": 4.258774227344159, + "grad_norm": 0.359774858131024, + "learning_rate": 1.595801743906932e-05, + "loss": 0.1703, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07978302240371704, + "step": 8130, + "valid_targets_mean": 7362.2, + "valid_targets_min": 3009 + }, + { + "epoch": 4.2613933996857, + "grad_norm": 0.35719891992865205, + "learning_rate": 1.5932436609313762e-05, + "loss": 0.1529, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.080568328499794, + "step": 8135, + "valid_targets_mean": 7558.4, + "valid_targets_min": 5304 + }, + { + "epoch": 4.264012572027239, + "grad_norm": 0.371634257534297, + "learning_rate": 1.5906862719113223e-05, + "loss": 0.1606, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07417374849319458, + "step": 8140, + "valid_targets_mean": 5596.0, + "valid_targets_min": 3815 + }, + { + "epoch": 4.266631744368779, + "grad_norm": 0.3557170988642468, + "learning_rate": 1.5881295812098584e-05, + "loss": 0.1447, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06920690834522247, + "step": 8145, + "valid_targets_mean": 6001.6, + "valid_targets_min": 4084 + }, + { + "epoch": 4.26925091671032, + "grad_norm": 0.4126654897990094, + "learning_rate": 1.5855735931888837e-05, + "loss": 0.147, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08121057599782944, + "step": 8150, + "valid_targets_mean": 8326.1, + "valid_targets_min": 4939 + }, + { + "epoch": 4.27187008905186, + "grad_norm": 0.35655938026525325, + "learning_rate": 1.583018312209096e-05, + "loss": 0.1612, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07522504031658173, + "step": 8155, + "valid_targets_mean": 6924.6, + "valid_targets_min": 5701 + }, + { + "epoch": 4.274489261393399, + "grad_norm": 0.34066722460043874, + "learning_rate": 1.5804637426299894e-05, + "loss": 0.1573, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05872965604066849, + "step": 8160, + "valid_targets_mean": 6086.9, + "valid_targets_min": 4384 + }, + { + "epoch": 4.27710843373494, + "grad_norm": 0.3492835418379819, + "learning_rate": 1.5779098888098413e-05, + "loss": 0.1438, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08275985717773438, + "step": 8165, + "valid_targets_mean": 7030.6, + "valid_targets_min": 4823 + }, + { + "epoch": 4.27972760607648, + "grad_norm": 0.3846431823338006, + "learning_rate": 1.5753567551057112e-05, + "loss": 0.1432, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07181891798973083, + "step": 8170, + "valid_targets_mean": 6744.6, + "valid_targets_min": 5386 + }, + { + "epoch": 4.28234677841802, + "grad_norm": 0.3922439526902668, + "learning_rate": 1.5728043458734278e-05, + "loss": 0.1533, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08280803263187408, + "step": 8175, + "valid_targets_mean": 6975.9, + "valid_targets_min": 4868 + }, + { + "epoch": 4.28496595075956, + "grad_norm": 0.3705253592513052, + "learning_rate": 1.570252665467583e-05, + "loss": 0.1728, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09138161689043045, + "step": 8180, + "valid_targets_mean": 6363.0, + "valid_targets_min": 4898 + }, + { + "epoch": 4.2875851231011, + "grad_norm": 0.39750400903323196, + "learning_rate": 1.567701718241529e-05, + "loss": 0.1531, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08012625575065613, + "step": 8185, + "valid_targets_mean": 5625.8, + "valid_targets_min": 3834 + }, + { + "epoch": 4.29020429544264, + "grad_norm": 0.43953803462340063, + "learning_rate": 1.565151508547363e-05, + "loss": 0.157, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10322760045528412, + "step": 8190, + "valid_targets_mean": 6519.0, + "valid_targets_min": 4551 + }, + { + "epoch": 4.292823467784181, + "grad_norm": 0.4045476476035004, + "learning_rate": 1.5626020407359266e-05, + "loss": 0.1648, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08422790467739105, + "step": 8195, + "valid_targets_mean": 5930.0, + "valid_targets_min": 4462 + }, + { + "epoch": 4.29544264012572, + "grad_norm": 0.37836438305764863, + "learning_rate": 1.560053319156795e-05, + "loss": 0.1835, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07530433684587479, + "step": 8200, + "valid_targets_mean": 5775.8, + "valid_targets_min": 4973 + }, + { + "epoch": 4.29806181246726, + "grad_norm": 0.37808126695418026, + "learning_rate": 1.5575053481582694e-05, + "loss": 0.1863, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08002137392759323, + "step": 8205, + "valid_targets_mean": 6459.4, + "valid_targets_min": 4619 + }, + { + "epoch": 4.300680984808801, + "grad_norm": 0.3833585919515166, + "learning_rate": 1.5549581320873715e-05, + "loss": 0.1578, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07882620394229889, + "step": 8210, + "valid_targets_mean": 6217.4, + "valid_targets_min": 5647 + }, + { + "epoch": 4.303300157150341, + "grad_norm": 0.36986935643126034, + "learning_rate": 1.5524116752898347e-05, + "loss": 0.1609, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07829003036022186, + "step": 8215, + "valid_targets_mean": 7183.4, + "valid_targets_min": 4398 + }, + { + "epoch": 4.30591932949188, + "grad_norm": 0.4002580775962094, + "learning_rate": 1.5498659821100975e-05, + "loss": 0.1619, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09484715759754181, + "step": 8220, + "valid_targets_mean": 6605.8, + "valid_targets_min": 4418 + }, + { + "epoch": 4.308538501833421, + "grad_norm": 0.3925185745729677, + "learning_rate": 1.5473210568912935e-05, + "loss": 0.1672, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07751842588186264, + "step": 8225, + "valid_targets_mean": 5922.4, + "valid_targets_min": 4969 + }, + { + "epoch": 4.311157674174961, + "grad_norm": 0.37590531017000645, + "learning_rate": 1.54477690397525e-05, + "loss": 0.1545, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08296653628349304, + "step": 8230, + "valid_targets_mean": 7903.5, + "valid_targets_min": 5042 + }, + { + "epoch": 4.313776846516501, + "grad_norm": 0.44387549334873155, + "learning_rate": 1.5422335277024733e-05, + "loss": 0.1693, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08491471409797668, + "step": 8235, + "valid_targets_mean": 7043.1, + "valid_targets_min": 4625 + }, + { + "epoch": 4.316396018858041, + "grad_norm": 0.4238226569876959, + "learning_rate": 1.5396909324121446e-05, + "loss": 0.1657, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0797121524810791, + "step": 8240, + "valid_targets_mean": 6242.0, + "valid_targets_min": 4820 + }, + { + "epoch": 4.319015191199581, + "grad_norm": 0.3864608870176148, + "learning_rate": 1.5371491224421165e-05, + "loss": 0.1532, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07022988796234131, + "step": 8245, + "valid_targets_mean": 5716.8, + "valid_targets_min": 4337 + }, + { + "epoch": 4.321634363541121, + "grad_norm": 0.3244819918244311, + "learning_rate": 1.5346081021288967e-05, + "loss": 0.1416, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07506868243217468, + "step": 8250, + "valid_targets_mean": 7500.8, + "valid_targets_min": 3794 + }, + { + "epoch": 4.3242535358826615, + "grad_norm": 0.4429870159176524, + "learning_rate": 1.5320678758076504e-05, + "loss": 0.1575, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07346892356872559, + "step": 8255, + "valid_targets_mean": 6387.5, + "valid_targets_min": 5298 + }, + { + "epoch": 4.326872708224201, + "grad_norm": 0.40158137143360445, + "learning_rate": 1.5295284478121847e-05, + "loss": 0.169, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08658412098884583, + "step": 8260, + "valid_targets_mean": 6235.0, + "valid_targets_min": 4543 + }, + { + "epoch": 4.329491880565741, + "grad_norm": 0.4174231059537175, + "learning_rate": 1.5269898224749454e-05, + "loss": 0.1645, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08053864538669586, + "step": 8265, + "valid_targets_mean": 6094.1, + "valid_targets_min": 4713 + }, + { + "epoch": 4.3321110529072815, + "grad_norm": 0.3911365100150199, + "learning_rate": 1.5244520041270114e-05, + "loss": 0.1503, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07582774758338928, + "step": 8270, + "valid_targets_mean": 6039.5, + "valid_targets_min": 5269 + }, + { + "epoch": 4.334730225248821, + "grad_norm": 0.38473495145801856, + "learning_rate": 1.5219149970980809e-05, + "loss": 0.1504, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08208172768354416, + "step": 8275, + "valid_targets_mean": 6892.6, + "valid_targets_min": 3450 + }, + { + "epoch": 4.337349397590361, + "grad_norm": 0.37531303252658804, + "learning_rate": 1.5193788057164716e-05, + "loss": 0.1592, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07927361130714417, + "step": 8280, + "valid_targets_mean": 6732.4, + "valid_targets_min": 4549 + }, + { + "epoch": 4.3399685699319015, + "grad_norm": 0.3707714784701887, + "learning_rate": 1.5168434343091061e-05, + "loss": 0.1629, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0851498544216156, + "step": 8285, + "valid_targets_mean": 6249.5, + "valid_targets_min": 4838 + }, + { + "epoch": 4.342587742273442, + "grad_norm": 0.38722948193703377, + "learning_rate": 1.5143088872015121e-05, + "loss": 0.1525, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08623776584863663, + "step": 8290, + "valid_targets_mean": 6519.8, + "valid_targets_min": 4716 + }, + { + "epoch": 4.345206914614982, + "grad_norm": 0.44394643149366275, + "learning_rate": 1.511775168717808e-05, + "loss": 0.1567, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08702689409255981, + "step": 8295, + "valid_targets_mean": 5549.1, + "valid_targets_min": 4309 + }, + { + "epoch": 4.3478260869565215, + "grad_norm": 0.38937467723302926, + "learning_rate": 1.5092422831806981e-05, + "loss": 0.1636, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0843573585152626, + "step": 8300, + "valid_targets_mean": 6353.5, + "valid_targets_min": 4923 + }, + { + "epoch": 4.350445259298062, + "grad_norm": 0.35874973212622546, + "learning_rate": 1.5067102349114686e-05, + "loss": 0.1355, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06433399021625519, + "step": 8305, + "valid_targets_mean": 6128.0, + "valid_targets_min": 4112 + }, + { + "epoch": 4.353064431639602, + "grad_norm": 0.37073705519190303, + "learning_rate": 1.5041790282299742e-05, + "loss": 0.1363, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0748823881149292, + "step": 8310, + "valid_targets_mean": 5755.4, + "valid_targets_min": 3761 + }, + { + "epoch": 4.3556836039811415, + "grad_norm": 0.3665699262275065, + "learning_rate": 1.5016486674546367e-05, + "loss": 0.1445, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06569778919219971, + "step": 8315, + "valid_targets_mean": 6331.2, + "valid_targets_min": 4928 + }, + { + "epoch": 4.358302776322682, + "grad_norm": 0.4175247424390106, + "learning_rate": 1.499119156902432e-05, + "loss": 0.151, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07225983589887619, + "step": 8320, + "valid_targets_mean": 5321.1, + "valid_targets_min": 3853 + }, + { + "epoch": 4.360921948664222, + "grad_norm": 0.5019380728771753, + "learning_rate": 1.4965905008888864e-05, + "loss": 0.1717, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09124556183815002, + "step": 8325, + "valid_targets_mean": 6596.5, + "valid_targets_min": 4989 + }, + { + "epoch": 4.363541121005762, + "grad_norm": 0.4131044204920539, + "learning_rate": 1.4940627037280693e-05, + "loss": 0.1906, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08972490578889847, + "step": 8330, + "valid_targets_mean": 6367.1, + "valid_targets_min": 4487 + }, + { + "epoch": 4.366160293347303, + "grad_norm": 0.3813952818346332, + "learning_rate": 1.4915357697325834e-05, + "loss": 0.1512, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06765107810497284, + "step": 8335, + "valid_targets_mean": 5445.4, + "valid_targets_min": 4773 + }, + { + "epoch": 4.368779465688842, + "grad_norm": 0.3979086901828073, + "learning_rate": 1.48900970321356e-05, + "loss": 0.1583, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08942441642284393, + "step": 8340, + "valid_targets_mean": 6128.0, + "valid_targets_min": 4608 + }, + { + "epoch": 4.371398638030382, + "grad_norm": 0.3792761939688784, + "learning_rate": 1.4864845084806492e-05, + "loss": 0.1548, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07978663593530655, + "step": 8345, + "valid_targets_mean": 6867.9, + "valid_targets_min": 4896 + }, + { + "epoch": 4.374017810371923, + "grad_norm": 0.3965678390767401, + "learning_rate": 1.4839601898420153e-05, + "loss": 0.1772, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08483615517616272, + "step": 8350, + "valid_targets_mean": 6932.2, + "valid_targets_min": 4949 + }, + { + "epoch": 4.376636982713462, + "grad_norm": 0.44849932550494337, + "learning_rate": 1.4814367516043263e-05, + "loss": 0.1638, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08830994367599487, + "step": 8355, + "valid_targets_mean": 6357.8, + "valid_targets_min": 4489 + }, + { + "epoch": 4.379256155055002, + "grad_norm": 0.4033732904904218, + "learning_rate": 1.4789141980727488e-05, + "loss": 0.1576, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07515868544578552, + "step": 8360, + "valid_targets_mean": 5858.9, + "valid_targets_min": 4865 + }, + { + "epoch": 4.381875327396543, + "grad_norm": 0.3966493629251246, + "learning_rate": 1.4763925335509411e-05, + "loss": 0.1625, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07647809386253357, + "step": 8365, + "valid_targets_mean": 6141.9, + "valid_targets_min": 4452 + }, + { + "epoch": 4.384494499738083, + "grad_norm": 0.3614593249290682, + "learning_rate": 1.473871762341042e-05, + "loss": 0.1414, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07073986530303955, + "step": 8370, + "valid_targets_mean": 6311.6, + "valid_targets_min": 4915 + }, + { + "epoch": 4.387113672079622, + "grad_norm": 0.35566488596181045, + "learning_rate": 1.4713518887436702e-05, + "loss": 0.1564, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06397022306919098, + "step": 8375, + "valid_targets_mean": 5685.0, + "valid_targets_min": 3727 + }, + { + "epoch": 4.389732844421163, + "grad_norm": 0.38131493278440376, + "learning_rate": 1.46883291705791e-05, + "loss": 0.1998, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07835820317268372, + "step": 8380, + "valid_targets_mean": 6329.0, + "valid_targets_min": 4482 + }, + { + "epoch": 4.392352016762703, + "grad_norm": 0.38581415170959144, + "learning_rate": 1.4663148515813066e-05, + "loss": 0.1488, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07043133676052094, + "step": 8385, + "valid_targets_mean": 6156.1, + "valid_targets_min": 3362 + }, + { + "epoch": 4.394971189104243, + "grad_norm": 0.4008182160511644, + "learning_rate": 1.4637976966098628e-05, + "loss": 0.1612, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07270411401987076, + "step": 8390, + "valid_targets_mean": 5596.8, + "valid_targets_min": 4395 + }, + { + "epoch": 4.397590361445783, + "grad_norm": 0.40338277115891336, + "learning_rate": 1.4612814564380231e-05, + "loss": 0.1608, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07577487826347351, + "step": 8395, + "valid_targets_mean": 5501.1, + "valid_targets_min": 4135 + }, + { + "epoch": 4.400209533787323, + "grad_norm": 0.37926452431990737, + "learning_rate": 1.4587661353586761e-05, + "loss": 0.1508, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06744927912950516, + "step": 8400, + "valid_targets_mean": 5784.1, + "valid_targets_min": 4262 + }, + { + "epoch": 4.402828706128863, + "grad_norm": 0.3872729945282216, + "learning_rate": 1.456251737663138e-05, + "loss": 0.1416, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08369916677474976, + "step": 8405, + "valid_targets_mean": 7510.2, + "valid_targets_min": 5149 + }, + { + "epoch": 4.405447878470404, + "grad_norm": 0.38975460785350247, + "learning_rate": 1.4537382676411536e-05, + "loss": 0.1476, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06407198309898376, + "step": 8410, + "valid_targets_mean": 5908.6, + "valid_targets_min": 3437 + }, + { + "epoch": 4.408067050811943, + "grad_norm": 0.394670282237162, + "learning_rate": 1.451225729580882e-05, + "loss": 0.1535, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07432819157838821, + "step": 8415, + "valid_targets_mean": 6852.4, + "valid_targets_min": 3535 + }, + { + "epoch": 4.410686223153483, + "grad_norm": 0.3901780229884973, + "learning_rate": 1.448714127768893e-05, + "loss": 0.1484, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08478435128927231, + "step": 8420, + "valid_targets_mean": 6686.4, + "valid_targets_min": 4712 + }, + { + "epoch": 4.413305395495024, + "grad_norm": 0.3489415062198455, + "learning_rate": 1.4462034664901608e-05, + "loss": 0.1505, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07812289893627167, + "step": 8425, + "valid_targets_mean": 7596.2, + "valid_targets_min": 4987 + }, + { + "epoch": 4.415924567836564, + "grad_norm": 0.376974197859487, + "learning_rate": 1.4436937500280522e-05, + "loss": 0.1583, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07755880057811737, + "step": 8430, + "valid_targets_mean": 6937.0, + "valid_targets_min": 3577 + }, + { + "epoch": 4.418543740178103, + "grad_norm": 0.40396905556405893, + "learning_rate": 1.4411849826643252e-05, + "loss": 0.1383, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07415942847728729, + "step": 8435, + "valid_targets_mean": 5414.4, + "valid_targets_min": 3665 + }, + { + "epoch": 4.421162912519644, + "grad_norm": 0.4660682122084262, + "learning_rate": 1.4386771686791161e-05, + "loss": 0.1597, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07723142951726913, + "step": 8440, + "valid_targets_mean": 6955.4, + "valid_targets_min": 5409 + }, + { + "epoch": 4.423782084861184, + "grad_norm": 0.40122313872101795, + "learning_rate": 1.4361703123509347e-05, + "loss": 0.1606, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08311334252357483, + "step": 8445, + "valid_targets_mean": 6058.8, + "valid_targets_min": 3545 + }, + { + "epoch": 4.426401257202724, + "grad_norm": 0.6657607597510616, + "learning_rate": 1.4336644179566595e-05, + "loss": 0.186, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1686384677886963, + "step": 8450, + "valid_targets_mean": 5807.8, + "valid_targets_min": 2317 + }, + { + "epoch": 4.429020429544264, + "grad_norm": 0.531777753535127, + "learning_rate": 1.4311594897715249e-05, + "loss": 0.2296, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1320067048072815, + "step": 8455, + "valid_targets_mean": 5801.6, + "valid_targets_min": 2453 + }, + { + "epoch": 4.431639601885804, + "grad_norm": 0.5398361384530933, + "learning_rate": 1.4286555320691182e-05, + "loss": 0.2268, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12875959277153015, + "step": 8460, + "valid_targets_mean": 5075.4, + "valid_targets_min": 835 + }, + { + "epoch": 4.434258774227344, + "grad_norm": 0.5868007605547965, + "learning_rate": 1.4261525491213712e-05, + "loss": 0.2241, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13063159584999084, + "step": 8465, + "valid_targets_mean": 4082.1, + "valid_targets_min": 1201 + }, + { + "epoch": 4.436877946568885, + "grad_norm": 0.5381634816077148, + "learning_rate": 1.4236505451985533e-05, + "loss": 0.2138, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1091819629073143, + "step": 8470, + "valid_targets_mean": 4560.0, + "valid_targets_min": 1880 + }, + { + "epoch": 4.439497118910424, + "grad_norm": 0.5310120711737825, + "learning_rate": 1.4211495245692608e-05, + "loss": 0.2381, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16839918494224548, + "step": 8475, + "valid_targets_mean": 6637.9, + "valid_targets_min": 2171 + }, + { + "epoch": 4.442116291251964, + "grad_norm": 0.5190278146440941, + "learning_rate": 1.4186494915004159e-05, + "loss": 0.216, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1253286898136139, + "step": 8480, + "valid_targets_mean": 6562.5, + "valid_targets_min": 1789 + }, + { + "epoch": 4.444735463593505, + "grad_norm": 0.4867697495156829, + "learning_rate": 1.4161504502572541e-05, + "loss": 0.2226, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09787391126155853, + "step": 8485, + "valid_targets_mean": 5572.5, + "valid_targets_min": 1855 + }, + { + "epoch": 4.447354635935045, + "grad_norm": 0.5822314957768182, + "learning_rate": 1.4136524051033181e-05, + "loss": 0.2232, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11792335659265518, + "step": 8490, + "valid_targets_mean": 3913.8, + "valid_targets_min": 1024 + }, + { + "epoch": 4.449973808276584, + "grad_norm": 0.5158227550646646, + "learning_rate": 1.4111553603004538e-05, + "loss": 0.2314, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11358408629894257, + "step": 8495, + "valid_targets_mean": 4908.0, + "valid_targets_min": 2107 + }, + { + "epoch": 4.452592980618125, + "grad_norm": 0.5869961539965604, + "learning_rate": 1.4086593201087979e-05, + "loss": 0.2274, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12451714277267456, + "step": 8500, + "valid_targets_mean": 4423.2, + "valid_targets_min": 802 + }, + { + "epoch": 4.455212152959665, + "grad_norm": 0.4611985891917862, + "learning_rate": 1.4061642887867732e-05, + "loss": 0.2133, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08776941895484924, + "step": 8505, + "valid_targets_mean": 4354.5, + "valid_targets_min": 1597 + }, + { + "epoch": 4.457831325301205, + "grad_norm": 0.5688775918226212, + "learning_rate": 1.4036702705910842e-05, + "loss": 0.2269, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11041654646396637, + "step": 8510, + "valid_targets_mean": 3518.2, + "valid_targets_min": 1650 + }, + { + "epoch": 4.460450497642745, + "grad_norm": 0.5518642875567444, + "learning_rate": 1.401177269776703e-05, + "loss": 0.2216, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1132279559969902, + "step": 8515, + "valid_targets_mean": 4340.0, + "valid_targets_min": 1385 + }, + { + "epoch": 4.463069669984285, + "grad_norm": 0.6094475008163417, + "learning_rate": 1.3986852905968694e-05, + "loss": 0.2154, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1261036992073059, + "step": 8520, + "valid_targets_mean": 4061.2, + "valid_targets_min": 3087 + }, + { + "epoch": 4.465688842325825, + "grad_norm": 0.5162864921806446, + "learning_rate": 1.396194337303078e-05, + "loss": 0.2208, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10235683619976044, + "step": 8525, + "valid_targets_mean": 5073.4, + "valid_targets_min": 2785 + }, + { + "epoch": 4.4683080146673655, + "grad_norm": 0.6088077594799497, + "learning_rate": 1.393704414145073e-05, + "loss": 0.2158, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11759968847036362, + "step": 8530, + "valid_targets_mean": 4354.0, + "valid_targets_min": 1210 + }, + { + "epoch": 4.470927187008905, + "grad_norm": 0.6151449199270609, + "learning_rate": 1.3912155253708437e-05, + "loss": 0.2196, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11967704445123672, + "step": 8535, + "valid_targets_mean": 3266.6, + "valid_targets_min": 1064 + }, + { + "epoch": 4.473546359350445, + "grad_norm": 0.6436183746478787, + "learning_rate": 1.3887276752266113e-05, + "loss": 0.2281, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11920354515314102, + "step": 8540, + "valid_targets_mean": 3360.6, + "valid_targets_min": 1678 + }, + { + "epoch": 4.4761655316919855, + "grad_norm": 0.589124862126253, + "learning_rate": 1.3862408679568282e-05, + "loss": 0.2215, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10800355672836304, + "step": 8545, + "valid_targets_mean": 3776.0, + "valid_targets_min": 671 + }, + { + "epoch": 4.478784704033526, + "grad_norm": 0.6317737872398538, + "learning_rate": 1.3837551078041644e-05, + "loss": 0.2233, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11351955682039261, + "step": 8550, + "valid_targets_mean": 3642.9, + "valid_targets_min": 2000 + }, + { + "epoch": 4.481403876375065, + "grad_norm": 0.6298128571652256, + "learning_rate": 1.381270399009507e-05, + "loss": 0.2096, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13147234916687012, + "step": 8555, + "valid_targets_mean": 4261.9, + "valid_targets_min": 1532 + }, + { + "epoch": 4.4840230487166055, + "grad_norm": 0.5943111027501365, + "learning_rate": 1.3787867458119464e-05, + "loss": 0.2116, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07439844310283661, + "step": 8560, + "valid_targets_mean": 3298.9, + "valid_targets_min": 1051 + }, + { + "epoch": 4.486642221058146, + "grad_norm": 0.5826298433530936, + "learning_rate": 1.3763041524487721e-05, + "loss": 0.2047, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09946641325950623, + "step": 8565, + "valid_targets_mean": 3058.1, + "valid_targets_min": 1345 + }, + { + "epoch": 4.489261393399686, + "grad_norm": 0.5620343902348789, + "learning_rate": 1.3738226231554687e-05, + "loss": 0.2191, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09985310584306717, + "step": 8570, + "valid_targets_mean": 4157.6, + "valid_targets_min": 2231 + }, + { + "epoch": 4.4918805657412255, + "grad_norm": 0.6195213507564987, + "learning_rate": 1.3713421621657015e-05, + "loss": 0.2231, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08839579671621323, + "step": 8575, + "valid_targets_mean": 3561.4, + "valid_targets_min": 2127 + }, + { + "epoch": 4.494499738082766, + "grad_norm": 0.6569017535266028, + "learning_rate": 1.3688627737113163e-05, + "loss": 0.2134, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11849110573530197, + "step": 8580, + "valid_targets_mean": 3363.4, + "valid_targets_min": 1265 + }, + { + "epoch": 4.497118910424306, + "grad_norm": 0.564846860750686, + "learning_rate": 1.3663844620223272e-05, + "loss": 0.2114, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08929997682571411, + "step": 8585, + "valid_targets_mean": 3700.0, + "valid_targets_min": 908 + }, + { + "epoch": 4.499738082765846, + "grad_norm": 0.6512149054655086, + "learning_rate": 1.3639072313269106e-05, + "loss": 0.2141, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11318524181842804, + "step": 8590, + "valid_targets_mean": 2910.9, + "valid_targets_min": 1264 + }, + { + "epoch": 4.502357255107386, + "grad_norm": 0.6465709019919834, + "learning_rate": 1.3614310858514016e-05, + "loss": 0.2102, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1102558895945549, + "step": 8595, + "valid_targets_mean": 2855.2, + "valid_targets_min": 926 + }, + { + "epoch": 4.504976427448926, + "grad_norm": 0.6563597261559485, + "learning_rate": 1.3589560298202811e-05, + "loss": 0.2115, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08837442845106125, + "step": 8600, + "valid_targets_mean": 2905.6, + "valid_targets_min": 1016 + }, + { + "epoch": 4.507595599790466, + "grad_norm": 0.6180672798730263, + "learning_rate": 1.3564820674561726e-05, + "loss": 0.2081, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09526603668928146, + "step": 8605, + "valid_targets_mean": 3499.9, + "valid_targets_min": 2019 + }, + { + "epoch": 4.510214772132006, + "grad_norm": 0.602696371537178, + "learning_rate": 1.354009202979833e-05, + "loss": 0.2165, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13709108531475067, + "step": 8610, + "valid_targets_mean": 4911.0, + "valid_targets_min": 3583 + }, + { + "epoch": 4.512833944473546, + "grad_norm": 0.5830142516755014, + "learning_rate": 1.3515374406101476e-05, + "loss": 0.2088, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09028695523738861, + "step": 8615, + "valid_targets_mean": 3381.5, + "valid_targets_min": 1110 + }, + { + "epoch": 4.515453116815086, + "grad_norm": 0.6140449216611795, + "learning_rate": 1.3490667845641188e-05, + "loss": 0.2076, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12959925830364227, + "step": 8620, + "valid_targets_mean": 4497.9, + "valid_targets_min": 1460 + }, + { + "epoch": 4.518072289156627, + "grad_norm": 0.6397151511956849, + "learning_rate": 1.3465972390568643e-05, + "loss": 0.2057, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12052600830793381, + "step": 8625, + "valid_targets_mean": 3962.4, + "valid_targets_min": 2719 + }, + { + "epoch": 4.520691461498167, + "grad_norm": 0.6190465441758102, + "learning_rate": 1.3441288083016058e-05, + "loss": 0.2182, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09589071571826935, + "step": 8630, + "valid_targets_mean": 3175.9, + "valid_targets_min": 1673 + }, + { + "epoch": 4.523310633839706, + "grad_norm": 0.5992094789548759, + "learning_rate": 1.3416614965096622e-05, + "loss": 0.212, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09990492463111877, + "step": 8635, + "valid_targets_mean": 3482.6, + "valid_targets_min": 1860 + }, + { + "epoch": 4.525929806181247, + "grad_norm": 0.5499261289440762, + "learning_rate": 1.3391953078904458e-05, + "loss": 0.2085, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1030711829662323, + "step": 8640, + "valid_targets_mean": 4597.0, + "valid_targets_min": 2934 + }, + { + "epoch": 4.528548978522787, + "grad_norm": 0.6006706484609484, + "learning_rate": 1.3367302466514514e-05, + "loss": 0.2055, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10380536317825317, + "step": 8645, + "valid_targets_mean": 3667.6, + "valid_targets_min": 1945 + }, + { + "epoch": 4.5311681508643264, + "grad_norm": 0.5931622596203528, + "learning_rate": 1.3342663169982486e-05, + "loss": 0.2162, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10778256505727768, + "step": 8650, + "valid_targets_mean": 4618.9, + "valid_targets_min": 1908 + }, + { + "epoch": 4.533787323205867, + "grad_norm": 0.6151803569221982, + "learning_rate": 1.3318035231344806e-05, + "loss": 0.2108, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1142893061041832, + "step": 8655, + "valid_targets_mean": 3561.0, + "valid_targets_min": 2250 + }, + { + "epoch": 4.536406495547407, + "grad_norm": 0.583305321099175, + "learning_rate": 1.3293418692618483e-05, + "loss": 0.2099, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08924940228462219, + "step": 8660, + "valid_targets_mean": 4291.5, + "valid_targets_min": 2492 + }, + { + "epoch": 4.539025667888947, + "grad_norm": 0.7014814716734583, + "learning_rate": 1.3268813595801113e-05, + "loss": 0.2126, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10996967554092407, + "step": 8665, + "valid_targets_mean": 4467.1, + "valid_targets_min": 3059 + }, + { + "epoch": 4.541644840230488, + "grad_norm": 0.6206863740286671, + "learning_rate": 1.3244219982870748e-05, + "loss": 0.2049, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1131991371512413, + "step": 8670, + "valid_targets_mean": 4255.2, + "valid_targets_min": 2283 + }, + { + "epoch": 4.544264012572027, + "grad_norm": 0.6771063630964453, + "learning_rate": 1.3219637895785864e-05, + "loss": 0.2082, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11287044733762741, + "step": 8675, + "valid_targets_mean": 3564.6, + "valid_targets_min": 1182 + }, + { + "epoch": 4.546883184913567, + "grad_norm": 0.5413704303329966, + "learning_rate": 1.3195067376485264e-05, + "loss": 0.2078, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09840285032987595, + "step": 8680, + "valid_targets_mean": 4895.6, + "valid_targets_min": 1869 + }, + { + "epoch": 4.549502357255108, + "grad_norm": 0.5874254960826278, + "learning_rate": 1.3170508466888009e-05, + "loss": 0.2142, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12842625379562378, + "step": 8685, + "valid_targets_mean": 4721.1, + "valid_targets_min": 2498 + }, + { + "epoch": 4.552121529596647, + "grad_norm": 0.6533078396292977, + "learning_rate": 1.3145961208893372e-05, + "loss": 0.2198, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1062917560338974, + "step": 8690, + "valid_targets_mean": 2935.6, + "valid_targets_min": 988 + }, + { + "epoch": 4.554740701938187, + "grad_norm": 0.6391898982211924, + "learning_rate": 1.312142564438072e-05, + "loss": 0.2062, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11164413392543793, + "step": 8695, + "valid_targets_mean": 4191.4, + "valid_targets_min": 1534 + }, + { + "epoch": 4.557359874279728, + "grad_norm": 0.6046360407355982, + "learning_rate": 1.309690181520951e-05, + "loss": 0.2117, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10599304735660553, + "step": 8700, + "valid_targets_mean": 3546.4, + "valid_targets_min": 2252 + }, + { + "epoch": 4.559979046621268, + "grad_norm": 0.8632738414383352, + "learning_rate": 1.3072389763219144e-05, + "loss": 0.2167, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1250210702419281, + "step": 8705, + "valid_targets_mean": 3548.0, + "valid_targets_min": 1436 + }, + { + "epoch": 4.562598218962807, + "grad_norm": 0.6118169461610888, + "learning_rate": 1.3047889530228928e-05, + "loss": 0.2099, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1000833511352539, + "step": 8710, + "valid_targets_mean": 4002.1, + "valid_targets_min": 2333 + }, + { + "epoch": 4.565217391304348, + "grad_norm": 0.6094791048918677, + "learning_rate": 1.3023401158038038e-05, + "loss": 0.204, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0900658667087555, + "step": 8715, + "valid_targets_mean": 3507.9, + "valid_targets_min": 1259 + }, + { + "epoch": 4.567836563645888, + "grad_norm": 0.6202992915362916, + "learning_rate": 1.2998924688425377e-05, + "loss": 0.2032, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08818884193897247, + "step": 8720, + "valid_targets_mean": 2891.5, + "valid_targets_min": 1319 + }, + { + "epoch": 4.570455735987428, + "grad_norm": 0.6106657583472571, + "learning_rate": 1.2974460163149575e-05, + "loss": 0.1924, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09374313056468964, + "step": 8725, + "valid_targets_mean": 3002.8, + "valid_targets_min": 1194 + }, + { + "epoch": 4.573074908328968, + "grad_norm": 0.6611859041510075, + "learning_rate": 1.2950007623948857e-05, + "loss": 0.2274, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0970490351319313, + "step": 8730, + "valid_targets_mean": 2704.0, + "valid_targets_min": 1453 + }, + { + "epoch": 4.575694080670508, + "grad_norm": 0.5176574483366256, + "learning_rate": 1.292556711254101e-05, + "loss": 0.2018, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09145693480968475, + "step": 8735, + "valid_targets_mean": 5175.9, + "valid_targets_min": 3011 + }, + { + "epoch": 4.578313253012048, + "grad_norm": 0.5876009983134065, + "learning_rate": 1.2901138670623308e-05, + "loss": 0.2178, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0815117210149765, + "step": 8740, + "valid_targets_mean": 2915.9, + "valid_targets_min": 1256 + }, + { + "epoch": 4.580932425353589, + "grad_norm": 0.6349592745954749, + "learning_rate": 1.2876722339872414e-05, + "loss": 0.2085, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1345708966255188, + "step": 8745, + "valid_targets_mean": 4661.6, + "valid_targets_min": 1336 + }, + { + "epoch": 4.583551597695128, + "grad_norm": 0.6521800380858361, + "learning_rate": 1.2852318161944348e-05, + "loss": 0.2209, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10511691123247147, + "step": 8750, + "valid_targets_mean": 3390.4, + "valid_targets_min": 1275 + }, + { + "epoch": 4.586170770036668, + "grad_norm": 0.6147533075586407, + "learning_rate": 1.2827926178474388e-05, + "loss": 0.2079, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11512017250061035, + "step": 8755, + "valid_targets_mean": 3660.0, + "valid_targets_min": 2202 + }, + { + "epoch": 4.588789942378209, + "grad_norm": 0.605091604756251, + "learning_rate": 1.2803546431077008e-05, + "loss": 0.2036, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11255483329296112, + "step": 8760, + "valid_targets_mean": 4094.2, + "valid_targets_min": 3236 + }, + { + "epoch": 4.591409114719749, + "grad_norm": 0.6660110056330647, + "learning_rate": 1.2779178961345804e-05, + "loss": 0.1998, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10259729623794556, + "step": 8765, + "valid_targets_mean": 3057.6, + "valid_targets_min": 1573 + }, + { + "epoch": 4.594028287061288, + "grad_norm": 0.6149358237464726, + "learning_rate": 1.2754823810853427e-05, + "loss": 0.1977, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0949232429265976, + "step": 8770, + "valid_targets_mean": 3780.9, + "valid_targets_min": 2343 + }, + { + "epoch": 4.596647459402829, + "grad_norm": 0.5747609813308386, + "learning_rate": 1.2730481021151518e-05, + "loss": 0.193, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08529553562402725, + "step": 8775, + "valid_targets_mean": 2815.8, + "valid_targets_min": 1026 + }, + { + "epoch": 4.599266631744369, + "grad_norm": 0.6395929759195625, + "learning_rate": 1.2706150633770612e-05, + "loss": 0.1972, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09475855529308319, + "step": 8780, + "valid_targets_mean": 3460.9, + "valid_targets_min": 1042 + }, + { + "epoch": 4.601885804085909, + "grad_norm": 0.6147297344304274, + "learning_rate": 1.268183269022011e-05, + "loss": 0.1841, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08383920788764954, + "step": 8785, + "valid_targets_mean": 3172.8, + "valid_targets_min": 1274 + }, + { + "epoch": 4.604504976427449, + "grad_norm": 0.6828514781586573, + "learning_rate": 1.2657527231988151e-05, + "loss": 0.2002, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10674040764570236, + "step": 8790, + "valid_targets_mean": 3939.5, + "valid_targets_min": 1575 + }, + { + "epoch": 4.607124148768989, + "grad_norm": 0.5924182910795877, + "learning_rate": 1.2633234300541612e-05, + "loss": 0.2237, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07903445512056351, + "step": 8795, + "valid_targets_mean": 3739.0, + "valid_targets_min": 1312 + }, + { + "epoch": 4.609743321110529, + "grad_norm": 0.614605999726541, + "learning_rate": 1.2608953937325965e-05, + "loss": 0.2019, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09165416657924652, + "step": 8800, + "valid_targets_mean": 3187.8, + "valid_targets_min": 1683 + }, + { + "epoch": 4.6123624934520695, + "grad_norm": 0.5661510792836556, + "learning_rate": 1.2584686183765245e-05, + "loss": 0.2065, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09626249969005585, + "step": 8805, + "valid_targets_mean": 3945.8, + "valid_targets_min": 1743 + }, + { + "epoch": 4.614981665793609, + "grad_norm": 0.6096210195459415, + "learning_rate": 1.2560431081261997e-05, + "loss": 0.2033, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10719242691993713, + "step": 8810, + "valid_targets_mean": 3953.8, + "valid_targets_min": 2213 + }, + { + "epoch": 4.617600838135149, + "grad_norm": 0.6494948532806525, + "learning_rate": 1.253618867119715e-05, + "loss": 0.2054, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10217788815498352, + "step": 8815, + "valid_targets_mean": 3690.4, + "valid_targets_min": 1586 + }, + { + "epoch": 4.6202200104766895, + "grad_norm": 0.6640530052773205, + "learning_rate": 1.251195899493001e-05, + "loss": 0.2026, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10520057380199432, + "step": 8820, + "valid_targets_mean": 3381.4, + "valid_targets_min": 2033 + }, + { + "epoch": 4.62283918281823, + "grad_norm": 0.5569491511306094, + "learning_rate": 1.248774209379814e-05, + "loss": 0.1914, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08458670973777771, + "step": 8825, + "valid_targets_mean": 3651.2, + "valid_targets_min": 1616 + }, + { + "epoch": 4.625458355159769, + "grad_norm": 0.6330676503326945, + "learning_rate": 1.2463538009117296e-05, + "loss": 0.2085, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09859472513198853, + "step": 8830, + "valid_targets_mean": 3462.6, + "valid_targets_min": 2000 + }, + { + "epoch": 4.6280775275013095, + "grad_norm": 0.5956085487061661, + "learning_rate": 1.2439346782181407e-05, + "loss": 0.1984, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10616499185562134, + "step": 8835, + "valid_targets_mean": 3591.0, + "valid_targets_min": 1750 + }, + { + "epoch": 4.63069669984285, + "grad_norm": 0.6329298549757268, + "learning_rate": 1.2415168454262418e-05, + "loss": 0.2061, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12511585652828217, + "step": 8840, + "valid_targets_mean": 4291.8, + "valid_targets_min": 2429 + }, + { + "epoch": 4.63331587218439, + "grad_norm": 0.6358613876406229, + "learning_rate": 1.2391003066610314e-05, + "loss": 0.2131, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10768921673297882, + "step": 8845, + "valid_targets_mean": 3645.9, + "valid_targets_min": 2342 + }, + { + "epoch": 4.6359350445259295, + "grad_norm": 0.650281533288699, + "learning_rate": 1.2366850660452965e-05, + "loss": 0.2068, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09575870633125305, + "step": 8850, + "valid_targets_mean": 3556.8, + "valid_targets_min": 1571 + }, + { + "epoch": 4.63855421686747, + "grad_norm": 0.6685805031293942, + "learning_rate": 1.2342711276996113e-05, + "loss": 0.2146, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0916060209274292, + "step": 8855, + "valid_targets_mean": 2768.0, + "valid_targets_min": 1487 + }, + { + "epoch": 4.64117338920901, + "grad_norm": 0.5820326114744039, + "learning_rate": 1.2318584957423286e-05, + "loss": 0.2056, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08970531821250916, + "step": 8860, + "valid_targets_mean": 3589.1, + "valid_targets_min": 1970 + }, + { + "epoch": 4.6437925615505495, + "grad_norm": 0.5992598789489589, + "learning_rate": 1.22944717428957e-05, + "loss": 0.218, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0977601408958435, + "step": 8865, + "valid_targets_mean": 4087.2, + "valid_targets_min": 2794 + }, + { + "epoch": 4.64641173389209, + "grad_norm": 0.6474027107259887, + "learning_rate": 1.2270371674552242e-05, + "loss": 0.2122, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0806116908788681, + "step": 8870, + "valid_targets_mean": 2785.5, + "valid_targets_min": 1066 + }, + { + "epoch": 4.64903090623363, + "grad_norm": 0.6027629773312335, + "learning_rate": 1.2246284793509355e-05, + "loss": 0.2126, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09002608805894852, + "step": 8875, + "valid_targets_mean": 3409.9, + "valid_targets_min": 2281 + }, + { + "epoch": 4.65165007857517, + "grad_norm": 0.6146930851839235, + "learning_rate": 1.222221114086099e-05, + "loss": 0.2093, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10688142478466034, + "step": 8880, + "valid_targets_mean": 4227.4, + "valid_targets_min": 1969 + }, + { + "epoch": 4.654269250916711, + "grad_norm": 0.637652856281438, + "learning_rate": 1.2198150757678518e-05, + "loss": 0.2052, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08704520016908646, + "step": 8885, + "valid_targets_mean": 2942.6, + "valid_targets_min": 1005 + }, + { + "epoch": 4.65688842325825, + "grad_norm": 0.6166255110417656, + "learning_rate": 1.2174103685010682e-05, + "loss": 0.2052, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09632515907287598, + "step": 8890, + "valid_targets_mean": 3895.9, + "valid_targets_min": 1980 + }, + { + "epoch": 4.65950759559979, + "grad_norm": 0.6358729645012968, + "learning_rate": 1.2150069963883517e-05, + "loss": 0.2113, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12068484723567963, + "step": 8895, + "valid_targets_mean": 4768.2, + "valid_targets_min": 1257 + }, + { + "epoch": 4.662126767941331, + "grad_norm": 0.6516633702770698, + "learning_rate": 1.2126049635300268e-05, + "loss": 0.1997, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1033945083618164, + "step": 8900, + "valid_targets_mean": 3240.4, + "valid_targets_min": 1357 + }, + { + "epoch": 4.66474594028287, + "grad_norm": 0.6050422744445452, + "learning_rate": 1.2102042740241351e-05, + "loss": 0.191, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08464160561561584, + "step": 8905, + "valid_targets_mean": 4587.8, + "valid_targets_min": 1410 + }, + { + "epoch": 4.6673651126244105, + "grad_norm": 0.5991597385320386, + "learning_rate": 1.207804931966424e-05, + "loss": 0.2087, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1021055206656456, + "step": 8910, + "valid_targets_mean": 3696.5, + "valid_targets_min": 1390 + }, + { + "epoch": 4.669984284965951, + "grad_norm": 0.6664424300772166, + "learning_rate": 1.2054069414503442e-05, + "loss": 0.1948, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08218555897474289, + "step": 8915, + "valid_targets_mean": 2997.4, + "valid_targets_min": 790 + }, + { + "epoch": 4.672603457307491, + "grad_norm": 0.5828292771920752, + "learning_rate": 1.2030103065670393e-05, + "loss": 0.2097, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10508102178573608, + "step": 8920, + "valid_targets_mean": 4428.5, + "valid_targets_min": 1901 + }, + { + "epoch": 4.675222629649031, + "grad_norm": 0.6601174887657705, + "learning_rate": 1.2006150314053393e-05, + "loss": 0.207, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0941559448838234, + "step": 8925, + "valid_targets_mean": 2790.1, + "valid_targets_min": 1460 + }, + { + "epoch": 4.677841801990571, + "grad_norm": 0.6374464539298814, + "learning_rate": 1.1982211200517573e-05, + "loss": 0.2066, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11535796523094177, + "step": 8930, + "valid_targets_mean": 4607.4, + "valid_targets_min": 952 + }, + { + "epoch": 4.680460974332111, + "grad_norm": 0.7119024765620463, + "learning_rate": 1.195828576590476e-05, + "loss": 0.2022, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09456755220890045, + "step": 8935, + "valid_targets_mean": 2605.1, + "valid_targets_min": 1551 + }, + { + "epoch": 4.683080146673651, + "grad_norm": 0.5781354468810069, + "learning_rate": 1.1934374051033482e-05, + "loss": 0.2022, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08129958063364029, + "step": 8940, + "valid_targets_mean": 3755.8, + "valid_targets_min": 2267 + }, + { + "epoch": 4.685699319015191, + "grad_norm": 0.5551995108738447, + "learning_rate": 1.1910476096698828e-05, + "loss": 0.2036, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08932093530893326, + "step": 8945, + "valid_targets_mean": 5198.8, + "valid_targets_min": 1233 + }, + { + "epoch": 4.688318491356731, + "grad_norm": 0.5508827780675954, + "learning_rate": 1.1886591943672418e-05, + "loss": 0.1925, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0868104100227356, + "step": 8950, + "valid_targets_mean": 4899.5, + "valid_targets_min": 1741 + }, + { + "epoch": 4.690937663698271, + "grad_norm": 0.621708285770408, + "learning_rate": 1.1862721632702347e-05, + "loss": 0.2026, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10903164744377136, + "step": 8955, + "valid_targets_mean": 4473.5, + "valid_targets_min": 856 + }, + { + "epoch": 4.693556836039812, + "grad_norm": 0.616603535846322, + "learning_rate": 1.1838865204513061e-05, + "loss": 0.1989, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11983565986156464, + "step": 8960, + "valid_targets_mean": 4047.8, + "valid_targets_min": 1062 + }, + { + "epoch": 4.696176008381352, + "grad_norm": 0.559030691721046, + "learning_rate": 1.1815022699805355e-05, + "loss": 0.1926, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08906766027212143, + "step": 8965, + "valid_targets_mean": 4106.0, + "valid_targets_min": 974 + }, + { + "epoch": 4.698795180722891, + "grad_norm": 0.631272737359263, + "learning_rate": 1.1791194159256235e-05, + "loss": 0.1926, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09801031649112701, + "step": 8970, + "valid_targets_mean": 3092.2, + "valid_targets_min": 1447 + }, + { + "epoch": 4.701414353064432, + "grad_norm": 0.6340130444613701, + "learning_rate": 1.1767379623518919e-05, + "loss": 0.1898, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.106422558426857, + "step": 8975, + "valid_targets_mean": 4404.8, + "valid_targets_min": 1744 + }, + { + "epoch": 4.704033525405972, + "grad_norm": 0.6797587465450963, + "learning_rate": 1.1743579133222707e-05, + "loss": 0.1938, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11266933381557465, + "step": 8980, + "valid_targets_mean": 4678.9, + "valid_targets_min": 1515 + }, + { + "epoch": 4.706652697747511, + "grad_norm": 0.7201255929766432, + "learning_rate": 1.1719792728972932e-05, + "loss": 0.2118, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12300004810094833, + "step": 8985, + "valid_targets_mean": 3396.1, + "valid_targets_min": 1349 + }, + { + "epoch": 4.709271870089052, + "grad_norm": 0.6591457046315632, + "learning_rate": 1.1696020451350924e-05, + "loss": 0.2008, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0994521751999855, + "step": 8990, + "valid_targets_mean": 3056.6, + "valid_targets_min": 1156 + }, + { + "epoch": 4.711891042430592, + "grad_norm": 0.6613931388079063, + "learning_rate": 1.1672262340913884e-05, + "loss": 0.194, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1038329005241394, + "step": 8995, + "valid_targets_mean": 3856.4, + "valid_targets_min": 2076 + }, + { + "epoch": 4.714510214772132, + "grad_norm": 0.594735974520261, + "learning_rate": 1.1648518438194853e-05, + "loss": 0.1896, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09430505335330963, + "step": 9000, + "valid_targets_mean": 3352.8, + "valid_targets_min": 1021 + }, + { + "epoch": 4.717129387113673, + "grad_norm": 0.681225593238549, + "learning_rate": 1.1624788783702647e-05, + "loss": 0.1989, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10264322906732559, + "step": 9005, + "valid_targets_mean": 3367.0, + "valid_targets_min": 654 + }, + { + "epoch": 4.719748559455212, + "grad_norm": 0.6283800600755348, + "learning_rate": 1.1601073417921729e-05, + "loss": 0.1931, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10935042798519135, + "step": 9010, + "valid_targets_mean": 4698.5, + "valid_targets_min": 2336 + }, + { + "epoch": 4.722367731796752, + "grad_norm": 0.7413035203402667, + "learning_rate": 1.1577372381312251e-05, + "loss": 0.2067, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09140511602163315, + "step": 9015, + "valid_targets_mean": 2237.0, + "valid_targets_min": 815 + }, + { + "epoch": 4.724986904138293, + "grad_norm": 0.5940483417790948, + "learning_rate": 1.155368571430985e-05, + "loss": 0.1994, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08947218954563141, + "step": 9020, + "valid_targets_mean": 3623.5, + "valid_targets_min": 2389 + }, + { + "epoch": 4.727606076479832, + "grad_norm": 0.6492608693015333, + "learning_rate": 1.1530013457325708e-05, + "loss": 0.2028, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10537391901016235, + "step": 9025, + "valid_targets_mean": 3766.9, + "valid_targets_min": 1793 + }, + { + "epoch": 4.730225248821372, + "grad_norm": 0.6693284764498884, + "learning_rate": 1.1506355650746364e-05, + "loss": 0.2031, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0952562540769577, + "step": 9030, + "valid_targets_mean": 3133.1, + "valid_targets_min": 1217 + }, + { + "epoch": 4.732844421162913, + "grad_norm": 0.6464798992791625, + "learning_rate": 1.1482712334933769e-05, + "loss": 0.1868, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06148266792297363, + "step": 9035, + "valid_targets_mean": 1525.2, + "valid_targets_min": 534 + }, + { + "epoch": 4.735463593504453, + "grad_norm": 0.3997519225286325, + "learning_rate": 1.1459083550225088e-05, + "loss": 0.1007, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03425814211368561, + "step": 9040, + "valid_targets_mean": 2735.4, + "valid_targets_min": 834 + }, + { + "epoch": 4.738082765845992, + "grad_norm": 0.3805866264698184, + "learning_rate": 1.1435469336932731e-05, + "loss": 0.0832, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03802028298377991, + "step": 9045, + "valid_targets_mean": 3253.9, + "valid_targets_min": 2790 + }, + { + "epoch": 4.740701938187533, + "grad_norm": 0.5271227522994802, + "learning_rate": 1.141186973534424e-05, + "loss": 0.0779, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.038571856915950775, + "step": 9050, + "valid_targets_mean": 3383.1, + "valid_targets_min": 2133 + }, + { + "epoch": 4.743321110529073, + "grad_norm": 0.42506608635375265, + "learning_rate": 1.1388284785722235e-05, + "loss": 0.0968, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04349125921726227, + "step": 9055, + "valid_targets_mean": 2954.8, + "valid_targets_min": 2338 + }, + { + "epoch": 4.745940282870613, + "grad_norm": 0.4400398864057771, + "learning_rate": 1.1364714528304325e-05, + "loss": 0.0762, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.039018213748931885, + "step": 9060, + "valid_targets_mean": 2680.4, + "valid_targets_min": 662 + }, + { + "epoch": 4.748559455212153, + "grad_norm": 1.0406638024773125, + "learning_rate": 1.1341159003303075e-05, + "loss": 0.1052, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07803843915462494, + "step": 9065, + "valid_targets_mean": 1101.0, + "valid_targets_min": 559 + }, + { + "epoch": 4.751178627553693, + "grad_norm": 0.4234808201914869, + "learning_rate": 1.131761825090588e-05, + "loss": 0.1146, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.035465411841869354, + "step": 9070, + "valid_targets_mean": 3490.6, + "valid_targets_min": 1091 + }, + { + "epoch": 4.753797799895233, + "grad_norm": 0.4052125616024461, + "learning_rate": 1.129409231127496e-05, + "loss": 0.0871, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04046661779284477, + "step": 9075, + "valid_targets_mean": 3061.8, + "valid_targets_min": 947 + }, + { + "epoch": 4.7564169722367735, + "grad_norm": 0.5151153926725468, + "learning_rate": 1.1270581224547258e-05, + "loss": 0.1124, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09529449045658112, + "step": 9080, + "valid_targets_mean": 2125.4, + "valid_targets_min": 859 + }, + { + "epoch": 4.759036144578313, + "grad_norm": 0.30622345996440775, + "learning_rate": 1.1247085030834378e-05, + "loss": 0.0798, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.043526582419872284, + "step": 9085, + "valid_targets_mean": 5837.8, + "valid_targets_min": 636 + }, + { + "epoch": 4.761655316919853, + "grad_norm": 0.3911448819762176, + "learning_rate": 1.1223603770222509e-05, + "loss": 0.0785, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.043331749737262726, + "step": 9090, + "valid_targets_mean": 2185.0, + "valid_targets_min": 826 + }, + { + "epoch": 4.7642744892613935, + "grad_norm": 0.3070158190135269, + "learning_rate": 1.1200137482772369e-05, + "loss": 0.0778, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03534020483493805, + "step": 9095, + "valid_targets_mean": 3446.5, + "valid_targets_min": 1096 + }, + { + "epoch": 4.766893661602934, + "grad_norm": 0.4828342763934001, + "learning_rate": 1.1176686208519131e-05, + "loss": 0.096, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04079655930399895, + "step": 9100, + "valid_targets_mean": 2343.1, + "valid_targets_min": 688 + }, + { + "epoch": 4.769512833944473, + "grad_norm": 0.3721916673928446, + "learning_rate": 1.1153249987472332e-05, + "loss": 0.097, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.028864160180091858, + "step": 9105, + "valid_targets_mean": 2938.5, + "valid_targets_min": 553 + }, + { + "epoch": 4.7721320062860135, + "grad_norm": 0.4579098193653015, + "learning_rate": 1.1129828859615879e-05, + "loss": 0.0802, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04318414255976677, + "step": 9110, + "valid_targets_mean": 2988.9, + "valid_targets_min": 566 + }, + { + "epoch": 4.774751178627554, + "grad_norm": 0.38923712166486607, + "learning_rate": 1.1106422864907863e-05, + "loss": 0.0739, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.029954858124256134, + "step": 9115, + "valid_targets_mean": 3230.2, + "valid_targets_min": 1111 + }, + { + "epoch": 4.777370350969094, + "grad_norm": 0.4561912850348876, + "learning_rate": 1.1083032043280624e-05, + "loss": 0.0786, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05434397608041763, + "step": 9120, + "valid_targets_mean": 1232.1, + "valid_targets_min": 622 + }, + { + "epoch": 4.7799895233106335, + "grad_norm": 0.5383278388405104, + "learning_rate": 1.1059656434640557e-05, + "loss": 0.09, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.042419224977493286, + "step": 9125, + "valid_targets_mean": 2132.5, + "valid_targets_min": 696 + }, + { + "epoch": 4.782608695652174, + "grad_norm": 0.46478132442947867, + "learning_rate": 1.1036296078868136e-05, + "loss": 0.0881, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0451333187520504, + "step": 9130, + "valid_targets_mean": 3225.2, + "valid_targets_min": 1922 + }, + { + "epoch": 4.785227867993714, + "grad_norm": 0.4698233923807494, + "learning_rate": 1.1012951015817804e-05, + "loss": 0.0891, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.032914064824581146, + "step": 9135, + "valid_targets_mean": 2008.5, + "valid_targets_min": 802 + }, + { + "epoch": 4.787847040335254, + "grad_norm": 0.5308778820315359, + "learning_rate": 1.0989621285317913e-05, + "loss": 0.0962, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06775735318660736, + "step": 9140, + "valid_targets_mean": 1754.1, + "valid_targets_min": 957 + }, + { + "epoch": 4.790466212676794, + "grad_norm": 0.4084670385575034, + "learning_rate": 1.0966306927170658e-05, + "loss": 0.1154, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.043514907360076904, + "step": 9145, + "valid_targets_mean": 2498.5, + "valid_targets_min": 641 + }, + { + "epoch": 4.793085385018334, + "grad_norm": 0.4279232378741644, + "learning_rate": 1.094300798115201e-05, + "loss": 0.0756, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04977592080831528, + "step": 9150, + "valid_targets_mean": 2364.6, + "valid_targets_min": 924 + }, + { + "epoch": 4.795704557359874, + "grad_norm": 0.5275163178993386, + "learning_rate": 1.0919724487011636e-05, + "loss": 0.1134, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08120264858007431, + "step": 9155, + "valid_targets_mean": 2385.5, + "valid_targets_min": 700 + }, + { + "epoch": 4.798323729701415, + "grad_norm": 0.49257488007398736, + "learning_rate": 1.0896456484472862e-05, + "loss": 0.0941, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07682208716869354, + "step": 9160, + "valid_targets_mean": 3363.2, + "valid_targets_min": 2731 + }, + { + "epoch": 4.800942902042954, + "grad_norm": 0.5415718875503004, + "learning_rate": 1.0873204013232544e-05, + "loss": 0.084, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07005016505718231, + "step": 9165, + "valid_targets_mean": 2615.0, + "valid_targets_min": 893 + }, + { + "epoch": 4.8035620743844945, + "grad_norm": 0.6949620057147603, + "learning_rate": 1.0849967112961097e-05, + "loss": 0.2478, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26949775218963623, + "step": 9170, + "valid_targets_mean": 2615.9, + "valid_targets_min": 922 + }, + { + "epoch": 4.806181246726035, + "grad_norm": 0.4735129998424099, + "learning_rate": 1.0826745823302312e-05, + "loss": 0.1188, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03111286647617817, + "step": 9175, + "valid_targets_mean": 1357.4, + "valid_targets_min": 507 + }, + { + "epoch": 4.808800419067575, + "grad_norm": 0.41949657373235166, + "learning_rate": 1.0803540183873399e-05, + "loss": 0.0969, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04782308638095856, + "step": 9180, + "valid_targets_mean": 3236.9, + "valid_targets_min": 615 + }, + { + "epoch": 4.8114195914091145, + "grad_norm": 0.4706428085338741, + "learning_rate": 1.078035023426483e-05, + "loss": 0.1776, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06388384103775024, + "step": 9185, + "valid_targets_mean": 3023.1, + "valid_targets_min": 826 + }, + { + "epoch": 4.814038763750655, + "grad_norm": 0.4592019713471492, + "learning_rate": 1.0757176014040325e-05, + "loss": 0.0824, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04213862866163254, + "step": 9190, + "valid_targets_mean": 2924.4, + "valid_targets_min": 851 + }, + { + "epoch": 4.816657936092195, + "grad_norm": 0.4632823742735354, + "learning_rate": 1.073401756273677e-05, + "loss": 0.0831, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05453056842088699, + "step": 9195, + "valid_targets_mean": 4528.4, + "valid_targets_min": 2665 + }, + { + "epoch": 4.8192771084337345, + "grad_norm": 0.3609215644783444, + "learning_rate": 1.0710874919864143e-05, + "loss": 0.0856, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.02940385788679123, + "step": 9200, + "valid_targets_mean": 2820.6, + "valid_targets_min": 595 + }, + { + "epoch": 4.821896280775275, + "grad_norm": 0.44209632448122455, + "learning_rate": 1.0687748124905451e-05, + "loss": 0.0781, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05022032558917999, + "step": 9205, + "valid_targets_mean": 2583.1, + "valid_targets_min": 825 + }, + { + "epoch": 4.824515453116815, + "grad_norm": 0.44249999142815694, + "learning_rate": 1.066463721731667e-05, + "loss": 0.0786, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03852751478552818, + "step": 9210, + "valid_targets_mean": 3771.5, + "valid_targets_min": 672 + }, + { + "epoch": 4.827134625458355, + "grad_norm": 0.3611442497021939, + "learning_rate": 1.0641542236526672e-05, + "loss": 0.0729, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.029995795339345932, + "step": 9215, + "valid_targets_mean": 3165.0, + "valid_targets_min": 1956 + }, + { + "epoch": 4.829753797799896, + "grad_norm": 0.6706741443758514, + "learning_rate": 1.0618463221937136e-05, + "loss": 0.0802, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03590845689177513, + "step": 9220, + "valid_targets_mean": 3719.8, + "valid_targets_min": 2540 + }, + { + "epoch": 4.832372970141435, + "grad_norm": 0.45590454833112176, + "learning_rate": 1.0595400212922526e-05, + "loss": 0.0705, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04903195798397064, + "step": 9225, + "valid_targets_mean": 3447.5, + "valid_targets_min": 1240 + }, + { + "epoch": 4.834992142482975, + "grad_norm": 0.42236440086752497, + "learning_rate": 1.0572353248829988e-05, + "loss": 0.1105, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.022666532546281815, + "step": 9230, + "valid_targets_mean": 2975.2, + "valid_targets_min": 623 + }, + { + "epoch": 4.837611314824516, + "grad_norm": 0.3818881079962277, + "learning_rate": 1.0549322368979298e-05, + "loss": 0.0668, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03372521325945854, + "step": 9235, + "valid_targets_mean": 2960.1, + "valid_targets_min": 583 + }, + { + "epoch": 4.840230487166055, + "grad_norm": 0.3751963558558432, + "learning_rate": 1.0526307612662792e-05, + "loss": 0.0715, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03359278291463852, + "step": 9240, + "valid_targets_mean": 3723.5, + "valid_targets_min": 3230 + }, + { + "epoch": 4.842849659507595, + "grad_norm": 0.4184602801803382, + "learning_rate": 1.05033090191453e-05, + "loss": 0.0693, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.028666600584983826, + "step": 9245, + "valid_targets_mean": 2520.9, + "valid_targets_min": 647 + }, + { + "epoch": 4.845468831849136, + "grad_norm": 0.7642504032655404, + "learning_rate": 1.048032662766405e-05, + "loss": 0.1154, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08870033919811249, + "step": 9250, + "valid_targets_mean": 1094.5, + "valid_targets_min": 195 + }, + { + "epoch": 4.848088004190676, + "grad_norm": 0.3969633343007265, + "learning_rate": 1.0457360477428682e-05, + "loss": 0.0782, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05737834423780441, + "step": 9255, + "valid_targets_mean": 3635.9, + "valid_targets_min": 3050 + }, + { + "epoch": 4.850707176532216, + "grad_norm": 0.5763074321343137, + "learning_rate": 1.0434410607621065e-05, + "loss": 0.1106, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06752394139766693, + "step": 9260, + "valid_targets_mean": 2382.9, + "valid_targets_min": 1087 + }, + { + "epoch": 4.853326348873756, + "grad_norm": 0.4031647724187547, + "learning_rate": 1.0411477057395358e-05, + "loss": 0.0786, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.034291207790374756, + "step": 9265, + "valid_targets_mean": 3025.5, + "valid_targets_min": 847 + }, + { + "epoch": 4.855945521215296, + "grad_norm": 0.5587627567342315, + "learning_rate": 1.0388559865877816e-05, + "loss": 0.1038, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05773116275668144, + "step": 9270, + "valid_targets_mean": 2263.1, + "valid_targets_min": 916 + }, + { + "epoch": 4.858564693556836, + "grad_norm": 0.46595019245947983, + "learning_rate": 1.0365659072166823e-05, + "loss": 0.1078, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03987809270620346, + "step": 9275, + "valid_targets_mean": 2567.0, + "valid_targets_min": 1062 + }, + { + "epoch": 4.861183865898376, + "grad_norm": 0.6864424953181596, + "learning_rate": 1.0342774715332776e-05, + "loss": 0.1078, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06730234622955322, + "step": 9280, + "valid_targets_mean": 1443.4, + "valid_targets_min": 771 + }, + { + "epoch": 4.863803038239916, + "grad_norm": 0.4289349949699643, + "learning_rate": 1.0319906834418027e-05, + "loss": 0.0791, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.036795586347579956, + "step": 9285, + "valid_targets_mean": 2753.2, + "valid_targets_min": 707 + }, + { + "epoch": 4.866422210581456, + "grad_norm": 0.38043262212418566, + "learning_rate": 1.0297055468436823e-05, + "loss": 0.0854, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.038165103644132614, + "step": 9290, + "valid_targets_mean": 3665.8, + "valid_targets_min": 2850 + }, + { + "epoch": 4.869041382922997, + "grad_norm": 0.43476779566750035, + "learning_rate": 1.0274220656375235e-05, + "loss": 0.0842, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03128594160079956, + "step": 9295, + "valid_targets_mean": 2238.2, + "valid_targets_min": 749 + }, + { + "epoch": 4.871660555264537, + "grad_norm": 0.370313368646326, + "learning_rate": 1.0251402437191089e-05, + "loss": 0.0708, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.038706958293914795, + "step": 9300, + "valid_targets_mean": 4488.2, + "valid_targets_min": 1052 + }, + { + "epoch": 4.874279727606076, + "grad_norm": 0.319750712033594, + "learning_rate": 1.0228600849813915e-05, + "loss": 0.0671, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.036063797771930695, + "step": 9305, + "valid_targets_mean": 4258.2, + "valid_targets_min": 2540 + }, + { + "epoch": 4.876898899947617, + "grad_norm": 0.33029579924082025, + "learning_rate": 1.0205815933144833e-05, + "loss": 0.0799, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.029350923374295235, + "step": 9310, + "valid_targets_mean": 3782.5, + "valid_targets_min": 1859 + }, + { + "epoch": 4.879518072289157, + "grad_norm": 0.38085938971164035, + "learning_rate": 1.0183047726056574e-05, + "loss": 0.0938, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03152487426996231, + "step": 9315, + "valid_targets_mean": 2879.5, + "valid_targets_min": 893 + }, + { + "epoch": 4.882137244630696, + "grad_norm": 0.4831945174173879, + "learning_rate": 1.0160296267393308e-05, + "loss": 0.0889, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04167293757200241, + "step": 9320, + "valid_targets_mean": 2072.6, + "valid_targets_min": 753 + }, + { + "epoch": 4.884756416972237, + "grad_norm": 0.3146208676922227, + "learning_rate": 1.013756159597068e-05, + "loss": 0.0827, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.024426061660051346, + "step": 9325, + "valid_targets_mean": 4205.6, + "valid_targets_min": 3934 + }, + { + "epoch": 4.887375589313777, + "grad_norm": 0.4519748356721149, + "learning_rate": 1.0114843750575654e-05, + "loss": 0.0738, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04126317426562309, + "step": 9330, + "valid_targets_mean": 3174.9, + "valid_targets_min": 1576 + }, + { + "epoch": 4.889994761655317, + "grad_norm": 0.48719835907350145, + "learning_rate": 1.0092142769966506e-05, + "loss": 0.0862, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04686902463436127, + "step": 9335, + "valid_targets_mean": 3241.8, + "valid_targets_min": 1006 + }, + { + "epoch": 4.892613933996857, + "grad_norm": 0.32010999479451724, + "learning_rate": 1.0069458692872742e-05, + "loss": 0.0714, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.02505858615040779, + "step": 9340, + "valid_targets_mean": 3445.5, + "valid_targets_min": 980 + }, + { + "epoch": 4.895233106338397, + "grad_norm": 0.5725901656192572, + "learning_rate": 1.0046791557995023e-05, + "loss": 0.0804, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05188882350921631, + "step": 9345, + "valid_targets_mean": 2083.9, + "valid_targets_min": 745 + }, + { + "epoch": 4.897852278679937, + "grad_norm": 0.5549702485809708, + "learning_rate": 1.002414140400511e-05, + "loss": 0.0788, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.050374835729599, + "step": 9350, + "valid_targets_mean": 2768.8, + "valid_targets_min": 1020 + }, + { + "epoch": 4.9004714510214775, + "grad_norm": 0.4836784282793694, + "learning_rate": 1.000150826954579e-05, + "loss": 0.0797, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.051911644637584686, + "step": 9355, + "valid_targets_mean": 2314.8, + "valid_targets_min": 967 + }, + { + "epoch": 4.903090623363017, + "grad_norm": 0.4360657137850092, + "learning_rate": 9.978892193230821e-06, + "loss": 0.0971, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03503736853599548, + "step": 9360, + "valid_targets_mean": 2462.0, + "valid_targets_min": 1015 + }, + { + "epoch": 4.905709795704557, + "grad_norm": 0.5904512749187, + "learning_rate": 9.956293213644839e-06, + "loss": 0.0774, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.044043950736522675, + "step": 9365, + "valid_targets_mean": 1214.9, + "valid_targets_min": 705 + }, + { + "epoch": 4.9083289680460975, + "grad_norm": 0.3881901935145882, + "learning_rate": 9.933711369343329e-06, + "loss": 0.0883, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.02765190787613392, + "step": 9370, + "valid_targets_mean": 2364.8, + "valid_targets_min": 622 + }, + { + "epoch": 4.910948140387638, + "grad_norm": 0.5521495497495682, + "learning_rate": 9.91114669885254e-06, + "loss": 0.1031, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.033989161252975464, + "step": 9375, + "valid_targets_mean": 3702.2, + "valid_targets_min": 1322 + }, + { + "epoch": 4.913567312729177, + "grad_norm": 0.41071973811584744, + "learning_rate": 9.888599240669419e-06, + "loss": 0.0804, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04003782570362091, + "step": 9380, + "valid_targets_mean": 2863.1, + "valid_targets_min": 1011 + }, + { + "epoch": 4.9161864850707175, + "grad_norm": 0.49161604591708735, + "learning_rate": 9.866069033261548e-06, + "loss": 0.0701, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.044861674308776855, + "step": 9385, + "valid_targets_mean": 3106.1, + "valid_targets_min": 874 + }, + { + "epoch": 4.918805657412258, + "grad_norm": 0.583969785929338, + "learning_rate": 9.843556115067083e-06, + "loss": 0.0848, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0578463077545166, + "step": 9390, + "valid_targets_mean": 3161.4, + "valid_targets_min": 1420 + }, + { + "epoch": 4.921424829753798, + "grad_norm": 0.4137817721617095, + "learning_rate": 9.821060524494658e-06, + "loss": 0.0959, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03279948607087135, + "step": 9395, + "valid_targets_mean": 2796.0, + "valid_targets_min": 1109 + }, + { + "epoch": 4.9240440020953375, + "grad_norm": 0.40270192516132824, + "learning_rate": 9.798582299923393e-06, + "loss": 0.0629, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03196260333061218, + "step": 9400, + "valid_targets_mean": 1822.9, + "valid_targets_min": 684 + }, + { + "epoch": 4.926663174436878, + "grad_norm": 0.46867222941763004, + "learning_rate": 9.776121479702722e-06, + "loss": 0.0825, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03990498185157776, + "step": 9405, + "valid_targets_mean": 2389.8, + "valid_targets_min": 671 + }, + { + "epoch": 4.929282346778418, + "grad_norm": 0.36127700554593084, + "learning_rate": 9.753678102152449e-06, + "loss": 0.0727, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.034535013139247894, + "step": 9410, + "valid_targets_mean": 4513.8, + "valid_targets_min": 1057 + }, + { + "epoch": 4.931901519119958, + "grad_norm": 0.3633748308439699, + "learning_rate": 9.731252205562551e-06, + "loss": 0.0643, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.030670013278722763, + "step": 9415, + "valid_targets_mean": 3533.1, + "valid_targets_min": 1243 + }, + { + "epoch": 4.934520691461498, + "grad_norm": 0.3800339958338929, + "learning_rate": 9.708843828193251e-06, + "loss": 0.086, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03751269355416298, + "step": 9420, + "valid_targets_mean": 3911.2, + "valid_targets_min": 3322 + }, + { + "epoch": 4.937139863803038, + "grad_norm": 0.5273963512085883, + "learning_rate": 9.686453008274825e-06, + "loss": 0.0728, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04546033591032028, + "step": 9425, + "valid_targets_mean": 1820.0, + "valid_targets_min": 680 + }, + { + "epoch": 4.9397590361445785, + "grad_norm": 0.43278411601206196, + "learning_rate": 9.664079784007627e-06, + "loss": 0.1015, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.043846093118190765, + "step": 9430, + "valid_targets_mean": 3371.9, + "valid_targets_min": 640 + }, + { + "epoch": 4.942378208486119, + "grad_norm": 0.27838898081111807, + "learning_rate": 9.64172419356198e-06, + "loss": 0.0881, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.02142597734928131, + "step": 9435, + "valid_targets_mean": 3327.0, + "valid_targets_min": 929 + }, + { + "epoch": 4.944997380827658, + "grad_norm": 0.6142096335256088, + "learning_rate": 9.619386275078129e-06, + "loss": 0.0925, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05631929636001587, + "step": 9440, + "valid_targets_mean": 3318.0, + "valid_targets_min": 2380 + }, + { + "epoch": 4.9476165531691985, + "grad_norm": 0.38334975674724514, + "learning_rate": 9.597066066666164e-06, + "loss": 0.0717, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03687911853194237, + "step": 9445, + "valid_targets_mean": 3709.4, + "valid_targets_min": 2619 + }, + { + "epoch": 4.950235725510739, + "grad_norm": 0.67861113279472, + "learning_rate": 9.574763606405968e-06, + "loss": 0.0815, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.049105964601039886, + "step": 9450, + "valid_targets_mean": 1574.6, + "valid_targets_min": 693 + }, + { + "epoch": 4.952854897852279, + "grad_norm": 0.3957068978774986, + "learning_rate": 9.55247893234712e-06, + "loss": 0.0781, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.041627075523138046, + "step": 9455, + "valid_targets_mean": 3885.1, + "valid_targets_min": 3129 + }, + { + "epoch": 4.9554740701938185, + "grad_norm": 0.7326783103878073, + "learning_rate": 9.5302120825089e-06, + "loss": 0.1037, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04959501326084137, + "step": 9460, + "valid_targets_mean": 1611.0, + "valid_targets_min": 543 + }, + { + "epoch": 4.958093242535359, + "grad_norm": 0.44825197019491486, + "learning_rate": 9.507963094880124e-06, + "loss": 0.1051, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.047432661056518555, + "step": 9465, + "valid_targets_mean": 2319.6, + "valid_targets_min": 503 + }, + { + "epoch": 4.960712414876899, + "grad_norm": 0.510071533666162, + "learning_rate": 9.485732007419188e-06, + "loss": 0.0827, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.053640030324459076, + "step": 9470, + "valid_targets_mean": 1987.9, + "valid_targets_min": 625 + }, + { + "epoch": 4.963331587218439, + "grad_norm": 0.43448292051944704, + "learning_rate": 9.463518858053904e-06, + "loss": 0.0786, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03527310863137245, + "step": 9475, + "valid_targets_mean": 3822.8, + "valid_targets_min": 2822 + }, + { + "epoch": 4.965950759559979, + "grad_norm": 0.42248384226037244, + "learning_rate": 9.441323684681502e-06, + "loss": 0.0773, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.046227335929870605, + "step": 9480, + "valid_targets_mean": 3724.5, + "valid_targets_min": 2987 + }, + { + "epoch": 4.968569931901519, + "grad_norm": 0.382801073687794, + "learning_rate": 9.419146525168545e-06, + "loss": 0.0685, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.028592493385076523, + "step": 9485, + "valid_targets_mean": 3022.0, + "valid_targets_min": 856 + }, + { + "epoch": 4.971189104243059, + "grad_norm": 0.9587364146007591, + "learning_rate": 9.396987417350856e-06, + "loss": 0.0807, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0448029451072216, + "step": 9490, + "valid_targets_mean": 764.2, + "valid_targets_min": 563 + }, + { + "epoch": 4.973808276584599, + "grad_norm": 0.39898776336005193, + "learning_rate": 9.374846399033469e-06, + "loss": 0.0795, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.033013638108968735, + "step": 9495, + "valid_targets_mean": 3117.1, + "valid_targets_min": 751 + }, + { + "epoch": 4.976427448926139, + "grad_norm": 0.5255979997506766, + "learning_rate": 9.352723507990528e-06, + "loss": 0.0714, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.046126432716846466, + "step": 9500, + "valid_targets_mean": 3566.1, + "valid_targets_min": 980 + }, + { + "epoch": 4.979046621267679, + "grad_norm": 0.446781363338972, + "learning_rate": 9.330618781965305e-06, + "loss": 0.0727, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.038315288722515106, + "step": 9505, + "valid_targets_mean": 3589.8, + "valid_targets_min": 2538 + }, + { + "epoch": 4.98166579360922, + "grad_norm": 0.3124386468514202, + "learning_rate": 9.308532258670025e-06, + "loss": 0.0806, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.027780020609498024, + "step": 9510, + "valid_targets_mean": 4182.8, + "valid_targets_min": 485 + }, + { + "epoch": 4.98428496595076, + "grad_norm": 0.30054591798536434, + "learning_rate": 9.28646397578589e-06, + "loss": 0.069, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.033520281314849854, + "step": 9515, + "valid_targets_mean": 4832.8, + "valid_targets_min": 2551 + }, + { + "epoch": 4.986904138292299, + "grad_norm": 0.33328379929575486, + "learning_rate": 9.264413970962969e-06, + "loss": 0.0742, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.037390343844890594, + "step": 9520, + "valid_targets_mean": 4733.6, + "valid_targets_min": 3365 + }, + { + "epoch": 4.98952331063384, + "grad_norm": 0.44878278869138466, + "learning_rate": 9.24238228182016e-06, + "loss": 0.0791, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05923148989677429, + "step": 9525, + "valid_targets_mean": 2954.4, + "valid_targets_min": 872 + }, + { + "epoch": 4.99214248297538, + "grad_norm": 0.3811491511881796, + "learning_rate": 9.220368945945103e-06, + "loss": 0.1636, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03844798728823662, + "step": 9530, + "valid_targets_mean": 2590.9, + "valid_targets_min": 1015 + }, + { + "epoch": 4.994761655316919, + "grad_norm": 0.4348334992325256, + "learning_rate": 9.198374000894123e-06, + "loss": 0.074, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05938860401511192, + "step": 9535, + "valid_targets_mean": 2342.4, + "valid_targets_min": 967 + }, + { + "epoch": 4.99738082765846, + "grad_norm": 0.39936657461229824, + "learning_rate": 9.176397484192184e-06, + "loss": 0.076, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03136672079563141, + "step": 9540, + "valid_targets_mean": 3335.1, + "valid_targets_min": 886 + }, + { + "epoch": 5.0, + "grad_norm": 0.3896753621417805, + "learning_rate": 9.1544394333328e-06, + "loss": 0.1058, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03392448276281357, + "step": 9545, + "valid_targets_mean": 2983.1, + "valid_targets_min": 791 + }, + { + "epoch": 5.00261917234154, + "grad_norm": 0.8291698685938063, + "learning_rate": 9.132499885777964e-06, + "loss": 0.1593, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06088561937212944, + "step": 9550, + "valid_targets_mean": 1236.5, + "valid_targets_min": 746 + }, + { + "epoch": 5.00523834468308, + "grad_norm": 0.795133667121655, + "learning_rate": 9.110578878958145e-06, + "loss": 0.1432, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07181090116500854, + "step": 9555, + "valid_targets_mean": 1550.8, + "valid_targets_min": 612 + }, + { + "epoch": 5.00785751702462, + "grad_norm": 0.7188523527435988, + "learning_rate": 9.088676450272124e-06, + "loss": 0.1396, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06605690717697144, + "step": 9560, + "valid_targets_mean": 1455.8, + "valid_targets_min": 904 + }, + { + "epoch": 5.01047668936616, + "grad_norm": 0.7499204984155243, + "learning_rate": 9.06679263708705e-06, + "loss": 0.1315, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06748449802398682, + "step": 9565, + "valid_targets_mean": 1514.4, + "valid_targets_min": 967 + }, + { + "epoch": 5.013095861707701, + "grad_norm": 0.8584249807542884, + "learning_rate": 9.044927476738252e-06, + "loss": 0.1438, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.069888174533844, + "step": 9570, + "valid_targets_mean": 1500.2, + "valid_targets_min": 718 + }, + { + "epoch": 5.01571503404924, + "grad_norm": 0.7662334735645583, + "learning_rate": 9.02308100652927e-06, + "loss": 0.1384, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07856231182813644, + "step": 9575, + "valid_targets_mean": 1689.9, + "valid_targets_min": 764 + }, + { + "epoch": 5.01833420639078, + "grad_norm": 0.7289531629346846, + "learning_rate": 9.001253263731753e-06, + "loss": 0.1269, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06529080867767334, + "step": 9580, + "valid_targets_mean": 1543.9, + "valid_targets_min": 725 + }, + { + "epoch": 5.020953378732321, + "grad_norm": 0.8227298254980042, + "learning_rate": 8.979444285585392e-06, + "loss": 0.1447, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05642779916524887, + "step": 9585, + "valid_targets_mean": 1290.1, + "valid_targets_min": 610 + }, + { + "epoch": 5.023572551073861, + "grad_norm": 0.7629736165857393, + "learning_rate": 8.957654109297874e-06, + "loss": 0.1335, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06554756313562393, + "step": 9590, + "valid_targets_mean": 1588.6, + "valid_targets_min": 720 + }, + { + "epoch": 5.0261917234154, + "grad_norm": 0.7158738761162554, + "learning_rate": 8.935882772044798e-06, + "loss": 0.137, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07234790176153183, + "step": 9595, + "valid_targets_mean": 1708.5, + "valid_targets_min": 865 + }, + { + "epoch": 5.028810895756941, + "grad_norm": 0.8754088785499504, + "learning_rate": 8.91413031096963e-06, + "loss": 0.1317, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08297131210565567, + "step": 9600, + "valid_targets_mean": 1502.1, + "valid_targets_min": 593 + }, + { + "epoch": 5.031430068098481, + "grad_norm": 0.7442074558873492, + "learning_rate": 8.892396763183637e-06, + "loss": 0.1314, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06886909157037735, + "step": 9605, + "valid_targets_mean": 1667.9, + "valid_targets_min": 704 + }, + { + "epoch": 5.034049240440021, + "grad_norm": 0.7627126439991847, + "learning_rate": 8.870682165765798e-06, + "loss": 0.1256, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05173000693321228, + "step": 9610, + "valid_targets_mean": 1233.4, + "valid_targets_min": 722 + }, + { + "epoch": 5.036668412781561, + "grad_norm": 0.7142867945568193, + "learning_rate": 8.848986555762777e-06, + "loss": 0.1239, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.056171685457229614, + "step": 9615, + "valid_targets_mean": 1556.0, + "valid_targets_min": 968 + }, + { + "epoch": 5.039287585123101, + "grad_norm": 0.7988401443613027, + "learning_rate": 8.827309970188847e-06, + "loss": 0.1249, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07681363821029663, + "step": 9620, + "valid_targets_mean": 1773.1, + "valid_targets_min": 936 + }, + { + "epoch": 5.041906757464641, + "grad_norm": 0.8914213786316774, + "learning_rate": 8.805652446025815e-06, + "loss": 0.1343, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06082507595419884, + "step": 9625, + "valid_targets_mean": 1383.6, + "valid_targets_min": 728 + }, + { + "epoch": 5.0445259298061815, + "grad_norm": 0.7635151965573758, + "learning_rate": 8.784014020222968e-06, + "loss": 0.1333, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08338280022144318, + "step": 9630, + "valid_targets_mean": 2023.5, + "valid_targets_min": 1143 + }, + { + "epoch": 5.047145102147721, + "grad_norm": 0.8405113623184243, + "learning_rate": 8.762394729697022e-06, + "loss": 0.1339, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07841154932975769, + "step": 9635, + "valid_targets_mean": 1411.9, + "valid_targets_min": 818 + }, + { + "epoch": 5.049764274489261, + "grad_norm": 0.8164628534220753, + "learning_rate": 8.740794611332038e-06, + "loss": 0.127, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06135069951415062, + "step": 9640, + "valid_targets_mean": 1393.2, + "valid_targets_min": 625 + }, + { + "epoch": 5.0523834468308015, + "grad_norm": 0.7403910338312527, + "learning_rate": 8.719213701979348e-06, + "loss": 0.1291, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07470349967479706, + "step": 9645, + "valid_targets_mean": 1949.8, + "valid_targets_min": 790 + }, + { + "epoch": 5.055002619172342, + "grad_norm": 0.8074833036677275, + "learning_rate": 8.697652038457563e-06, + "loss": 0.1344, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09135995805263519, + "step": 9650, + "valid_targets_mean": 2193.8, + "valid_targets_min": 891 + }, + { + "epoch": 5.057621791513881, + "grad_norm": 0.7255751179833262, + "learning_rate": 8.676109657552396e-06, + "loss": 0.128, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05861027538776398, + "step": 9655, + "valid_targets_mean": 1569.0, + "valid_targets_min": 850 + }, + { + "epoch": 5.0602409638554215, + "grad_norm": 0.7615798411288203, + "learning_rate": 8.654586596016726e-06, + "loss": 0.1291, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05548068881034851, + "step": 9660, + "valid_targets_mean": 1384.2, + "valid_targets_min": 974 + }, + { + "epoch": 5.062860136196962, + "grad_norm": 0.8130706992942511, + "learning_rate": 8.633082890570417e-06, + "loss": 0.1224, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06968683749437332, + "step": 9665, + "valid_targets_mean": 1502.9, + "valid_targets_min": 998 + }, + { + "epoch": 5.065479308538502, + "grad_norm": 0.7913334909686525, + "learning_rate": 8.611598577900343e-06, + "loss": 0.1271, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07109968364238739, + "step": 9670, + "valid_targets_mean": 1675.6, + "valid_targets_min": 1047 + }, + { + "epoch": 5.068098480880042, + "grad_norm": 0.8234985901502248, + "learning_rate": 8.590133694660278e-06, + "loss": 0.1278, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0685684010386467, + "step": 9675, + "valid_targets_mean": 1577.6, + "valid_targets_min": 678 + }, + { + "epoch": 5.070717653221582, + "grad_norm": 0.8494760608549315, + "learning_rate": 8.568688277470858e-06, + "loss": 0.1329, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07787296175956726, + "step": 9680, + "valid_targets_mean": 1967.9, + "valid_targets_min": 1075 + }, + { + "epoch": 5.073336825563122, + "grad_norm": 0.8041528005781308, + "learning_rate": 8.547262362919504e-06, + "loss": 0.1351, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07973786443471909, + "step": 9685, + "valid_targets_mean": 1872.6, + "valid_targets_min": 1317 + }, + { + "epoch": 5.0759559979046625, + "grad_norm": 0.7778820031817429, + "learning_rate": 8.525855987560368e-06, + "loss": 0.1271, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07093140482902527, + "step": 9690, + "valid_targets_mean": 1697.6, + "valid_targets_min": 957 + }, + { + "epoch": 5.078575170246202, + "grad_norm": 0.792525720698113, + "learning_rate": 8.504469187914242e-06, + "loss": 0.1302, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.057369161397218704, + "step": 9695, + "valid_targets_mean": 1323.0, + "valid_targets_min": 906 + }, + { + "epoch": 5.081194342587742, + "grad_norm": 0.8404788767956344, + "learning_rate": 8.483102000468569e-06, + "loss": 0.1316, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.055390436202287674, + "step": 9700, + "valid_targets_mean": 1488.8, + "valid_targets_min": 1111 + }, + { + "epoch": 5.0838135149292825, + "grad_norm": 0.7641603228234167, + "learning_rate": 8.461754461677275e-06, + "loss": 0.1252, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06761826574802399, + "step": 9705, + "valid_targets_mean": 1649.2, + "valid_targets_min": 1147 + }, + { + "epoch": 5.086432687270823, + "grad_norm": 0.8392729696383808, + "learning_rate": 8.440426607960821e-06, + "loss": 0.1263, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07057835161685944, + "step": 9710, + "valid_targets_mean": 1526.2, + "valid_targets_min": 893 + }, + { + "epoch": 5.089051859612362, + "grad_norm": 0.7783269470106086, + "learning_rate": 8.419118475706032e-06, + "loss": 0.1156, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05206485465168953, + "step": 9715, + "valid_targets_mean": 1219.6, + "valid_targets_min": 753 + }, + { + "epoch": 5.0916710319539025, + "grad_norm": 0.7982999694650752, + "learning_rate": 8.397830101266133e-06, + "loss": 0.1285, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.061915069818496704, + "step": 9720, + "valid_targets_mean": 1574.5, + "valid_targets_min": 1192 + }, + { + "epoch": 5.094290204295443, + "grad_norm": 0.7793045637084354, + "learning_rate": 8.376561520960603e-06, + "loss": 0.123, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06052004545927048, + "step": 9725, + "valid_targets_mean": 1496.1, + "valid_targets_min": 1039 + }, + { + "epoch": 5.096909376636983, + "grad_norm": 0.8395426162046974, + "learning_rate": 8.355312771075165e-06, + "loss": 0.1262, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0652417466044426, + "step": 9730, + "valid_targets_mean": 1402.0, + "valid_targets_min": 657 + }, + { + "epoch": 5.0995285489785225, + "grad_norm": 0.9063254762504421, + "learning_rate": 8.33408388786172e-06, + "loss": 0.1258, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06874285638332367, + "step": 9735, + "valid_targets_mean": 1471.2, + "valid_targets_min": 880 + }, + { + "epoch": 5.102147721320063, + "grad_norm": 0.8635233820789475, + "learning_rate": 8.312874907538259e-06, + "loss": 0.1261, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07698352634906769, + "step": 9740, + "valid_targets_mean": 1567.6, + "valid_targets_min": 1163 + }, + { + "epoch": 5.104766893661603, + "grad_norm": 0.8507730376845948, + "learning_rate": 8.29168586628883e-06, + "loss": 0.1216, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06012817099690437, + "step": 9745, + "valid_targets_mean": 1493.1, + "valid_targets_min": 998 + }, + { + "epoch": 5.107386066003143, + "grad_norm": 0.7628871482302233, + "learning_rate": 8.270516800263461e-06, + "loss": 0.1222, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.050013184547424316, + "step": 9750, + "valid_targets_mean": 1214.1, + "valid_targets_min": 703 + }, + { + "epoch": 5.110005238344683, + "grad_norm": 0.7848283673414309, + "learning_rate": 8.249367745578086e-06, + "loss": 0.1337, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0638660341501236, + "step": 9755, + "valid_targets_mean": 1459.2, + "valid_targets_min": 934 + }, + { + "epoch": 5.112624410686223, + "grad_norm": 0.8613497551716048, + "learning_rate": 8.228238738314514e-06, + "loss": 0.137, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09289310872554779, + "step": 9760, + "valid_targets_mean": 1754.4, + "valid_targets_min": 734 + }, + { + "epoch": 5.115243583027763, + "grad_norm": 0.7958306842436589, + "learning_rate": 8.207129814520349e-06, + "loss": 0.12, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07653972506523132, + "step": 9765, + "valid_targets_mean": 1864.2, + "valid_targets_min": 1270 + }, + { + "epoch": 5.117862755369304, + "grad_norm": 0.7443615561171484, + "learning_rate": 8.186041010208932e-06, + "loss": 0.121, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06417173147201538, + "step": 9770, + "valid_targets_mean": 1765.5, + "valid_targets_min": 746 + }, + { + "epoch": 5.120481927710843, + "grad_norm": 0.8704389863666305, + "learning_rate": 8.164972361359274e-06, + "loss": 0.1268, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08009348809719086, + "step": 9775, + "valid_targets_mean": 1876.4, + "valid_targets_min": 1172 + }, + { + "epoch": 5.123101100052383, + "grad_norm": 0.8254417455907435, + "learning_rate": 8.143923903916e-06, + "loss": 0.1242, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06702611595392227, + "step": 9780, + "valid_targets_mean": 1642.0, + "valid_targets_min": 1033 + }, + { + "epoch": 5.125720272393924, + "grad_norm": 0.7889086458607909, + "learning_rate": 8.1228956737893e-06, + "loss": 0.1181, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07090294361114502, + "step": 9785, + "valid_targets_mean": 1689.0, + "valid_targets_min": 1205 + }, + { + "epoch": 5.128339444735464, + "grad_norm": 0.8058169834033115, + "learning_rate": 8.10188770685482e-06, + "loss": 0.1148, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05185168236494064, + "step": 9790, + "valid_targets_mean": 1164.2, + "valid_targets_min": 737 + }, + { + "epoch": 5.130958617077003, + "grad_norm": 0.9519237857968278, + "learning_rate": 8.080900038953686e-06, + "loss": 0.1306, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06645987927913666, + "step": 9795, + "valid_targets_mean": 1427.9, + "valid_targets_min": 791 + }, + { + "epoch": 5.133577789418544, + "grad_norm": 0.7608506328312206, + "learning_rate": 8.05993270589234e-06, + "loss": 0.1234, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05785384774208069, + "step": 9800, + "valid_targets_mean": 1559.5, + "valid_targets_min": 786 + }, + { + "epoch": 5.136196961760084, + "grad_norm": 0.7612550220763856, + "learning_rate": 8.038985743442582e-06, + "loss": 0.1225, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05324278026819229, + "step": 9805, + "valid_targets_mean": 1411.5, + "valid_targets_min": 944 + }, + { + "epoch": 5.138816134101624, + "grad_norm": 0.7614465632357175, + "learning_rate": 8.018059187341414e-06, + "loss": 0.1207, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.055258601903915405, + "step": 9810, + "valid_targets_mean": 1454.9, + "valid_targets_min": 1227 + }, + { + "epoch": 5.141435306443164, + "grad_norm": 0.7433802949513004, + "learning_rate": 7.997153073291049e-06, + "loss": 0.1264, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05270681530237198, + "step": 9815, + "valid_targets_mean": 1446.9, + "valid_targets_min": 740 + }, + { + "epoch": 5.144054478784704, + "grad_norm": 0.9612758343128028, + "learning_rate": 7.976267436958817e-06, + "loss": 0.1286, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08071742206811905, + "step": 9820, + "valid_targets_mean": 2122.9, + "valid_targets_min": 1227 + }, + { + "epoch": 5.146673651126244, + "grad_norm": 0.7703023931906229, + "learning_rate": 7.955402313977115e-06, + "loss": 0.1247, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05489915609359741, + "step": 9825, + "valid_targets_mean": 1256.0, + "valid_targets_min": 636 + }, + { + "epoch": 5.149292823467785, + "grad_norm": 0.7565720696589413, + "learning_rate": 7.934557739943333e-06, + "loss": 0.1224, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.045493997633457184, + "step": 9830, + "valid_targets_mean": 1168.8, + "valid_targets_min": 814 + }, + { + "epoch": 5.151911995809324, + "grad_norm": 0.8230795234990084, + "learning_rate": 7.91373375041982e-06, + "loss": 0.1168, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0581836998462677, + "step": 9835, + "valid_targets_mean": 1275.9, + "valid_targets_min": 911 + }, + { + "epoch": 5.154531168150864, + "grad_norm": 0.7663342792339701, + "learning_rate": 7.89293038093379e-06, + "loss": 0.1231, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05573280155658722, + "step": 9840, + "valid_targets_mean": 1431.9, + "valid_targets_min": 661 + }, + { + "epoch": 5.157150340492405, + "grad_norm": 0.8663535122859962, + "learning_rate": 7.87214766697729e-06, + "loss": 0.1291, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0651249885559082, + "step": 9845, + "valid_targets_mean": 1572.1, + "valid_targets_min": 1164 + }, + { + "epoch": 5.159769512833945, + "grad_norm": 0.8382575650021854, + "learning_rate": 7.851385644007103e-06, + "loss": 0.1218, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.055575910955667496, + "step": 9850, + "valid_targets_mean": 1396.6, + "valid_targets_min": 692 + }, + { + "epoch": 5.162388685175484, + "grad_norm": 0.7875059756241013, + "learning_rate": 7.830644347444761e-06, + "loss": 0.1255, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05687501281499863, + "step": 9855, + "valid_targets_mean": 1405.8, + "valid_targets_min": 923 + }, + { + "epoch": 5.165007857517025, + "grad_norm": 0.8593071246128563, + "learning_rate": 7.80992381267637e-06, + "loss": 0.1274, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06243991106748581, + "step": 9860, + "valid_targets_mean": 1375.1, + "valid_targets_min": 922 + }, + { + "epoch": 5.167627029858565, + "grad_norm": 0.7415385381072802, + "learning_rate": 7.78922407505268e-06, + "loss": 0.1221, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06369824707508087, + "step": 9865, + "valid_targets_mean": 1806.0, + "valid_targets_min": 710 + }, + { + "epoch": 5.170246202200104, + "grad_norm": 0.7676587590809413, + "learning_rate": 7.768545169888909e-06, + "loss": 0.1263, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0626119002699852, + "step": 9870, + "valid_targets_mean": 1342.9, + "valid_targets_min": 836 + }, + { + "epoch": 5.172865374541645, + "grad_norm": 0.8280038560088043, + "learning_rate": 7.747887132464757e-06, + "loss": 0.1229, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07222384959459305, + "step": 9875, + "valid_targets_mean": 1504.5, + "valid_targets_min": 1013 + }, + { + "epoch": 5.175484546883185, + "grad_norm": 0.8480684316574301, + "learning_rate": 7.72724999802432e-06, + "loss": 0.1245, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05442634969949722, + "step": 9880, + "valid_targets_mean": 1351.6, + "valid_targets_min": 978 + }, + { + "epoch": 5.178103719224725, + "grad_norm": 0.8943098137120158, + "learning_rate": 7.706633801776031e-06, + "loss": 0.1231, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07496099174022675, + "step": 9885, + "valid_targets_mean": 1812.5, + "valid_targets_min": 1205 + }, + { + "epoch": 5.180722891566265, + "grad_norm": 0.7710715592164034, + "learning_rate": 7.686038578892599e-06, + "loss": 0.1327, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05917992815375328, + "step": 9890, + "valid_targets_mean": 1657.9, + "valid_targets_min": 1219 + }, + { + "epoch": 5.183342063907805, + "grad_norm": 0.768425230191172, + "learning_rate": 7.665464364510954e-06, + "loss": 0.1253, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07286841422319412, + "step": 9895, + "valid_targets_mean": 1814.4, + "valid_targets_min": 1002 + }, + { + "epoch": 5.185961236249345, + "grad_norm": 0.783120110067545, + "learning_rate": 7.644911193732185e-06, + "loss": 0.1225, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05758904665708542, + "step": 9900, + "valid_targets_mean": 1390.4, + "valid_targets_min": 646 + }, + { + "epoch": 5.1885804085908855, + "grad_norm": 0.8756284618345157, + "learning_rate": 7.624379101621464e-06, + "loss": 0.1236, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06255842745304108, + "step": 9905, + "valid_targets_mean": 1307.4, + "valid_targets_min": 906 + }, + { + "epoch": 5.191199580932425, + "grad_norm": 0.7865895847705132, + "learning_rate": 7.603868123208023e-06, + "loss": 0.1168, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05866144597530365, + "step": 9910, + "valid_targets_mean": 1574.8, + "valid_targets_min": 808 + }, + { + "epoch": 5.193818753273965, + "grad_norm": 0.8621724591786725, + "learning_rate": 7.583378293485059e-06, + "loss": 0.1281, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05954202264547348, + "step": 9915, + "valid_targets_mean": 1173.9, + "valid_targets_min": 913 + }, + { + "epoch": 5.1964379256155055, + "grad_norm": 0.8240980648230771, + "learning_rate": 7.5629096474096954e-06, + "loss": 0.1168, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05828775838017464, + "step": 9920, + "valid_targets_mean": 1354.2, + "valid_targets_min": 821 + }, + { + "epoch": 5.199057097957046, + "grad_norm": 0.8571886369802686, + "learning_rate": 7.542462219902909e-06, + "loss": 0.115, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.055858269333839417, + "step": 9925, + "valid_targets_mean": 1508.4, + "valid_targets_min": 1013 + }, + { + "epoch": 5.201676270298585, + "grad_norm": 0.7750722608631837, + "learning_rate": 7.5220360458494855e-06, + "loss": 0.1188, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06182383745908737, + "step": 9930, + "valid_targets_mean": 1517.8, + "valid_targets_min": 781 + }, + { + "epoch": 5.204295442640126, + "grad_norm": 0.8070247648475251, + "learning_rate": 7.5016311600979245e-06, + "loss": 0.1274, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05417487397789955, + "step": 9935, + "valid_targets_mean": 1243.6, + "valid_targets_min": 548 + }, + { + "epoch": 5.206914614981666, + "grad_norm": 0.7338574303878064, + "learning_rate": 7.481247597460448e-06, + "loss": 0.1183, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05301428586244583, + "step": 9940, + "valid_targets_mean": 1269.0, + "valid_targets_min": 694 + }, + { + "epoch": 5.209533787323206, + "grad_norm": 0.7525189322704464, + "learning_rate": 7.460885392712856e-06, + "loss": 0.1257, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07202500849962234, + "step": 9945, + "valid_targets_mean": 2141.0, + "valid_targets_min": 1030 + }, + { + "epoch": 5.212152959664746, + "grad_norm": 0.6971483181611564, + "learning_rate": 7.440544580594553e-06, + "loss": 0.1135, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05420509725809097, + "step": 9950, + "valid_targets_mean": 1738.6, + "valid_targets_min": 682 + }, + { + "epoch": 5.214772132006286, + "grad_norm": 0.9016247140440351, + "learning_rate": 7.420225195808397e-06, + "loss": 0.1153, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06308970600366592, + "step": 9955, + "valid_targets_mean": 1407.2, + "valid_targets_min": 990 + }, + { + "epoch": 5.217391304347826, + "grad_norm": 0.7498791828385352, + "learning_rate": 7.399927273020748e-06, + "loss": 0.1201, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05194121599197388, + "step": 9960, + "valid_targets_mean": 1551.6, + "valid_targets_min": 639 + }, + { + "epoch": 5.2200104766893665, + "grad_norm": 0.8056681058630909, + "learning_rate": 7.379650846861295e-06, + "loss": 0.119, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05170396342873573, + "step": 9965, + "valid_targets_mean": 1442.6, + "valid_targets_min": 958 + }, + { + "epoch": 5.222629649030906, + "grad_norm": 0.8173097296836717, + "learning_rate": 7.359395951923081e-06, + "loss": 0.1211, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06028531491756439, + "step": 9970, + "valid_targets_mean": 1426.5, + "valid_targets_min": 874 + }, + { + "epoch": 5.225248821372446, + "grad_norm": 0.7462986566841966, + "learning_rate": 7.3391626227624145e-06, + "loss": 0.124, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.056972358375787735, + "step": 9975, + "valid_targets_mean": 1298.2, + "valid_targets_min": 557 + }, + { + "epoch": 5.2278679937139865, + "grad_norm": 0.8632265642665938, + "learning_rate": 7.318950893898804e-06, + "loss": 0.1218, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07349438965320587, + "step": 9980, + "valid_targets_mean": 1472.2, + "valid_targets_min": 713 + }, + { + "epoch": 5.230487166055527, + "grad_norm": 0.8247613670529226, + "learning_rate": 7.29876079981491e-06, + "loss": 0.124, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0822034552693367, + "step": 9985, + "valid_targets_mean": 3139.9, + "valid_targets_min": 760 + }, + { + "epoch": 5.233106338397066, + "grad_norm": 0.7016447370775042, + "learning_rate": 7.2785923749564905e-06, + "loss": 0.172, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08335396647453308, + "step": 9990, + "valid_targets_mean": 7612.6, + "valid_targets_min": 5111 + }, + { + "epoch": 5.2357255107386065, + "grad_norm": 0.5823301815088959, + "learning_rate": 7.2584456537323025e-06, + "loss": 0.1609, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08028516173362732, + "step": 9995, + "valid_targets_mean": 6669.0, + "valid_targets_min": 4480 + }, + { + "epoch": 5.238344683080147, + "grad_norm": 0.42686852024385435, + "learning_rate": 7.238320670514125e-06, + "loss": 0.1499, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07357516139745712, + "step": 10000, + "valid_targets_mean": 6538.6, + "valid_targets_min": 4620 + }, + { + "epoch": 5.240963855421687, + "grad_norm": 0.3860267732299242, + "learning_rate": 7.218217459636605e-06, + "loss": 0.1494, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08040302991867065, + "step": 10005, + "valid_targets_mean": 6802.6, + "valid_targets_min": 4873 + }, + { + "epoch": 5.2435830277632265, + "grad_norm": 0.41018469570895844, + "learning_rate": 7.198136055397269e-06, + "loss": 0.1619, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09762245416641235, + "step": 10010, + "valid_targets_mean": 7563.2, + "valid_targets_min": 4229 + }, + { + "epoch": 5.246202200104767, + "grad_norm": 0.44350311791841235, + "learning_rate": 7.178076492056434e-06, + "loss": 0.1576, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08566471934318542, + "step": 10015, + "valid_targets_mean": 6109.0, + "valid_targets_min": 4279 + }, + { + "epoch": 5.248821372446307, + "grad_norm": 0.3751231386489058, + "learning_rate": 7.1580388038371525e-06, + "loss": 0.1474, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05747370794415474, + "step": 10020, + "valid_targets_mean": 5549.6, + "valid_targets_min": 4542 + }, + { + "epoch": 5.251440544787847, + "grad_norm": 0.5169337392227329, + "learning_rate": 7.1380230249251605e-06, + "loss": 0.1668, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07669960707426071, + "step": 10025, + "valid_targets_mean": 2525.8, + "valid_targets_min": 1497 + }, + { + "epoch": 5.254059717129387, + "grad_norm": 0.37923721697545987, + "learning_rate": 7.118029189468812e-06, + "loss": 0.152, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07565468549728394, + "step": 10030, + "valid_targets_mean": 6166.2, + "valid_targets_min": 5332 + }, + { + "epoch": 5.256678889470927, + "grad_norm": 0.40425635783083314, + "learning_rate": 7.098057331579031e-06, + "loss": 0.1512, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08241156488656998, + "step": 10035, + "valid_targets_mean": 5823.5, + "valid_targets_min": 4612 + }, + { + "epoch": 5.259298061812467, + "grad_norm": 0.3907609589866494, + "learning_rate": 7.078107485329222e-06, + "loss": 0.1592, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0800551027059555, + "step": 10040, + "valid_targets_mean": 6896.5, + "valid_targets_min": 4491 + }, + { + "epoch": 5.261917234154008, + "grad_norm": 0.3778040111634576, + "learning_rate": 7.05817968475528e-06, + "loss": 0.1486, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07752105593681335, + "step": 10045, + "valid_targets_mean": 6611.1, + "valid_targets_min": 4754 + }, + { + "epoch": 5.264536406495547, + "grad_norm": 0.3812696012808861, + "learning_rate": 7.038273963855442e-06, + "loss": 0.145, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06828771531581879, + "step": 10050, + "valid_targets_mean": 5907.1, + "valid_targets_min": 4787 + }, + { + "epoch": 5.267155578837087, + "grad_norm": 0.38896075575746797, + "learning_rate": 7.018390356590303e-06, + "loss": 0.1371, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06619839370250702, + "step": 10055, + "valid_targets_mean": 6055.5, + "valid_targets_min": 5052 + }, + { + "epoch": 5.269774751178628, + "grad_norm": 0.39253571485970484, + "learning_rate": 6.998528896882726e-06, + "loss": 0.1397, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06778645515441895, + "step": 10060, + "valid_targets_mean": 6365.0, + "valid_targets_min": 4664 + }, + { + "epoch": 5.272393923520168, + "grad_norm": 0.3861560859423902, + "learning_rate": 6.978689618617784e-06, + "loss": 0.1504, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06602711230516434, + "step": 10065, + "valid_targets_mean": 5928.2, + "valid_targets_min": 4211 + }, + { + "epoch": 5.275013095861707, + "grad_norm": 0.3713955201784082, + "learning_rate": 6.958872555642711e-06, + "loss": 0.1486, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07369357347488403, + "step": 10070, + "valid_targets_mean": 6415.9, + "valid_targets_min": 4582 + }, + { + "epoch": 5.277632268203248, + "grad_norm": 0.38669814277909503, + "learning_rate": 6.939077741766842e-06, + "loss": 0.1348, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06115833669900894, + "step": 10075, + "valid_targets_mean": 6044.8, + "valid_targets_min": 4800 + }, + { + "epoch": 5.280251440544788, + "grad_norm": 0.3441598004906199, + "learning_rate": 6.9193052107615335e-06, + "loss": 0.1341, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06817680597305298, + "step": 10080, + "valid_targets_mean": 8009.0, + "valid_targets_min": 6651 + }, + { + "epoch": 5.282870612886328, + "grad_norm": 0.4086751254195686, + "learning_rate": 6.8995549963601675e-06, + "loss": 0.1525, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0852825790643692, + "step": 10085, + "valid_targets_mean": 5887.5, + "valid_targets_min": 3477 + }, + { + "epoch": 5.285489785227868, + "grad_norm": 0.4855072130935138, + "learning_rate": 6.8798271322580015e-06, + "loss": 0.1676, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09230928122997284, + "step": 10090, + "valid_targets_mean": 5471.1, + "valid_targets_min": 965 + }, + { + "epoch": 5.288108957569408, + "grad_norm": 0.3672577879646038, + "learning_rate": 6.860121652112211e-06, + "loss": 0.1377, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07655905187129974, + "step": 10095, + "valid_targets_mean": 6654.1, + "valid_targets_min": 5226 + }, + { + "epoch": 5.290728129910948, + "grad_norm": 0.4055655338645675, + "learning_rate": 6.840438589541733e-06, + "loss": 0.1474, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06398853659629822, + "step": 10100, + "valid_targets_mean": 6363.4, + "valid_targets_min": 4213 + }, + { + "epoch": 5.293347302252489, + "grad_norm": 0.42587886910638884, + "learning_rate": 6.820777978127315e-06, + "loss": 0.1606, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08191876113414764, + "step": 10105, + "valid_targets_mean": 5469.9, + "valid_targets_min": 3761 + }, + { + "epoch": 5.295966474594028, + "grad_norm": 0.4134904846413301, + "learning_rate": 6.801139851411347e-06, + "loss": 0.1778, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10157156735658646, + "step": 10110, + "valid_targets_mean": 7206.2, + "valid_targets_min": 4993 + }, + { + "epoch": 5.298585646935568, + "grad_norm": 0.3917239886283864, + "learning_rate": 6.78152424289789e-06, + "loss": 0.173, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07931825518608093, + "step": 10115, + "valid_targets_mean": 6402.2, + "valid_targets_min": 5199 + }, + { + "epoch": 5.301204819277109, + "grad_norm": 0.3825102469209971, + "learning_rate": 6.761931186052579e-06, + "loss": 0.1508, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08583804219961166, + "step": 10120, + "valid_targets_mean": 7578.1, + "valid_targets_min": 4534 + }, + { + "epoch": 5.303823991618648, + "grad_norm": 0.4109790035922538, + "learning_rate": 6.742360714302576e-06, + "loss": 0.1511, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06634113192558289, + "step": 10125, + "valid_targets_mean": 6264.4, + "valid_targets_min": 4751 + }, + { + "epoch": 5.306443163960188, + "grad_norm": 0.4112262337186078, + "learning_rate": 6.7228128610365116e-06, + "loss": 0.152, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06814072281122208, + "step": 10130, + "valid_targets_mean": 5604.1, + "valid_targets_min": 3888 + }, + { + "epoch": 5.309062336301729, + "grad_norm": 0.4031731450213549, + "learning_rate": 6.703287659604429e-06, + "loss": 0.1576, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08444470167160034, + "step": 10135, + "valid_targets_mean": 7001.6, + "valid_targets_min": 4455 + }, + { + "epoch": 5.311681508643269, + "grad_norm": 0.39609044928145004, + "learning_rate": 6.683785143317707e-06, + "loss": 0.15, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08760792016983032, + "step": 10140, + "valid_targets_mean": 6955.5, + "valid_targets_min": 5230 + }, + { + "epoch": 5.314300680984809, + "grad_norm": 0.3808870932482914, + "learning_rate": 6.6643053454490605e-06, + "loss": 0.1577, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06994412839412689, + "step": 10145, + "valid_targets_mean": 7295.8, + "valid_targets_min": 5668 + }, + { + "epoch": 5.316919853326349, + "grad_norm": 0.413429926706307, + "learning_rate": 6.644848299232407e-06, + "loss": 0.1551, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0801548883318901, + "step": 10150, + "valid_targets_mean": 6350.4, + "valid_targets_min": 4871 + }, + { + "epoch": 5.319539025667889, + "grad_norm": 0.37475407501719343, + "learning_rate": 6.625414037862865e-06, + "loss": 0.1449, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08898886293172836, + "step": 10155, + "valid_targets_mean": 8015.2, + "valid_targets_min": 6018 + }, + { + "epoch": 5.322158198009429, + "grad_norm": 0.35684775592882495, + "learning_rate": 6.606002594496683e-06, + "loss": 0.1313, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06981298327445984, + "step": 10160, + "valid_targets_mean": 7110.1, + "valid_targets_min": 3533 + }, + { + "epoch": 5.324777370350969, + "grad_norm": 0.4425639362014185, + "learning_rate": 6.586614002251173e-06, + "loss": 0.1573, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08674512058496475, + "step": 10165, + "valid_targets_mean": 6875.0, + "valid_targets_min": 5199 + }, + { + "epoch": 5.327396542692509, + "grad_norm": 0.42824677791656335, + "learning_rate": 6.567248294204669e-06, + "loss": 0.1549, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07547745108604431, + "step": 10170, + "valid_targets_mean": 5568.4, + "valid_targets_min": 4923 + }, + { + "epoch": 5.330015715034049, + "grad_norm": 0.36854650462535177, + "learning_rate": 6.547905503396454e-06, + "loss": 0.151, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.059491705149412155, + "step": 10175, + "valid_targets_mean": 6421.9, + "valid_targets_min": 4527 + }, + { + "epoch": 5.3326348873755895, + "grad_norm": 0.39351311799382077, + "learning_rate": 6.528585662826725e-06, + "loss": 0.1485, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09477847069501877, + "step": 10180, + "valid_targets_mean": 7147.9, + "valid_targets_min": 3082 + }, + { + "epoch": 5.33525405971713, + "grad_norm": 0.38167891224919565, + "learning_rate": 6.5092888054564995e-06, + "loss": 0.1369, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06909792125225067, + "step": 10185, + "valid_targets_mean": 6880.6, + "valid_targets_min": 4685 + }, + { + "epoch": 5.337873232058669, + "grad_norm": 0.40048444743253364, + "learning_rate": 6.490014964207622e-06, + "loss": 0.1509, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06907521188259125, + "step": 10190, + "valid_targets_mean": 5915.5, + "valid_targets_min": 4875 + }, + { + "epoch": 5.34049240440021, + "grad_norm": 0.3729187881083819, + "learning_rate": 6.470764171962633e-06, + "loss": 0.1539, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06739333271980286, + "step": 10195, + "valid_targets_mean": 6234.5, + "valid_targets_min": 4433 + }, + { + "epoch": 5.34311157674175, + "grad_norm": 0.3943046453666481, + "learning_rate": 6.451536461564774e-06, + "loss": 0.144, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06472145020961761, + "step": 10200, + "valid_targets_mean": 5684.0, + "valid_targets_min": 4540 + }, + { + "epoch": 5.345730749083289, + "grad_norm": 0.43902753507712433, + "learning_rate": 6.432331865817891e-06, + "loss": 0.1557, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09635139256715775, + "step": 10205, + "valid_targets_mean": 7353.4, + "valid_targets_min": 5101 + }, + { + "epoch": 5.34834992142483, + "grad_norm": 0.4040924994306939, + "learning_rate": 6.413150417486409e-06, + "loss": 0.147, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06020814925432205, + "step": 10210, + "valid_targets_mean": 5300.5, + "valid_targets_min": 4442 + }, + { + "epoch": 5.35096909376637, + "grad_norm": 0.3703374972314483, + "learning_rate": 6.3939921492952514e-06, + "loss": 0.1273, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06047903001308441, + "step": 10215, + "valid_targets_mean": 6084.1, + "valid_targets_min": 5268 + }, + { + "epoch": 5.35358826610791, + "grad_norm": 0.3636680625578178, + "learning_rate": 6.374857093929802e-06, + "loss": 0.1303, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07073706388473511, + "step": 10220, + "valid_targets_mean": 6446.6, + "valid_targets_min": 5074 + }, + { + "epoch": 5.35620743844945, + "grad_norm": 0.3788299313306084, + "learning_rate": 6.355745284035835e-06, + "loss": 0.1361, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06560464203357697, + "step": 10225, + "valid_targets_mean": 6195.0, + "valid_targets_min": 5221 + }, + { + "epoch": 5.35882661079099, + "grad_norm": 0.4113542279653514, + "learning_rate": 6.336656752219479e-06, + "loss": 0.1458, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07294383645057678, + "step": 10230, + "valid_targets_mean": 5689.1, + "valid_targets_min": 4642 + }, + { + "epoch": 5.36144578313253, + "grad_norm": 0.47569693807252555, + "learning_rate": 6.3175915310471155e-06, + "loss": 0.1676, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08518552035093307, + "step": 10235, + "valid_targets_mean": 4461.4, + "valid_targets_min": 3222 + }, + { + "epoch": 5.3640649554740705, + "grad_norm": 0.4401813564141267, + "learning_rate": 6.2985496530454115e-06, + "loss": 0.1766, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07736337929964066, + "step": 10240, + "valid_targets_mean": 6822.2, + "valid_targets_min": 4371 + }, + { + "epoch": 5.36668412781561, + "grad_norm": 0.4407114697967697, + "learning_rate": 6.279531150701146e-06, + "loss": 0.1422, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07739515602588654, + "step": 10245, + "valid_targets_mean": 5632.6, + "valid_targets_min": 3689 + }, + { + "epoch": 5.36930330015715, + "grad_norm": 0.439335184296538, + "learning_rate": 6.260536056461275e-06, + "loss": 0.1502, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07690007984638214, + "step": 10250, + "valid_targets_mean": 6364.1, + "valid_targets_min": 4281 + }, + { + "epoch": 5.3719224724986905, + "grad_norm": 0.4600670189533514, + "learning_rate": 6.241564402732776e-06, + "loss": 0.1517, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09007485955953598, + "step": 10255, + "valid_targets_mean": 6337.8, + "valid_targets_min": 4844 + }, + { + "epoch": 5.374541644840231, + "grad_norm": 0.3955954710935925, + "learning_rate": 6.222616221882658e-06, + "loss": 0.163, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06693617254495621, + "step": 10260, + "valid_targets_mean": 5507.5, + "valid_targets_min": 4549 + }, + { + "epoch": 5.37716081718177, + "grad_norm": 0.39154404681959404, + "learning_rate": 6.203691546237876e-06, + "loss": 0.1512, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06701533496379852, + "step": 10265, + "valid_targets_mean": 5274.8, + "valid_targets_min": 2461 + }, + { + "epoch": 5.3797799895233105, + "grad_norm": 0.405735916954033, + "learning_rate": 6.184790408085281e-06, + "loss": 0.153, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0845988541841507, + "step": 10270, + "valid_targets_mean": 6465.2, + "valid_targets_min": 2815 + }, + { + "epoch": 5.382399161864851, + "grad_norm": 0.37252624761638364, + "learning_rate": 6.165912839671577e-06, + "loss": 0.1502, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06499049812555313, + "step": 10275, + "valid_targets_mean": 6715.5, + "valid_targets_min": 5192 + }, + { + "epoch": 5.385018334206391, + "grad_norm": 0.4138794283918792, + "learning_rate": 6.147058873203247e-06, + "loss": 0.1362, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06541548669338226, + "step": 10280, + "valid_targets_mean": 5737.2, + "valid_targets_min": 5186 + }, + { + "epoch": 5.3876375065479305, + "grad_norm": 0.4320162655413788, + "learning_rate": 6.12822854084651e-06, + "loss": 0.1482, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05883662402629852, + "step": 10285, + "valid_targets_mean": 5329.5, + "valid_targets_min": 3786 + }, + { + "epoch": 5.390256678889471, + "grad_norm": 0.3993761360156539, + "learning_rate": 6.1094218747272725e-06, + "loss": 0.193, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08521421253681183, + "step": 10290, + "valid_targets_mean": 6233.8, + "valid_targets_min": 5147 + }, + { + "epoch": 5.392875851231011, + "grad_norm": 0.39569544811437657, + "learning_rate": 6.0906389069310434e-06, + "loss": 0.141, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08180350810289383, + "step": 10295, + "valid_targets_mean": 5807.6, + "valid_targets_min": 3952 + }, + { + "epoch": 5.395495023572551, + "grad_norm": 0.4311559510427168, + "learning_rate": 6.07187966950292e-06, + "loss": 0.1522, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08369584381580353, + "step": 10300, + "valid_targets_mean": 6452.8, + "valid_targets_min": 5079 + }, + { + "epoch": 5.398114195914091, + "grad_norm": 0.4342446058772487, + "learning_rate": 6.053144194447507e-06, + "loss": 0.1546, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08193376660346985, + "step": 10305, + "valid_targets_mean": 6432.9, + "valid_targets_min": 3762 + }, + { + "epoch": 5.400733368255631, + "grad_norm": 0.4094968353215779, + "learning_rate": 6.0344325137288675e-06, + "loss": 0.1353, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06287078559398651, + "step": 10310, + "valid_targets_mean": 5954.1, + "valid_targets_min": 4726 + }, + { + "epoch": 5.403352540597171, + "grad_norm": 0.4694056913890443, + "learning_rate": 6.015744659270475e-06, + "loss": 0.1419, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08099617063999176, + "step": 10315, + "valid_targets_mean": 5874.6, + "valid_targets_min": 3724 + }, + { + "epoch": 5.405971712938712, + "grad_norm": 0.3680358302163034, + "learning_rate": 5.997080662955148e-06, + "loss": 0.1311, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06874550879001617, + "step": 10320, + "valid_targets_mean": 6436.9, + "valid_targets_min": 5578 + }, + { + "epoch": 5.408590885280251, + "grad_norm": 0.40563622398332005, + "learning_rate": 5.978440556625009e-06, + "loss": 0.1483, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0687650516629219, + "step": 10325, + "valid_targets_mean": 6727.8, + "valid_targets_min": 5795 + }, + { + "epoch": 5.411210057621791, + "grad_norm": 0.38579147373260586, + "learning_rate": 5.9598243720814e-06, + "loss": 0.1406, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06289946287870407, + "step": 10330, + "valid_targets_mean": 6116.2, + "valid_targets_min": 5268 + }, + { + "epoch": 5.413829229963332, + "grad_norm": 0.36715823726572966, + "learning_rate": 5.941232141084892e-06, + "loss": 0.1424, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06658988445997238, + "step": 10335, + "valid_targets_mean": 7379.5, + "valid_targets_min": 4920 + }, + { + "epoch": 5.416448402304872, + "grad_norm": 0.3570910803879039, + "learning_rate": 5.922663895355138e-06, + "loss": 0.1486, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.055937521159648895, + "step": 10340, + "valid_targets_mean": 7048.4, + "valid_targets_min": 5243 + }, + { + "epoch": 5.419067574646411, + "grad_norm": 0.40882981172440686, + "learning_rate": 5.904119666570929e-06, + "loss": 0.1341, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07782215625047684, + "step": 10345, + "valid_targets_mean": 6385.8, + "valid_targets_min": 4794 + }, + { + "epoch": 5.421686746987952, + "grad_norm": 0.4339250956620702, + "learning_rate": 5.885599486370024e-06, + "loss": 0.1522, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06769482791423798, + "step": 10350, + "valid_targets_mean": 6215.4, + "valid_targets_min": 5168 + }, + { + "epoch": 5.424305919329492, + "grad_norm": 0.43044761296828704, + "learning_rate": 5.867103386349189e-06, + "loss": 0.1549, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08711810410022736, + "step": 10355, + "valid_targets_mean": 5333.2, + "valid_targets_min": 3130 + }, + { + "epoch": 5.426925091671032, + "grad_norm": 0.5643488195304203, + "learning_rate": 5.8486313980640975e-06, + "loss": 0.1862, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09607409685850143, + "step": 10360, + "valid_targets_mean": 5546.2, + "valid_targets_min": 1971 + }, + { + "epoch": 5.429544264012572, + "grad_norm": 0.5850889872445502, + "learning_rate": 5.830183553029285e-06, + "loss": 0.2135, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13026058673858643, + "step": 10365, + "valid_targets_mean": 5648.9, + "valid_targets_min": 1631 + }, + { + "epoch": 5.432163436354112, + "grad_norm": 0.5666667792864185, + "learning_rate": 5.811759882718102e-06, + "loss": 0.2166, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12489330023527145, + "step": 10370, + "valid_targets_mean": 5411.4, + "valid_targets_min": 1509 + }, + { + "epoch": 5.434782608695652, + "grad_norm": 0.5258933268049755, + "learning_rate": 5.793360418562659e-06, + "loss": 0.2041, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09626871347427368, + "step": 10375, + "valid_targets_mean": 4960.2, + "valid_targets_min": 2736 + }, + { + "epoch": 5.437401781037193, + "grad_norm": 0.6114570302288379, + "learning_rate": 5.7749851919537396e-06, + "loss": 0.2091, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09290073066949844, + "step": 10380, + "valid_targets_mean": 3726.8, + "valid_targets_min": 1439 + }, + { + "epoch": 5.440020953378732, + "grad_norm": 0.5384858421780185, + "learning_rate": 5.756634234240825e-06, + "loss": 0.2165, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09385785460472107, + "step": 10385, + "valid_targets_mean": 4269.4, + "valid_targets_min": 1838 + }, + { + "epoch": 5.442640125720272, + "grad_norm": 0.5329360036480885, + "learning_rate": 5.738307576731943e-06, + "loss": 0.2023, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12725722789764404, + "step": 10390, + "valid_targets_mean": 5973.6, + "valid_targets_min": 2762 + }, + { + "epoch": 5.445259298061813, + "grad_norm": 0.5793722639828044, + "learning_rate": 5.7200052506937095e-06, + "loss": 0.211, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0956265777349472, + "step": 10395, + "valid_targets_mean": 3987.1, + "valid_targets_min": 1654 + }, + { + "epoch": 5.447878470403353, + "grad_norm": 0.496775138740992, + "learning_rate": 5.701727287351186e-06, + "loss": 0.2087, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09867385029792786, + "step": 10400, + "valid_targets_mean": 5043.6, + "valid_targets_min": 2493 + }, + { + "epoch": 5.450497642744892, + "grad_norm": 0.5812377395766525, + "learning_rate": 5.6834737178879e-06, + "loss": 0.2188, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09992499649524689, + "step": 10405, + "valid_targets_mean": 4468.9, + "valid_targets_min": 874 + }, + { + "epoch": 5.453116815086433, + "grad_norm": 0.48686859517785813, + "learning_rate": 5.665244573445747e-06, + "loss": 0.208, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09565421938896179, + "step": 10410, + "valid_targets_mean": 5241.0, + "valid_targets_min": 953 + }, + { + "epoch": 5.455735987427973, + "grad_norm": 0.5699010720655088, + "learning_rate": 5.647039885124956e-06, + "loss": 0.2108, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1318211406469345, + "step": 10415, + "valid_targets_mean": 5277.0, + "valid_targets_min": 1265 + }, + { + "epoch": 5.458355159769513, + "grad_norm": 0.5097020234723649, + "learning_rate": 5.628859683984034e-06, + "loss": 0.2041, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10591420531272888, + "step": 10420, + "valid_targets_mean": 6127.8, + "valid_targets_min": 2566 + }, + { + "epoch": 5.460974332111053, + "grad_norm": 0.5595183648685903, + "learning_rate": 5.610704001039706e-06, + "loss": 0.2101, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09012778103351593, + "step": 10425, + "valid_targets_mean": 3446.9, + "valid_targets_min": 1759 + }, + { + "epoch": 5.463593504452593, + "grad_norm": 0.5984489249129414, + "learning_rate": 5.592572867266877e-06, + "loss": 0.2007, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09819424897432327, + "step": 10430, + "valid_targets_mean": 3659.4, + "valid_targets_min": 2179 + }, + { + "epoch": 5.466212676794133, + "grad_norm": 0.620023251286136, + "learning_rate": 5.57446631359855e-06, + "loss": 0.2045, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1056923121213913, + "step": 10435, + "valid_targets_mean": 4161.5, + "valid_targets_min": 1785 + }, + { + "epoch": 5.4688318491356736, + "grad_norm": 0.6052536403022243, + "learning_rate": 5.556384370925812e-06, + "loss": 0.1994, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11983170360326767, + "step": 10440, + "valid_targets_mean": 4467.9, + "valid_targets_min": 2345 + }, + { + "epoch": 5.471451021477213, + "grad_norm": 0.5988358860825104, + "learning_rate": 5.538327070097753e-06, + "loss": 0.2061, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11621883511543274, + "step": 10445, + "valid_targets_mean": 4057.2, + "valid_targets_min": 2767 + }, + { + "epoch": 5.474070193818753, + "grad_norm": 0.6636345304563924, + "learning_rate": 5.5202944419214236e-06, + "loss": 0.2099, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10627111792564392, + "step": 10450, + "valid_targets_mean": 3450.2, + "valid_targets_min": 1205 + }, + { + "epoch": 5.476689366160294, + "grad_norm": 0.5966289856538027, + "learning_rate": 5.502286517161783e-06, + "loss": 0.2016, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10250097513198853, + "step": 10455, + "valid_targets_mean": 3777.1, + "valid_targets_min": 2004 + }, + { + "epoch": 5.479308538501833, + "grad_norm": 0.6305270129637696, + "learning_rate": 5.4843033265416426e-06, + "loss": 0.211, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11023075878620148, + "step": 10460, + "valid_targets_mean": 4273.0, + "valid_targets_min": 1469 + }, + { + "epoch": 5.481927710843373, + "grad_norm": 0.62686315049717, + "learning_rate": 5.466344900741616e-06, + "loss": 0.1947, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11784721165895462, + "step": 10465, + "valid_targets_mean": 4196.8, + "valid_targets_min": 1889 + }, + { + "epoch": 5.484546883184914, + "grad_norm": 0.6191613884937408, + "learning_rate": 5.448411270400071e-06, + "loss": 0.1917, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10129757970571518, + "step": 10470, + "valid_targets_mean": 4319.2, + "valid_targets_min": 2046 + }, + { + "epoch": 5.487166055526454, + "grad_norm": 0.6381998419206792, + "learning_rate": 5.430502466113052e-06, + "loss": 0.1921, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11723365634679794, + "step": 10475, + "valid_targets_mean": 4580.1, + "valid_targets_min": 3373 + }, + { + "epoch": 5.489785227867994, + "grad_norm": 0.6853399916665825, + "learning_rate": 5.4126185184342875e-06, + "loss": 0.2037, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10599417984485626, + "step": 10480, + "valid_targets_mean": 3786.0, + "valid_targets_min": 1747 + }, + { + "epoch": 5.492404400209534, + "grad_norm": 0.6176675884859637, + "learning_rate": 5.39475945787505e-06, + "loss": 0.2049, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08931992948055267, + "step": 10485, + "valid_targets_mean": 3339.9, + "valid_targets_min": 1166 + }, + { + "epoch": 5.495023572551074, + "grad_norm": 0.5792463399349149, + "learning_rate": 5.376925314904202e-06, + "loss": 0.1959, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09918844699859619, + "step": 10490, + "valid_targets_mean": 4114.1, + "valid_targets_min": 1537 + }, + { + "epoch": 5.497642744892614, + "grad_norm": 0.5807901724764257, + "learning_rate": 5.359116119948056e-06, + "loss": 0.1973, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09208104759454727, + "step": 10495, + "valid_targets_mean": 4550.4, + "valid_targets_min": 3119 + }, + { + "epoch": 5.500261917234154, + "grad_norm": 0.6137099431127251, + "learning_rate": 5.341331903390381e-06, + "loss": 0.1979, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09576673805713654, + "step": 10500, + "valid_targets_mean": 3810.8, + "valid_targets_min": 2562 + }, + { + "epoch": 5.502881089575694, + "grad_norm": 0.6073790234492764, + "learning_rate": 5.323572695572326e-06, + "loss": 0.1962, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10099849849939346, + "step": 10505, + "valid_targets_mean": 4045.5, + "valid_targets_min": 2659 + }, + { + "epoch": 5.505500261917234, + "grad_norm": 0.553561835142201, + "learning_rate": 5.305838526792375e-06, + "loss": 0.1878, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08134942501783371, + "step": 10510, + "valid_targets_mean": 4064.8, + "valid_targets_min": 1349 + }, + { + "epoch": 5.5081194342587745, + "grad_norm": 0.6775278036738944, + "learning_rate": 5.2881294273062926e-06, + "loss": 0.2001, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09701518714427948, + "step": 10515, + "valid_targets_mean": 3371.4, + "valid_targets_min": 2474 + }, + { + "epoch": 5.510738606600315, + "grad_norm": 0.6909881239559398, + "learning_rate": 5.270445427327071e-06, + "loss": 0.1979, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0812319666147232, + "step": 10520, + "valid_targets_mean": 2590.5, + "valid_targets_min": 738 + }, + { + "epoch": 5.513357778941854, + "grad_norm": 0.6275919728018728, + "learning_rate": 5.252786557024885e-06, + "loss": 0.1893, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09055991470813751, + "step": 10525, + "valid_targets_mean": 3570.5, + "valid_targets_min": 2033 + }, + { + "epoch": 5.5159769512833945, + "grad_norm": 0.721356563398191, + "learning_rate": 5.2351528465270405e-06, + "loss": 0.195, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10568110644817352, + "step": 10530, + "valid_targets_mean": 2933.1, + "valid_targets_min": 1346 + }, + { + "epoch": 5.518596123624935, + "grad_norm": 0.8071270869299125, + "learning_rate": 5.217544325917893e-06, + "loss": 0.1954, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10447847098112106, + "step": 10535, + "valid_targets_mean": 2991.1, + "valid_targets_min": 1821 + }, + { + "epoch": 5.521215295966474, + "grad_norm": 0.6504779203035157, + "learning_rate": 5.199961025238871e-06, + "loss": 0.1948, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09409458935260773, + "step": 10540, + "valid_targets_mean": 3400.1, + "valid_targets_min": 2535 + }, + { + "epoch": 5.5238344683080145, + "grad_norm": 0.671693602313302, + "learning_rate": 5.182402974488323e-06, + "loss": 0.1952, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09331804513931274, + "step": 10545, + "valid_targets_mean": 3411.5, + "valid_targets_min": 2352 + }, + { + "epoch": 5.526453640649555, + "grad_norm": 0.6471336187560586, + "learning_rate": 5.164870203621553e-06, + "loss": 0.1928, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08596295118331909, + "step": 10550, + "valid_targets_mean": 3319.8, + "valid_targets_min": 1153 + }, + { + "epoch": 5.529072812991095, + "grad_norm": 0.9139238811458623, + "learning_rate": 5.147362742550725e-06, + "loss": 0.1943, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10043549537658691, + "step": 10555, + "valid_targets_mean": 3718.0, + "valid_targets_min": 2072 + }, + { + "epoch": 5.5316919853326345, + "grad_norm": 0.6312099733530194, + "learning_rate": 5.129880621144827e-06, + "loss": 0.1953, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0861826241016388, + "step": 10560, + "valid_targets_mean": 3451.0, + "valid_targets_min": 922 + }, + { + "epoch": 5.534311157674175, + "grad_norm": 0.6036615572114501, + "learning_rate": 5.112423869229608e-06, + "loss": 0.1927, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07662707567214966, + "step": 10565, + "valid_targets_mean": 3381.6, + "valid_targets_min": 1417 + }, + { + "epoch": 5.536930330015715, + "grad_norm": 0.6239335015347284, + "learning_rate": 5.09499251658754e-06, + "loss": 0.2003, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08969300985336304, + "step": 10570, + "valid_targets_mean": 4260.6, + "valid_targets_min": 1844 + }, + { + "epoch": 5.539549502357255, + "grad_norm": 0.7308611942195394, + "learning_rate": 5.077586592957771e-06, + "loss": 0.1931, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1015428975224495, + "step": 10575, + "valid_targets_mean": 3525.2, + "valid_targets_min": 1261 + }, + { + "epoch": 5.542168674698795, + "grad_norm": 0.6311203968047921, + "learning_rate": 5.060206128036034e-06, + "loss": 0.1944, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11546990275382996, + "step": 10580, + "valid_targets_mean": 4548.6, + "valid_targets_min": 2077 + }, + { + "epoch": 5.544787847040335, + "grad_norm": 0.6104267190252021, + "learning_rate": 5.042851151474675e-06, + "loss": 0.1919, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10856322199106216, + "step": 10585, + "valid_targets_mean": 4140.9, + "valid_targets_min": 2724 + }, + { + "epoch": 5.547407019381875, + "grad_norm": 0.667555633639888, + "learning_rate": 5.025521692882513e-06, + "loss": 0.1946, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14028789103031158, + "step": 10590, + "valid_targets_mean": 5291.4, + "valid_targets_min": 2292 + }, + { + "epoch": 5.550026191723416, + "grad_norm": 0.7172987509908402, + "learning_rate": 5.008217781824849e-06, + "loss": 0.1971, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0968562513589859, + "step": 10595, + "valid_targets_mean": 2965.1, + "valid_targets_min": 1377 + }, + { + "epoch": 5.552645364064955, + "grad_norm": 0.6177201842022538, + "learning_rate": 4.990939447823402e-06, + "loss": 0.198, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08947396278381348, + "step": 10600, + "valid_targets_mean": 3099.5, + "valid_targets_min": 1350 + }, + { + "epoch": 5.555264536406495, + "grad_norm": 0.6603323375361946, + "learning_rate": 4.973686720356248e-06, + "loss": 0.1945, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09418955445289612, + "step": 10605, + "valid_targets_mean": 3031.9, + "valid_targets_min": 654 + }, + { + "epoch": 5.557883708748036, + "grad_norm": 0.6490782382697062, + "learning_rate": 4.956459628857775e-06, + "loss": 0.1958, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07847204059362411, + "step": 10610, + "valid_targets_mean": 3463.8, + "valid_targets_min": 1706 + }, + { + "epoch": 5.560502881089576, + "grad_norm": 0.6090670662855951, + "learning_rate": 4.9392582027186466e-06, + "loss": 0.2016, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10062491148710251, + "step": 10615, + "valid_targets_mean": 4105.5, + "valid_targets_min": 1739 + }, + { + "epoch": 5.563122053431115, + "grad_norm": 0.6709318550615645, + "learning_rate": 4.922082471285712e-06, + "loss": 0.1947, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08609208464622498, + "step": 10620, + "valid_targets_mean": 2944.4, + "valid_targets_min": 1302 + }, + { + "epoch": 5.565741225772656, + "grad_norm": 0.5884399803714986, + "learning_rate": 4.9049324638620245e-06, + "loss": 0.182, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0818995013833046, + "step": 10625, + "valid_targets_mean": 3531.5, + "valid_targets_min": 2501 + }, + { + "epoch": 5.568360398114196, + "grad_norm": 0.5836595702624258, + "learning_rate": 4.8878082097067055e-06, + "loss": 0.1925, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09440377354621887, + "step": 10630, + "valid_targets_mean": 4673.8, + "valid_targets_min": 3232 + }, + { + "epoch": 5.570979570455736, + "grad_norm": 0.6058345329660421, + "learning_rate": 4.870709738034982e-06, + "loss": 0.1831, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1017429381608963, + "step": 10635, + "valid_targets_mean": 4465.1, + "valid_targets_min": 1101 + }, + { + "epoch": 5.573598742797276, + "grad_norm": 0.6198171565286366, + "learning_rate": 4.85363707801805e-06, + "loss": 0.2082, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10447974503040314, + "step": 10640, + "valid_targets_mean": 4113.2, + "valid_targets_min": 2079 + }, + { + "epoch": 5.576217915138816, + "grad_norm": 1.4356392096515265, + "learning_rate": 4.836590258783118e-06, + "loss": 0.1954, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10219666361808777, + "step": 10645, + "valid_targets_mean": 3891.4, + "valid_targets_min": 2138 + }, + { + "epoch": 5.578837087480356, + "grad_norm": 0.5999752289086019, + "learning_rate": 4.819569309413266e-06, + "loss": 0.1962, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09590047597885132, + "step": 10650, + "valid_targets_mean": 3470.2, + "valid_targets_min": 1234 + }, + { + "epoch": 5.581456259821897, + "grad_norm": 0.6151013944912155, + "learning_rate": 4.802574258947459e-06, + "loss": 0.1968, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09681589901447296, + "step": 10655, + "valid_targets_mean": 4038.5, + "valid_targets_min": 1822 + }, + { + "epoch": 5.584075432163436, + "grad_norm": 0.5968394738555188, + "learning_rate": 4.7856051363804715e-06, + "loss": 0.2043, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09785608947277069, + "step": 10660, + "valid_targets_mean": 4214.6, + "valid_targets_min": 1651 + }, + { + "epoch": 5.586694604504976, + "grad_norm": 0.6446692840414369, + "learning_rate": 4.768661970662847e-06, + "loss": 0.1932, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11061255633831024, + "step": 10665, + "valid_targets_mean": 3447.9, + "valid_targets_min": 1434 + }, + { + "epoch": 5.589313776846517, + "grad_norm": 0.5956230197811474, + "learning_rate": 4.751744790700841e-06, + "loss": 0.1861, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10208860039710999, + "step": 10670, + "valid_targets_mean": 4753.4, + "valid_targets_min": 2725 + }, + { + "epoch": 5.591932949188057, + "grad_norm": 0.592416691781473, + "learning_rate": 4.7348536253563815e-06, + "loss": 0.1832, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09418331831693649, + "step": 10675, + "valid_targets_mean": 4005.8, + "valid_targets_min": 1966 + }, + { + "epoch": 5.594552121529596, + "grad_norm": 0.6320872525497788, + "learning_rate": 4.717988503446993e-06, + "loss": 0.1802, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08939506113529205, + "step": 10680, + "valid_targets_mean": 3669.0, + "valid_targets_min": 1407 + }, + { + "epoch": 5.597171293871137, + "grad_norm": 0.6581995553668584, + "learning_rate": 4.7011494537458035e-06, + "loss": 0.1822, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09837263822555542, + "step": 10685, + "valid_targets_mean": 4330.5, + "valid_targets_min": 1444 + }, + { + "epoch": 5.599790466212677, + "grad_norm": 0.6160637343893121, + "learning_rate": 4.684336504981426e-06, + "loss": 0.1746, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07830608636140823, + "step": 10690, + "valid_targets_mean": 3077.8, + "valid_targets_min": 1504 + }, + { + "epoch": 5.602409638554217, + "grad_norm": 0.6184021344561963, + "learning_rate": 4.667549685837962e-06, + "loss": 0.1721, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0702492818236351, + "step": 10695, + "valid_targets_mean": 3051.6, + "valid_targets_min": 858 + }, + { + "epoch": 5.605028810895757, + "grad_norm": 0.6898866591128014, + "learning_rate": 4.650789024954929e-06, + "loss": 0.1887, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07904627919197083, + "step": 10700, + "valid_targets_mean": 3231.8, + "valid_targets_min": 1288 + }, + { + "epoch": 5.607647983237297, + "grad_norm": 0.664381529980434, + "learning_rate": 4.634054550927218e-06, + "loss": 0.2058, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09320087730884552, + "step": 10705, + "valid_targets_mean": 4053.0, + "valid_targets_min": 1537 + }, + { + "epoch": 5.610267155578837, + "grad_norm": 0.6771694791746062, + "learning_rate": 4.6173462923050424e-06, + "loss": 0.1862, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09745335578918457, + "step": 10710, + "valid_targets_mean": 3917.1, + "valid_targets_min": 2060 + }, + { + "epoch": 5.612886327920377, + "grad_norm": 0.6242309125978881, + "learning_rate": 4.600664277593892e-06, + "loss": 0.1913, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1041133925318718, + "step": 10715, + "valid_targets_mean": 4482.6, + "valid_targets_min": 2515 + }, + { + "epoch": 5.615505500261917, + "grad_norm": 0.628486105645744, + "learning_rate": 4.584008535254482e-06, + "loss": 0.1862, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09165383875370026, + "step": 10720, + "valid_targets_mean": 3847.2, + "valid_targets_min": 1744 + }, + { + "epoch": 5.618124672603457, + "grad_norm": 0.6165649846115652, + "learning_rate": 4.567379093702691e-06, + "loss": 0.1913, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09430750459432602, + "step": 10725, + "valid_targets_mean": 5009.9, + "valid_targets_min": 2062 + }, + { + "epoch": 5.620743844944998, + "grad_norm": 0.6345298501930282, + "learning_rate": 4.550775981309561e-06, + "loss": 0.1865, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08381767570972443, + "step": 10730, + "valid_targets_mean": 3550.4, + "valid_targets_min": 1181 + }, + { + "epoch": 5.623363017286538, + "grad_norm": 0.6446078817200693, + "learning_rate": 4.534199226401177e-06, + "loss": 0.1785, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10016798228025436, + "step": 10735, + "valid_targets_mean": 4010.6, + "valid_targets_min": 1937 + }, + { + "epoch": 5.625982189628077, + "grad_norm": 0.6983886083346015, + "learning_rate": 4.5176488572586765e-06, + "loss": 0.1948, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10849693417549133, + "step": 10740, + "valid_targets_mean": 3624.9, + "valid_targets_min": 1649 + }, + { + "epoch": 5.628601361969618, + "grad_norm": 0.7505911544275667, + "learning_rate": 4.501124902118177e-06, + "loss": 0.1855, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09305763244628906, + "step": 10745, + "valid_targets_mean": 2808.1, + "valid_targets_min": 1197 + }, + { + "epoch": 5.631220534311158, + "grad_norm": 0.7966629300365251, + "learning_rate": 4.48462738917073e-06, + "loss": 0.1888, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09724985063076019, + "step": 10750, + "valid_targets_mean": 3251.4, + "valid_targets_min": 1824 + }, + { + "epoch": 5.633839706652697, + "grad_norm": 0.6871211929063602, + "learning_rate": 4.468156346562282e-06, + "loss": 0.1978, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09823998808860779, + "step": 10755, + "valid_targets_mean": 3145.6, + "valid_targets_min": 538 + }, + { + "epoch": 5.636458878994238, + "grad_norm": 0.6329632570910867, + "learning_rate": 4.451711802393615e-06, + "loss": 0.1914, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08536972105503082, + "step": 10760, + "valid_targets_mean": 3597.1, + "valid_targets_min": 537 + }, + { + "epoch": 5.639078051335778, + "grad_norm": 0.6906245376287569, + "learning_rate": 4.435293784720283e-06, + "loss": 0.2037, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09746938198804855, + "step": 10765, + "valid_targets_mean": 3386.5, + "valid_targets_min": 2169 + }, + { + "epoch": 5.641697223677318, + "grad_norm": 0.6556767054751694, + "learning_rate": 4.418902321552629e-06, + "loss": 0.1868, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0984741672873497, + "step": 10770, + "valid_targets_mean": 3687.6, + "valid_targets_min": 1625 + }, + { + "epoch": 5.6443163960188585, + "grad_norm": 0.6336878369135004, + "learning_rate": 4.4025374408556406e-06, + "loss": 0.2017, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08894580602645874, + "step": 10775, + "valid_targets_mean": 3807.0, + "valid_targets_min": 2642 + }, + { + "epoch": 5.646935568360398, + "grad_norm": 0.6360101774608651, + "learning_rate": 4.386199170549002e-06, + "loss": 0.1967, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11144876480102539, + "step": 10780, + "valid_targets_mean": 4289.9, + "valid_targets_min": 2935 + }, + { + "epoch": 5.649554740701938, + "grad_norm": 0.5724879038589, + "learning_rate": 4.36988753850695e-06, + "loss": 0.1933, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10036087781190872, + "step": 10785, + "valid_targets_mean": 5189.9, + "valid_targets_min": 2652 + }, + { + "epoch": 5.6521739130434785, + "grad_norm": 0.6385118450508577, + "learning_rate": 4.353602572558322e-06, + "loss": 0.1943, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1132982149720192, + "step": 10790, + "valid_targets_mean": 4117.2, + "valid_targets_min": 648 + }, + { + "epoch": 5.654793085385018, + "grad_norm": 0.6732253239872739, + "learning_rate": 4.337344300486426e-06, + "loss": 0.1921, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08556917309761047, + "step": 10795, + "valid_targets_mean": 3492.8, + "valid_targets_min": 637 + }, + { + "epoch": 5.657412257726558, + "grad_norm": 0.7495367417437739, + "learning_rate": 4.3211127500290396e-06, + "loss": 0.189, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09711206704378128, + "step": 10800, + "valid_targets_mean": 3412.5, + "valid_targets_min": 719 + }, + { + "epoch": 5.6600314300680985, + "grad_norm": 0.6042811234142205, + "learning_rate": 4.3049079488783584e-06, + "loss": 0.1942, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08225598931312561, + "step": 10805, + "valid_targets_mean": 4227.4, + "valid_targets_min": 2182 + }, + { + "epoch": 5.662650602409639, + "grad_norm": 0.6598304132631697, + "learning_rate": 4.288729924680935e-06, + "loss": 0.1822, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08877980709075928, + "step": 10810, + "valid_targets_mean": 3211.1, + "valid_targets_min": 1372 + }, + { + "epoch": 5.665269774751179, + "grad_norm": 0.6929454788075643, + "learning_rate": 4.272578705037638e-06, + "loss": 0.1838, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11478810012340546, + "step": 10815, + "valid_targets_mean": 4490.9, + "valid_targets_min": 2594 + }, + { + "epoch": 5.6678889470927185, + "grad_norm": 0.6365936711525688, + "learning_rate": 4.256454317503611e-06, + "loss": 0.1881, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08295011520385742, + "step": 10820, + "valid_targets_mean": 3054.6, + "valid_targets_min": 530 + }, + { + "epoch": 5.670508119434259, + "grad_norm": 0.6655384406299206, + "learning_rate": 4.240356789588207e-06, + "loss": 0.1903, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1293245553970337, + "step": 10825, + "valid_targets_mean": 4110.2, + "valid_targets_min": 611 + }, + { + "epoch": 5.673127291775799, + "grad_norm": 0.7562332468745507, + "learning_rate": 4.22428614875497e-06, + "loss": 0.1888, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10113480687141418, + "step": 10830, + "valid_targets_mean": 3804.2, + "valid_targets_min": 1987 + }, + { + "epoch": 5.6757464641173385, + "grad_norm": 0.7150061744982886, + "learning_rate": 4.208242422421567e-06, + "loss": 0.1904, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09328234195709229, + "step": 10835, + "valid_targets_mean": 3203.2, + "valid_targets_min": 1362 + }, + { + "epoch": 5.678365636458879, + "grad_norm": 0.602777121567536, + "learning_rate": 4.192225637959743e-06, + "loss": 0.1924, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.090776726603508, + "step": 10840, + "valid_targets_mean": 3245.1, + "valid_targets_min": 852 + }, + { + "epoch": 5.680984808800419, + "grad_norm": 0.6780464690155531, + "learning_rate": 4.176235822695285e-06, + "loss": 0.1886, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07259844988584518, + "step": 10845, + "valid_targets_mean": 2537.4, + "valid_targets_min": 1195 + }, + { + "epoch": 5.683603981141959, + "grad_norm": 0.7248873902463573, + "learning_rate": 4.1602730039079645e-06, + "loss": 0.1928, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10924700647592545, + "step": 10850, + "valid_targets_mean": 4383.0, + "valid_targets_min": 1397 + }, + { + "epoch": 5.686223153483499, + "grad_norm": 0.6970237986287124, + "learning_rate": 4.144337208831499e-06, + "loss": 0.1858, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07984375953674316, + "step": 10855, + "valid_targets_mean": 3421.0, + "valid_targets_min": 1975 + }, + { + "epoch": 5.688842325825039, + "grad_norm": 0.6622949330317035, + "learning_rate": 4.128428464653484e-06, + "loss": 0.1755, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09665311127901077, + "step": 10860, + "valid_targets_mean": 4100.6, + "valid_targets_min": 2564 + }, + { + "epoch": 5.691461498166579, + "grad_norm": 0.5573716439983707, + "learning_rate": 4.112546798515402e-06, + "loss": 0.1862, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08861871808767319, + "step": 10865, + "valid_targets_mean": 4986.9, + "valid_targets_min": 2595 + }, + { + "epoch": 5.69408067050812, + "grad_norm": 0.6361048862555745, + "learning_rate": 4.0966922375124894e-06, + "loss": 0.1855, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10304940491914749, + "step": 10870, + "valid_targets_mean": 3992.9, + "valid_targets_min": 2845 + }, + { + "epoch": 5.696699842849659, + "grad_norm": 0.6974644732997708, + "learning_rate": 4.080864808693787e-06, + "loss": 0.1796, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06854330003261566, + "step": 10875, + "valid_targets_mean": 2390.1, + "valid_targets_min": 993 + }, + { + "epoch": 5.699319015191199, + "grad_norm": 0.6106160850582569, + "learning_rate": 4.0650645390620135e-06, + "loss": 0.1731, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07218549400568008, + "step": 10880, + "valid_targets_mean": 3729.1, + "valid_targets_min": 1575 + }, + { + "epoch": 5.70193818753274, + "grad_norm": 0.6832198918686105, + "learning_rate": 4.049291455573561e-06, + "loss": 0.1807, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09670407325029373, + "step": 10885, + "valid_targets_mean": 3469.0, + "valid_targets_min": 1360 + }, + { + "epoch": 5.70455735987428, + "grad_norm": 0.6375939367279172, + "learning_rate": 4.033545585138445e-06, + "loss": 0.1801, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08804913610219955, + "step": 10890, + "valid_targets_mean": 3555.5, + "valid_targets_min": 2278 + }, + { + "epoch": 5.707176532215819, + "grad_norm": 0.6613298545136447, + "learning_rate": 4.01782695462025e-06, + "loss": 0.197, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10436461865901947, + "step": 10895, + "valid_targets_mean": 3812.2, + "valid_targets_min": 1454 + }, + { + "epoch": 5.70979570455736, + "grad_norm": 0.6612294096053106, + "learning_rate": 4.002135590836089e-06, + "loss": 0.1821, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09107402712106705, + "step": 10900, + "valid_targets_mean": 3796.6, + "valid_targets_min": 2344 + }, + { + "epoch": 5.7124148768989, + "grad_norm": 0.7213039975427157, + "learning_rate": 3.986471520556552e-06, + "loss": 0.1841, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09840808808803558, + "step": 10905, + "valid_targets_mean": 3324.1, + "valid_targets_min": 1278 + }, + { + "epoch": 5.71503404924044, + "grad_norm": 0.7352845265339429, + "learning_rate": 3.9708347705056675e-06, + "loss": 0.1742, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09732574224472046, + "step": 10910, + "valid_targets_mean": 3381.4, + "valid_targets_min": 1858 + }, + { + "epoch": 5.71765322158198, + "grad_norm": 0.6978698405212208, + "learning_rate": 3.95522536736086e-06, + "loss": 0.1836, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07258081436157227, + "step": 10915, + "valid_targets_mean": 2566.0, + "valid_targets_min": 420 + }, + { + "epoch": 5.72027239392352, + "grad_norm": 0.9922074600950967, + "learning_rate": 3.9396433377528746e-06, + "loss": 0.185, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08637166023254395, + "step": 10920, + "valid_targets_mean": 2649.4, + "valid_targets_min": 1039 + }, + { + "epoch": 5.72289156626506, + "grad_norm": 0.6583115136938968, + "learning_rate": 3.924088708265792e-06, + "loss": 0.1898, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08856631070375443, + "step": 10925, + "valid_targets_mean": 4475.1, + "valid_targets_min": 1737 + }, + { + "epoch": 5.725510738606601, + "grad_norm": 0.6787761111080356, + "learning_rate": 3.908561505436905e-06, + "loss": 0.1847, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11043144762516022, + "step": 10930, + "valid_targets_mean": 4150.8, + "valid_targets_min": 809 + }, + { + "epoch": 5.72812991094814, + "grad_norm": 0.6197335955768134, + "learning_rate": 3.89306175575676e-06, + "loss": 0.1829, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08951283246278763, + "step": 10935, + "valid_targets_mean": 3864.1, + "valid_targets_min": 1780 + }, + { + "epoch": 5.73074908328968, + "grad_norm": 0.5999510307672616, + "learning_rate": 3.8775894856690245e-06, + "loss": 0.1901, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08658986538648605, + "step": 10940, + "valid_targets_mean": 4058.0, + "valid_targets_min": 2185 + }, + { + "epoch": 5.733368255631221, + "grad_norm": 0.4682407816392999, + "learning_rate": 3.862144721570504e-06, + "loss": 0.1553, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04221086576581001, + "step": 10945, + "valid_targets_mean": 2736.0, + "valid_targets_min": 876 + }, + { + "epoch": 5.735987427972761, + "grad_norm": 0.547156207816398, + "learning_rate": 3.84672748981108e-06, + "loss": 0.0959, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03678930923342705, + "step": 10950, + "valid_targets_mean": 1472.5, + "valid_targets_min": 324 + }, + { + "epoch": 5.7386066003143, + "grad_norm": 0.3865703266841375, + "learning_rate": 3.83133781669365e-06, + "loss": 0.0739, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04523061215877533, + "step": 10955, + "valid_targets_mean": 2699.9, + "valid_targets_min": 1064 + }, + { + "epoch": 5.741225772655841, + "grad_norm": 0.40660624020334646, + "learning_rate": 3.815975728474106e-06, + "loss": 0.0732, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03883367404341698, + "step": 10960, + "valid_targets_mean": 3137.0, + "valid_targets_min": 710 + }, + { + "epoch": 5.743844944997381, + "grad_norm": 0.32419841244438224, + "learning_rate": 3.800641251361268e-06, + "loss": 0.0863, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.02795051783323288, + "step": 10965, + "valid_targets_mean": 3472.9, + "valid_targets_min": 1223 + }, + { + "epoch": 5.746464117338921, + "grad_norm": 0.39505777994688596, + "learning_rate": 3.7853344115168633e-06, + "loss": 0.0739, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04061180725693703, + "step": 10970, + "valid_targets_mean": 3326.0, + "valid_targets_min": 1431 + }, + { + "epoch": 5.749083289680461, + "grad_norm": 0.7389516836791228, + "learning_rate": 3.7700552350554477e-06, + "loss": 0.1073, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04988997429609299, + "step": 10975, + "valid_targets_mean": 1161.2, + "valid_targets_min": 559 + }, + { + "epoch": 5.751702462022001, + "grad_norm": 0.37442300106849613, + "learning_rate": 3.7548037480443977e-06, + "loss": 0.1001, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.037189219146966934, + "step": 10980, + "valid_targets_mean": 3598.2, + "valid_targets_min": 1623 + }, + { + "epoch": 5.754321634363541, + "grad_norm": 0.42154321075664153, + "learning_rate": 3.7395799765038422e-06, + "loss": 0.0834, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.043459370732307434, + "step": 10985, + "valid_targets_mean": 3178.2, + "valid_targets_min": 846 + }, + { + "epoch": 5.756940806705082, + "grad_norm": 0.4928263714664533, + "learning_rate": 3.724383946406631e-06, + "loss": 0.119, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0836353674530983, + "step": 10990, + "valid_targets_mean": 3622.6, + "valid_targets_min": 1949 + }, + { + "epoch": 5.759559979046621, + "grad_norm": 0.3711070967607157, + "learning_rate": 3.709215683678282e-06, + "loss": 0.0608, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03476902097463608, + "step": 10995, + "valid_targets_mean": 3344.9, + "valid_targets_min": 764 + }, + { + "epoch": 5.762179151388161, + "grad_norm": 0.4475362921935387, + "learning_rate": 3.6940752141969415e-06, + "loss": 0.0734, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.041336361318826675, + "step": 11000, + "valid_targets_mean": 2391.6, + "valid_targets_min": 776 + }, + { + "epoch": 5.764798323729702, + "grad_norm": 0.38741715814397437, + "learning_rate": 3.678962563793325e-06, + "loss": 0.0753, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04356415197253227, + "step": 11005, + "valid_targets_mean": 2818.5, + "valid_targets_min": 754 + }, + { + "epoch": 5.767417496071241, + "grad_norm": 0.5117880596971838, + "learning_rate": 3.6638777582507177e-06, + "loss": 0.0927, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.047148026525974274, + "step": 11010, + "valid_targets_mean": 1646.6, + "valid_targets_min": 635 + }, + { + "epoch": 5.770036668412781, + "grad_norm": 0.41930356078044206, + "learning_rate": 3.6488208233048594e-06, + "loss": 0.0875, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03821966052055359, + "step": 11015, + "valid_targets_mean": 3374.8, + "valid_targets_min": 1862 + }, + { + "epoch": 5.772655840754322, + "grad_norm": 0.43534620045705974, + "learning_rate": 3.6337917846439806e-06, + "loss": 0.0737, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04205740988254547, + "step": 11020, + "valid_targets_mean": 2837.4, + "valid_targets_min": 574 + }, + { + "epoch": 5.775275013095862, + "grad_norm": 0.5249942594507854, + "learning_rate": 3.6187906679086827e-06, + "loss": 0.0705, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03166569769382477, + "step": 11025, + "valid_targets_mean": 2618.4, + "valid_targets_min": 523 + }, + { + "epoch": 5.777894185437402, + "grad_norm": 0.4626425302288907, + "learning_rate": 3.603817498691966e-06, + "loss": 0.0738, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04045230522751808, + "step": 11030, + "valid_targets_mean": 3548.9, + "valid_targets_min": 2189 + }, + { + "epoch": 5.780513357778942, + "grad_norm": 0.37052238295789225, + "learning_rate": 3.588872302539117e-06, + "loss": 0.0775, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.02780608832836151, + "step": 11035, + "valid_targets_mean": 3564.6, + "valid_targets_min": 827 + }, + { + "epoch": 5.783132530120482, + "grad_norm": 0.4707983746182179, + "learning_rate": 3.5739551049477174e-06, + "loss": 0.088, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04321026802062988, + "step": 11040, + "valid_targets_mean": 1936.6, + "valid_targets_min": 597 + }, + { + "epoch": 5.785751702462022, + "grad_norm": 0.5187164571096663, + "learning_rate": 3.5590659313675735e-06, + "loss": 0.0821, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03667140007019043, + "step": 11045, + "valid_targets_mean": 1747.5, + "valid_targets_min": 701 + }, + { + "epoch": 5.788370874803562, + "grad_norm": 0.5938730178938206, + "learning_rate": 3.5442048072006884e-06, + "loss": 0.1082, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10945126414299011, + "step": 11050, + "valid_targets_mean": 3329.6, + "valid_targets_min": 1652 + }, + { + "epoch": 5.790990047145102, + "grad_norm": 0.4288560923289433, + "learning_rate": 3.5293717578012055e-06, + "loss": 0.087, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.034772470593452454, + "step": 11055, + "valid_targets_mean": 3117.1, + "valid_targets_min": 786 + }, + { + "epoch": 5.793609219486642, + "grad_norm": 0.5250971863597397, + "learning_rate": 3.514566808475375e-06, + "loss": 0.0725, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04586917161941528, + "step": 11060, + "valid_targets_mean": 2574.4, + "valid_targets_min": 971 + }, + { + "epoch": 5.7962283918281825, + "grad_norm": 0.4121152028658852, + "learning_rate": 3.4997899844814874e-06, + "loss": 0.1037, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03905129432678223, + "step": 11065, + "valid_targets_mean": 3320.0, + "valid_targets_min": 2610 + }, + { + "epoch": 5.798847564169723, + "grad_norm": 0.4432979042499083, + "learning_rate": 3.4850413110298864e-06, + "loss": 0.0886, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.02789444476366043, + "step": 11070, + "valid_targets_mean": 2580.6, + "valid_targets_min": 753 + }, + { + "epoch": 5.801466736511262, + "grad_norm": 0.5486777703978877, + "learning_rate": 3.470320813282848e-06, + "loss": 0.0802, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03787270560860634, + "step": 11075, + "valid_targets_mean": 1537.1, + "valid_targets_min": 619 + }, + { + "epoch": 5.8040859088528025, + "grad_norm": 0.593247965443131, + "learning_rate": 3.4556285163546143e-06, + "loss": 0.2632, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10560999810695648, + "step": 11080, + "valid_targets_mean": 2271.2, + "valid_targets_min": 987 + }, + { + "epoch": 5.806705081194343, + "grad_norm": 0.605181929270286, + "learning_rate": 3.4409644453112857e-06, + "loss": 0.0934, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04537982866168022, + "step": 11085, + "valid_targets_mean": 1351.5, + "valid_targets_min": 329 + }, + { + "epoch": 5.809324253535882, + "grad_norm": 0.5073357781037506, + "learning_rate": 3.426328625170823e-06, + "loss": 0.0821, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03772849217057228, + "step": 11090, + "valid_targets_mean": 1553.9, + "valid_targets_min": 608 + }, + { + "epoch": 5.8119434258774225, + "grad_norm": 0.49130373857608134, + "learning_rate": 3.4117210809029876e-06, + "loss": 0.1719, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04965986683964729, + "step": 11095, + "valid_targets_mean": 3645.6, + "valid_targets_min": 873 + }, + { + "epoch": 5.814562598218963, + "grad_norm": 0.30933644359373974, + "learning_rate": 3.3971418374292963e-06, + "loss": 0.0707, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.02171337977051735, + "step": 11100, + "valid_targets_mean": 4720.6, + "valid_targets_min": 3529 + }, + { + "epoch": 5.817181770560503, + "grad_norm": 0.45661785074403527, + "learning_rate": 3.3825909196229858e-06, + "loss": 0.0842, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04527841880917549, + "step": 11105, + "valid_targets_mean": 4437.6, + "valid_targets_min": 2336 + }, + { + "epoch": 5.819800942902043, + "grad_norm": 0.42559521589327926, + "learning_rate": 3.3680683523089662e-06, + "loss": 0.0775, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03421613574028015, + "step": 11110, + "valid_targets_mean": 3533.1, + "valid_targets_min": 1226 + }, + { + "epoch": 5.822420115243583, + "grad_norm": 0.4042524258233285, + "learning_rate": 3.353574160263784e-06, + "loss": 0.0726, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03365694358944893, + "step": 11115, + "valid_targets_mean": 3299.2, + "valid_targets_min": 798 + }, + { + "epoch": 5.825039287585123, + "grad_norm": 0.43669496834047056, + "learning_rate": 3.33910836821556e-06, + "loss": 0.0711, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03029424138367176, + "step": 11120, + "valid_targets_mean": 1836.9, + "valid_targets_min": 723 + }, + { + "epoch": 5.827658459926663, + "grad_norm": 0.43820954403937185, + "learning_rate": 3.3246710008439777e-06, + "loss": 0.0705, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03753548488020897, + "step": 11125, + "valid_targets_mean": 3316.0, + "valid_targets_min": 898 + }, + { + "epoch": 5.830277632268203, + "grad_norm": 0.3244610135700791, + "learning_rate": 3.3102620827802247e-06, + "loss": 0.0687, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.026321982964873314, + "step": 11130, + "valid_targets_mean": 4027.2, + "valid_targets_min": 3278 + }, + { + "epoch": 5.832896804609743, + "grad_norm": 0.49542063669645076, + "learning_rate": 3.295881638606948e-06, + "loss": 0.0711, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03268700838088989, + "step": 11135, + "valid_targets_mean": 2052.8, + "valid_targets_min": 739 + }, + { + "epoch": 5.835515976951283, + "grad_norm": 0.5033031868779394, + "learning_rate": 3.2815296928582163e-06, + "loss": 0.1023, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03714592009782791, + "step": 11140, + "valid_targets_mean": 1574.9, + "valid_targets_min": 538 + }, + { + "epoch": 5.838135149292824, + "grad_norm": 0.37289485687861634, + "learning_rate": 3.267206270019481e-06, + "loss": 0.0582, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0287267304956913, + "step": 11145, + "valid_targets_mean": 1956.9, + "valid_targets_min": 654 + }, + { + "epoch": 5.840754321634364, + "grad_norm": 0.4629461873322304, + "learning_rate": 3.252911394527527e-06, + "loss": 0.0707, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04151737689971924, + "step": 11150, + "valid_targets_mean": 2735.4, + "valid_targets_min": 930 + }, + { + "epoch": 5.843373493975903, + "grad_norm": 0.4710233917879916, + "learning_rate": 3.2386450907704426e-06, + "loss": 0.064, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03753400593996048, + "step": 11155, + "valid_targets_mean": 2965.0, + "valid_targets_min": 684 + }, + { + "epoch": 5.845992666317444, + "grad_norm": 0.43800059549274245, + "learning_rate": 3.2244073830875512e-06, + "loss": 0.1078, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03819188103079796, + "step": 11160, + "valid_targets_mean": 3344.6, + "valid_targets_min": 999 + }, + { + "epoch": 5.848611838658984, + "grad_norm": 0.5721017706752082, + "learning_rate": 3.2101982957694244e-06, + "loss": 0.0856, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04740625619888306, + "step": 11165, + "valid_targets_mean": 2445.4, + "valid_targets_min": 696 + }, + { + "epoch": 5.8512310110005235, + "grad_norm": 0.4113218661338274, + "learning_rate": 3.1960178530577645e-06, + "loss": 0.0885, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.037107281386852264, + "step": 11170, + "valid_targets_mean": 3514.9, + "valid_targets_min": 1068 + }, + { + "epoch": 5.853850183342064, + "grad_norm": 0.49946959668671437, + "learning_rate": 3.181866079145446e-06, + "loss": 0.0747, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0346212312579155, + "step": 11175, + "valid_targets_mean": 1602.8, + "valid_targets_min": 536 + }, + { + "epoch": 5.856469355683604, + "grad_norm": 0.5657946144647372, + "learning_rate": 3.167742998176391e-06, + "loss": 0.1159, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09299509227275848, + "step": 11180, + "valid_targets_mean": 3568.8, + "valid_targets_min": 1507 + }, + { + "epoch": 5.859088528025144, + "grad_norm": 0.47555773468925827, + "learning_rate": 3.1536486342455987e-06, + "loss": 0.0839, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.041637204587459564, + "step": 11185, + "valid_targets_mean": 3292.2, + "valid_targets_min": 2342 + }, + { + "epoch": 5.861707700366684, + "grad_norm": 0.6132193893444337, + "learning_rate": 3.1395830113990633e-06, + "loss": 0.1023, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0404975600540638, + "step": 11190, + "valid_targets_mean": 1567.5, + "valid_targets_min": 687 + }, + { + "epoch": 5.864326872708224, + "grad_norm": 0.6062733694551393, + "learning_rate": 3.125546153633747e-06, + "loss": 0.0697, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.026830414310097694, + "step": 11195, + "valid_targets_mean": 1145.4, + "valid_targets_min": 449 + }, + { + "epoch": 5.866946045049764, + "grad_norm": 0.3731457384576194, + "learning_rate": 3.1115380848975363e-06, + "loss": 0.0772, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.030195914208889008, + "step": 11200, + "valid_targets_mean": 3191.0, + "valid_targets_min": 658 + }, + { + "epoch": 5.869565217391305, + "grad_norm": 0.6184036320128709, + "learning_rate": 3.0975588290892e-06, + "loss": 0.0827, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.043835822492837906, + "step": 11205, + "valid_targets_mean": 1924.8, + "valid_targets_min": 577 + }, + { + "epoch": 5.872184389732844, + "grad_norm": 0.3683210417331091, + "learning_rate": 3.083608410058356e-06, + "loss": 0.0651, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03257773816585541, + "step": 11210, + "valid_targets_mean": 3992.5, + "valid_targets_min": 726 + }, + { + "epoch": 5.874803562074384, + "grad_norm": 0.4266228733303925, + "learning_rate": 3.06968685160542e-06, + "loss": 0.0641, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03843538835644722, + "step": 11215, + "valid_targets_mean": 3626.4, + "valid_targets_min": 2252 + }, + { + "epoch": 5.877422734415925, + "grad_norm": 0.459369175896622, + "learning_rate": 3.055794177481559e-06, + "loss": 0.0716, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.02921932563185692, + "step": 11220, + "valid_targets_mean": 1556.2, + "valid_targets_min": 531 + }, + { + "epoch": 5.880041906757465, + "grad_norm": 0.5033875693245169, + "learning_rate": 3.0419304113886894e-06, + "loss": 0.0885, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.037124909460544586, + "step": 11225, + "valid_targets_mean": 2410.5, + "valid_targets_min": 744 + }, + { + "epoch": 5.882661079099004, + "grad_norm": 0.4929635596819927, + "learning_rate": 3.028095576979375e-06, + "loss": 0.0848, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04303295165300369, + "step": 11230, + "valid_targets_mean": 3795.1, + "valid_targets_min": 3136 + }, + { + "epoch": 5.885280251440545, + "grad_norm": 0.34164401492577223, + "learning_rate": 3.014289697856845e-06, + "loss": 0.0721, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0300001110881567, + "step": 11235, + "valid_targets_mean": 3324.4, + "valid_targets_min": 2366 + }, + { + "epoch": 5.887899423782085, + "grad_norm": 0.4084330205871245, + "learning_rate": 3.000512797574917e-06, + "loss": 0.0692, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.02712399885058403, + "step": 11240, + "valid_targets_mean": 1668.1, + "valid_targets_min": 669 + }, + { + "epoch": 5.890518596123625, + "grad_norm": 0.5342207638177974, + "learning_rate": 2.9867648996379706e-06, + "loss": 0.0855, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0455302894115448, + "step": 11245, + "valid_targets_mean": 3529.8, + "valid_targets_min": 1785 + }, + { + "epoch": 5.893137768465165, + "grad_norm": 0.34233018289648487, + "learning_rate": 2.973046027500912e-06, + "loss": 0.06, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03136247768998146, + "step": 11250, + "valid_targets_mean": 4120.1, + "valid_targets_min": 3862 + }, + { + "epoch": 5.895756940806705, + "grad_norm": 0.42123279871969677, + "learning_rate": 2.9593562045691104e-06, + "loss": 0.0742, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03143005073070526, + "step": 11255, + "valid_targets_mean": 3062.2, + "valid_targets_min": 539 + }, + { + "epoch": 5.898376113148245, + "grad_norm": 0.43786853410663623, + "learning_rate": 2.9456954541983982e-06, + "loss": 0.0754, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.029972806572914124, + "step": 11260, + "valid_targets_mean": 2781.5, + "valid_targets_min": 1016 + }, + { + "epoch": 5.900995285489786, + "grad_norm": 0.7461927569998023, + "learning_rate": 2.932063799694984e-06, + "loss": 0.086, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04962751269340515, + "step": 11265, + "valid_targets_mean": 1102.9, + "valid_targets_min": 888 + }, + { + "epoch": 5.903614457831325, + "grad_norm": 0.5102448970842115, + "learning_rate": 2.918461264315462e-06, + "loss": 0.0777, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.028521444648504257, + "step": 11270, + "valid_targets_mean": 2602.5, + "valid_targets_min": 697 + }, + { + "epoch": 5.906233630172865, + "grad_norm": 0.6825464712654099, + "learning_rate": 2.904887871266724e-06, + "loss": 0.0742, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.047726817429065704, + "step": 11275, + "valid_targets_mean": 1592.9, + "valid_targets_min": 605 + }, + { + "epoch": 5.908852802514406, + "grad_norm": 0.3946021142719126, + "learning_rate": 2.8913436437059526e-06, + "loss": 0.0759, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.030810732394456863, + "step": 11280, + "valid_targets_mean": 2899.1, + "valid_targets_min": 1117 + }, + { + "epoch": 5.911471974855946, + "grad_norm": 0.43552867821377794, + "learning_rate": 2.8778286047405755e-06, + "loss": 0.096, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.034283559769392014, + "step": 11285, + "valid_targets_mean": 3376.6, + "valid_targets_min": 1388 + }, + { + "epoch": 5.914091147197485, + "grad_norm": 0.43670750851172746, + "learning_rate": 2.8643427774282174e-06, + "loss": 0.0748, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.032360583543777466, + "step": 11290, + "valid_targets_mean": 3243.4, + "valid_targets_min": 524 + }, + { + "epoch": 5.916710319539026, + "grad_norm": 0.480477215537576, + "learning_rate": 2.8508861847766665e-06, + "loss": 0.0655, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03470785170793533, + "step": 11295, + "valid_targets_mean": 2468.0, + "valid_targets_min": 970 + }, + { + "epoch": 5.919329491880566, + "grad_norm": 0.5347638590624609, + "learning_rate": 2.8374588497438415e-06, + "loss": 0.0859, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03941023349761963, + "step": 11300, + "valid_targets_mean": 2959.6, + "valid_targets_min": 877 + }, + { + "epoch": 5.921948664222106, + "grad_norm": 0.39492224392015796, + "learning_rate": 2.8240607952377265e-06, + "loss": 0.0801, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.029691524803638458, + "step": 11305, + "valid_targets_mean": 3886.5, + "valid_targets_min": 3251 + }, + { + "epoch": 5.924567836563646, + "grad_norm": 0.5711688477381672, + "learning_rate": 2.810692044116381e-06, + "loss": 0.063, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0402698814868927, + "step": 11310, + "valid_targets_mean": 2695.6, + "valid_targets_min": 564 + }, + { + "epoch": 5.927187008905186, + "grad_norm": 0.39760929628729696, + "learning_rate": 2.797352619187834e-06, + "loss": 0.0721, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03923739492893219, + "step": 11315, + "valid_targets_mean": 4404.8, + "valid_targets_min": 2555 + }, + { + "epoch": 5.929806181246726, + "grad_norm": 0.3715878331665758, + "learning_rate": 2.7840425432101237e-06, + "loss": 0.0646, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03085777349770069, + "step": 11320, + "valid_targets_mean": 4410.5, + "valid_targets_min": 3261 + }, + { + "epoch": 5.9324253535882665, + "grad_norm": 0.4504797890028626, + "learning_rate": 2.7707618388911715e-06, + "loss": 0.0589, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.024951647967100143, + "step": 11325, + "valid_targets_mean": 1768.5, + "valid_targets_min": 618 + }, + { + "epoch": 5.935044525929806, + "grad_norm": 0.3407615967389443, + "learning_rate": 2.757510528888836e-06, + "loss": 0.0818, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.033380474895238876, + "step": 11330, + "valid_targets_mean": 3985.8, + "valid_targets_min": 3213 + }, + { + "epoch": 5.937663698271346, + "grad_norm": 0.38157658006958145, + "learning_rate": 2.7442886358107834e-06, + "loss": 0.0765, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08153171092271805, + "step": 11335, + "valid_targets_mean": 3149.1, + "valid_targets_min": 1539 + }, + { + "epoch": 5.9402828706128865, + "grad_norm": 0.3566791419158281, + "learning_rate": 2.731096182214521e-06, + "loss": 0.0842, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.026738319545984268, + "step": 11340, + "valid_targets_mean": 2094.8, + "valid_targets_min": 509 + }, + { + "epoch": 5.942902042954426, + "grad_norm": 0.34299001263736395, + "learning_rate": 2.717933190607318e-06, + "loss": 0.0804, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.01958930492401123, + "step": 11345, + "valid_targets_mean": 2441.4, + "valid_targets_min": 633 + }, + { + "epoch": 5.945521215295966, + "grad_norm": 0.45419186364997993, + "learning_rate": 2.704799683446184e-06, + "loss": 0.0931, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.035698674619197845, + "step": 11350, + "valid_targets_mean": 2740.9, + "valid_targets_min": 737 + }, + { + "epoch": 5.9481403876375065, + "grad_norm": 0.3987062350948198, + "learning_rate": 2.691695683137827e-06, + "loss": 0.0628, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03007950820028782, + "step": 11355, + "valid_targets_mean": 2726.9, + "valid_targets_min": 492 + }, + { + "epoch": 5.950759559979047, + "grad_norm": 0.6154943388101383, + "learning_rate": 2.6786212120386124e-06, + "loss": 0.0802, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04654261842370033, + "step": 11360, + "valid_targets_mean": 1607.9, + "valid_targets_min": 833 + }, + { + "epoch": 5.953378732320587, + "grad_norm": 0.35676724141161104, + "learning_rate": 2.665576292454519e-06, + "loss": 0.0656, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.02375321462750435, + "step": 11365, + "valid_targets_mean": 3502.6, + "valid_targets_min": 923 + }, + { + "epoch": 5.9559979046621265, + "grad_norm": 0.7459787971829334, + "learning_rate": 2.6525609466411207e-06, + "loss": 0.1035, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.051826655864715576, + "step": 11370, + "valid_targets_mean": 1553.9, + "valid_targets_min": 531 + }, + { + "epoch": 5.958617077003667, + "grad_norm": 0.5310568093938065, + "learning_rate": 2.6395751968035322e-06, + "loss": 0.0979, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06401866674423218, + "step": 11375, + "valid_targets_mean": 1825.6, + "valid_targets_min": 575 + }, + { + "epoch": 5.961236249345207, + "grad_norm": 0.4782124189664576, + "learning_rate": 2.6266190650963695e-06, + "loss": 0.0716, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.038485944271087646, + "step": 11380, + "valid_targets_mean": 3701.9, + "valid_targets_min": 2784 + }, + { + "epoch": 5.9638554216867465, + "grad_norm": 0.4087593790616926, + "learning_rate": 2.6136925736237294e-06, + "loss": 0.0699, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03156688064336777, + "step": 11385, + "valid_targets_mean": 3575.8, + "valid_targets_min": 2525 + }, + { + "epoch": 5.966474594028287, + "grad_norm": 0.39190323540721084, + "learning_rate": 2.6007957444391285e-06, + "loss": 0.0683, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0255313441157341, + "step": 11390, + "valid_targets_mean": 3081.0, + "valid_targets_min": 970 + }, + { + "epoch": 5.969093766369827, + "grad_norm": 0.51699522650557, + "learning_rate": 2.5879285995454904e-06, + "loss": 0.0641, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.031044133007526398, + "step": 11395, + "valid_targets_mean": 1963.5, + "valid_targets_min": 817 + }, + { + "epoch": 5.971712938711367, + "grad_norm": 0.8952837747705978, + "learning_rate": 2.5750911608950756e-06, + "loss": 0.0837, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05980469286441803, + "step": 11400, + "valid_targets_mean": 1270.9, + "valid_targets_min": 637 + }, + { + "epoch": 5.974332111052908, + "grad_norm": 0.4099808057463521, + "learning_rate": 2.562283450389489e-06, + "loss": 0.0621, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03177203610539436, + "step": 11405, + "valid_targets_mean": 2594.1, + "valid_targets_min": 893 + }, + { + "epoch": 5.976951283394447, + "grad_norm": 0.40631750093059726, + "learning_rate": 2.549505489879589e-06, + "loss": 0.0653, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.028754254803061485, + "step": 11410, + "valid_targets_mean": 3222.2, + "valid_targets_min": 1606 + }, + { + "epoch": 5.9795704557359874, + "grad_norm": 0.5522428400424914, + "learning_rate": 2.536757301165511e-06, + "loss": 0.0671, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.028628377243876457, + "step": 11415, + "valid_targets_mean": 3023.8, + "valid_targets_min": 678 + }, + { + "epoch": 5.982189628077528, + "grad_norm": 0.3924448115671155, + "learning_rate": 2.5240389059965642e-06, + "loss": 0.0753, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03105129860341549, + "step": 11420, + "valid_targets_mean": 4263.8, + "valid_targets_min": 1078 + }, + { + "epoch": 5.984808800419067, + "grad_norm": 0.38690813940980917, + "learning_rate": 2.5113503260712514e-06, + "loss": 0.0648, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03710411116480827, + "step": 11425, + "valid_targets_mean": 4150.0, + "valid_targets_min": 761 + }, + { + "epoch": 5.9874279727606075, + "grad_norm": 0.4826422485215377, + "learning_rate": 2.498691583037196e-06, + "loss": 0.0695, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0368012934923172, + "step": 11430, + "valid_targets_mean": 1368.4, + "valid_targets_min": 538 + }, + { + "epoch": 5.990047145102148, + "grad_norm": 0.519782763564192, + "learning_rate": 2.486062698491125e-06, + "loss": 0.0867, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07773230969905853, + "step": 11435, + "valid_targets_mean": 2630.4, + "valid_targets_min": 780 + }, + { + "epoch": 5.992666317443688, + "grad_norm": 0.37054664090641287, + "learning_rate": 2.4734636939788216e-06, + "loss": 0.1409, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.030455132946372032, + "step": 11440, + "valid_targets_mean": 3353.9, + "valid_targets_min": 2347 + }, + { + "epoch": 5.995285489785228, + "grad_norm": 0.4400819327957686, + "learning_rate": 2.460894590995091e-06, + "loss": 0.0703, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04020780324935913, + "step": 11445, + "valid_targets_mean": 3880.2, + "valid_targets_min": 2473 + }, + { + "epoch": 5.997904662126768, + "grad_norm": 0.3963239425973607, + "learning_rate": 2.448355410983723e-06, + "loss": 0.0676, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03425648808479309, + "step": 11450, + "valid_targets_mean": 3556.4, + "valid_targets_min": 2245 + }, + { + "epoch": 6.000523834468308, + "grad_norm": 0.9180097151052058, + "learning_rate": 2.4358461753374663e-06, + "loss": 0.1123, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07151223719120026, + "step": 11455, + "valid_targets_mean": 1492.2, + "valid_targets_min": 544 + }, + { + "epoch": 6.003143006809848, + "grad_norm": 0.9599880015008919, + "learning_rate": 2.423366905397957e-06, + "loss": 0.1487, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06720415502786636, + "step": 11460, + "valid_targets_mean": 1270.4, + "valid_targets_min": 632 + }, + { + "epoch": 6.005762179151388, + "grad_norm": 1.1052017481465797, + "learning_rate": 2.4109176224557463e-06, + "loss": 0.1315, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.055264897644519806, + "step": 11465, + "valid_targets_mean": 1358.4, + "valid_targets_min": 753 + }, + { + "epoch": 6.008381351492928, + "grad_norm": 0.9280327830610237, + "learning_rate": 2.3984983477501866e-06, + "loss": 0.1336, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07304681837558746, + "step": 11470, + "valid_targets_mean": 1413.0, + "valid_targets_min": 701 + }, + { + "epoch": 6.011000523834468, + "grad_norm": 0.8440440917837605, + "learning_rate": 2.3861091024694673e-06, + "loss": 0.1224, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07937653362751007, + "step": 11475, + "valid_targets_mean": 1745.6, + "valid_targets_min": 754 + }, + { + "epoch": 6.013619696176009, + "grad_norm": 0.7769512330057519, + "learning_rate": 2.373749907750518e-06, + "loss": 0.1288, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06396303325891495, + "step": 11480, + "valid_targets_mean": 1337.9, + "valid_targets_min": 746 + }, + { + "epoch": 6.016238868517548, + "grad_norm": 0.764887720106359, + "learning_rate": 2.361420784679016e-06, + "loss": 0.1312, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06879110634326935, + "step": 11485, + "valid_targets_mean": 1728.8, + "valid_targets_min": 970 + }, + { + "epoch": 6.018858040859088, + "grad_norm": 0.8047908910618264, + "learning_rate": 2.3491217542893274e-06, + "loss": 0.116, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06783033907413483, + "step": 11490, + "valid_targets_mean": 1569.5, + "valid_targets_min": 648 + }, + { + "epoch": 6.021477213200629, + "grad_norm": 0.8550912758160515, + "learning_rate": 2.336852837564485e-06, + "loss": 0.1379, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07583297789096832, + "step": 11495, + "valid_targets_mean": 1538.8, + "valid_targets_min": 727 + }, + { + "epoch": 6.024096385542169, + "grad_norm": 0.7113626689321407, + "learning_rate": 2.3246140554361385e-06, + "loss": 0.1209, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04935118556022644, + "step": 11500, + "valid_targets_mean": 1519.5, + "valid_targets_min": 788 + }, + { + "epoch": 6.026715557883708, + "grad_norm": 0.7922064047732775, + "learning_rate": 2.312405428784532e-06, + "loss": 0.129, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.054738614708185196, + "step": 11505, + "valid_targets_mean": 1325.1, + "valid_targets_min": 627 + }, + { + "epoch": 6.029334730225249, + "grad_norm": 0.7956421797633352, + "learning_rate": 2.3002269784384533e-06, + "loss": 0.1231, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0749821588397026, + "step": 11510, + "valid_targets_mean": 1732.4, + "valid_targets_min": 633 + }, + { + "epoch": 6.031953902566789, + "grad_norm": 0.8077100279931957, + "learning_rate": 2.2880787251752134e-06, + "loss": 0.1202, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06252764910459518, + "step": 11515, + "valid_targets_mean": 1525.6, + "valid_targets_min": 923 + }, + { + "epoch": 6.034573074908329, + "grad_norm": 0.7804853727327673, + "learning_rate": 2.2759606897206043e-06, + "loss": 0.1186, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06563736498355865, + "step": 11520, + "valid_targets_mean": 1603.5, + "valid_targets_min": 740 + }, + { + "epoch": 6.037192247249869, + "grad_norm": 0.8622259356502991, + "learning_rate": 2.263872892748866e-06, + "loss": 0.1163, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06406301259994507, + "step": 11525, + "valid_targets_mean": 1757.0, + "valid_targets_min": 895 + }, + { + "epoch": 6.039811419591409, + "grad_norm": 0.8644492816609076, + "learning_rate": 2.251815354882647e-06, + "loss": 0.1112, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05467421934008598, + "step": 11530, + "valid_targets_mean": 1391.5, + "valid_targets_min": 1005 + }, + { + "epoch": 6.042430591932949, + "grad_norm": 0.8034350215030263, + "learning_rate": 2.2397880966929718e-06, + "loss": 0.1281, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04740656539797783, + "step": 11535, + "valid_targets_mean": 1217.1, + "valid_targets_min": 870 + }, + { + "epoch": 6.04504976427449, + "grad_norm": 0.7982295042700137, + "learning_rate": 2.227791138699211e-06, + "loss": 0.123, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06267914175987244, + "step": 11540, + "valid_targets_mean": 1619.1, + "valid_targets_min": 879 + }, + { + "epoch": 6.047668936616029, + "grad_norm": 0.7768829121969157, + "learning_rate": 2.2158245013690216e-06, + "loss": 0.1241, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0555448904633522, + "step": 11545, + "valid_targets_mean": 1507.5, + "valid_targets_min": 906 + }, + { + "epoch": 6.050288108957569, + "grad_norm": 0.8186437461505175, + "learning_rate": 2.2038882051183606e-06, + "loss": 0.1213, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07260645925998688, + "step": 11550, + "valid_targets_mean": 1707.1, + "valid_targets_min": 814 + }, + { + "epoch": 6.05290728129911, + "grad_norm": 0.8297988799685673, + "learning_rate": 2.1919822703113945e-06, + "loss": 0.1235, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06317691504955292, + "step": 11555, + "valid_targets_mean": 1747.9, + "valid_targets_min": 832 + }, + { + "epoch": 6.05552645364065, + "grad_norm": 0.7807605710807147, + "learning_rate": 2.180106717260515e-06, + "loss": 0.1191, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05148398131132126, + "step": 11560, + "valid_targets_mean": 1581.9, + "valid_targets_min": 891 + }, + { + "epoch": 6.058145625982189, + "grad_norm": 0.9167811492382313, + "learning_rate": 2.168261566226255e-06, + "loss": 0.1216, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07749298214912415, + "step": 11565, + "valid_targets_mean": 1746.8, + "valid_targets_min": 1052 + }, + { + "epoch": 6.06076479832373, + "grad_norm": 0.7718625888889671, + "learning_rate": 2.1564468374172986e-06, + "loss": 0.1118, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05473483353853226, + "step": 11570, + "valid_targets_mean": 1469.5, + "valid_targets_min": 737 + }, + { + "epoch": 6.06338397066527, + "grad_norm": 0.7798331491197191, + "learning_rate": 2.144662550990422e-06, + "loss": 0.1174, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06085578724741936, + "step": 11575, + "valid_targets_mean": 1762.2, + "valid_targets_min": 1062 + }, + { + "epoch": 6.06600314300681, + "grad_norm": 0.8299720107263232, + "learning_rate": 2.1329087270504577e-06, + "loss": 0.1138, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06023997813463211, + "step": 11580, + "valid_targets_mean": 1482.1, + "valid_targets_min": 805 + }, + { + "epoch": 6.06862231534835, + "grad_norm": 0.7736914438669119, + "learning_rate": 2.1211853856502794e-06, + "loss": 0.1217, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06807412952184677, + "step": 11585, + "valid_targets_mean": 1962.8, + "valid_targets_min": 1253 + }, + { + "epoch": 6.07124148768989, + "grad_norm": 0.854125867360808, + "learning_rate": 2.1094925467907456e-06, + "loss": 0.1271, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07101461291313171, + "step": 11590, + "valid_targets_mean": 1958.0, + "valid_targets_min": 1264 + }, + { + "epoch": 6.07386066003143, + "grad_norm": 0.7946035281916202, + "learning_rate": 2.0978302304206766e-06, + "loss": 0.1187, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04817923903465271, + "step": 11595, + "valid_targets_mean": 1201.4, + "valid_targets_min": 613 + }, + { + "epoch": 6.0764798323729705, + "grad_norm": 0.8165893535643656, + "learning_rate": 2.0861984564368297e-06, + "loss": 0.1207, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.061780575662851334, + "step": 11600, + "valid_targets_mean": 1559.0, + "valid_targets_min": 768 + }, + { + "epoch": 6.07909900471451, + "grad_norm": 1.2887836682489096, + "learning_rate": 2.0745972446838294e-06, + "loss": 0.1157, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05495624244213104, + "step": 11605, + "valid_targets_mean": 1210.0, + "valid_targets_min": 714 + }, + { + "epoch": 6.08171817705605, + "grad_norm": 0.8710831103154718, + "learning_rate": 2.0630266149541934e-06, + "loss": 0.1249, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04973271116614342, + "step": 11610, + "valid_targets_mean": 1242.2, + "valid_targets_min": 841 + }, + { + "epoch": 6.0843373493975905, + "grad_norm": 0.7665366475838662, + "learning_rate": 2.0514865869882295e-06, + "loss": 0.1176, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06063533201813698, + "step": 11615, + "valid_targets_mean": 1708.1, + "valid_targets_min": 936 + }, + { + "epoch": 6.086956521739131, + "grad_norm": 0.894116689823647, + "learning_rate": 2.039977180474071e-06, + "loss": 0.1159, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05748577415943146, + "step": 11620, + "valid_targets_mean": 1163.1, + "valid_targets_min": 746 + }, + { + "epoch": 6.08957569408067, + "grad_norm": 0.790949054699234, + "learning_rate": 2.0284984150475795e-06, + "loss": 0.1042, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05484342202544212, + "step": 11625, + "valid_targets_mean": 1380.4, + "valid_targets_min": 814 + }, + { + "epoch": 6.0921948664222105, + "grad_norm": 0.7846854748574492, + "learning_rate": 2.0170503102923544e-06, + "loss": 0.1199, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0660267323255539, + "step": 11630, + "valid_targets_mean": 1625.4, + "valid_targets_min": 635 + }, + { + "epoch": 6.094814038763751, + "grad_norm": 0.8299153408407629, + "learning_rate": 2.0056328857396856e-06, + "loss": 0.1146, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04472474753856659, + "step": 11635, + "valid_targets_mean": 1153.4, + "valid_targets_min": 734 + }, + { + "epoch": 6.097433211105291, + "grad_norm": 0.8316666817616704, + "learning_rate": 1.994246160868516e-06, + "loss": 0.1155, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06456252932548523, + "step": 11640, + "valid_targets_mean": 1487.1, + "valid_targets_min": 831 + }, + { + "epoch": 6.1000523834468305, + "grad_norm": 0.7880769174254484, + "learning_rate": 1.9828901551054193e-06, + "loss": 0.1151, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05208251625299454, + "step": 11645, + "valid_targets_mean": 1479.1, + "valid_targets_min": 1015 + }, + { + "epoch": 6.102671555788371, + "grad_norm": 0.7833005697941994, + "learning_rate": 1.9715648878245532e-06, + "loss": 0.1145, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05049904063344002, + "step": 11650, + "valid_targets_mean": 1366.5, + "valid_targets_min": 711 + }, + { + "epoch": 6.105290728129911, + "grad_norm": 0.7489628605619162, + "learning_rate": 1.960270378347642e-06, + "loss": 0.1135, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.042261186987161636, + "step": 11655, + "valid_targets_mean": 1318.1, + "valid_targets_min": 736 + }, + { + "epoch": 6.107909900471451, + "grad_norm": 0.9224735642475472, + "learning_rate": 1.9490066459439184e-06, + "loss": 0.1178, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07317248731851578, + "step": 11660, + "valid_targets_mean": 1541.2, + "valid_targets_min": 931 + }, + { + "epoch": 6.110529072812991, + "grad_norm": 0.7834065543973477, + "learning_rate": 1.9377737098301263e-06, + "loss": 0.1222, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06088053807616234, + "step": 11665, + "valid_targets_mean": 1790.2, + "valid_targets_min": 1011 + }, + { + "epoch": 6.113148245154531, + "grad_norm": 0.8178539351959183, + "learning_rate": 1.9265715891704583e-06, + "loss": 0.1241, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06058657169342041, + "step": 11670, + "valid_targets_mean": 1511.6, + "valid_targets_min": 748 + }, + { + "epoch": 6.1157674174960714, + "grad_norm": 0.8386374996628507, + "learning_rate": 1.9154003030765377e-06, + "loss": 0.113, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.058460816740989685, + "step": 11675, + "valid_targets_mean": 1568.1, + "valid_targets_min": 699 + }, + { + "epoch": 6.118386589837612, + "grad_norm": 0.8067359342212168, + "learning_rate": 1.9042598706073767e-06, + "loss": 0.1065, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.038479067385196686, + "step": 11680, + "valid_targets_mean": 1002.4, + "valid_targets_min": 534 + }, + { + "epoch": 6.121005762179151, + "grad_norm": 0.8310382170192431, + "learning_rate": 1.8931503107693605e-06, + "loss": 0.121, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05678606778383255, + "step": 11685, + "valid_targets_mean": 1367.1, + "valid_targets_min": 687 + }, + { + "epoch": 6.1236249345206915, + "grad_norm": 0.8446260002301718, + "learning_rate": 1.8820716425161812e-06, + "loss": 0.1132, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04868333414196968, + "step": 11690, + "valid_targets_mean": 1259.8, + "valid_targets_min": 835 + }, + { + "epoch": 6.126244106862232, + "grad_norm": 0.834487265817137, + "learning_rate": 1.8710238847488572e-06, + "loss": 0.1078, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05200199782848358, + "step": 11695, + "valid_targets_mean": 1330.9, + "valid_targets_min": 829 + }, + { + "epoch": 6.128863279203772, + "grad_norm": 0.7950437491710232, + "learning_rate": 1.8600070563156425e-06, + "loss": 0.1074, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06211322546005249, + "step": 11700, + "valid_targets_mean": 1756.4, + "valid_targets_min": 1138 + }, + { + "epoch": 6.1314824515453115, + "grad_norm": 0.8023437380624452, + "learning_rate": 1.8490211760120513e-06, + "loss": 0.1181, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0646124929189682, + "step": 11705, + "valid_targets_mean": 1799.8, + "valid_targets_min": 1174 + }, + { + "epoch": 6.134101623886852, + "grad_norm": 1.5271236396896737, + "learning_rate": 1.8380662625807665e-06, + "loss": 0.1155, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.057662054896354675, + "step": 11710, + "valid_targets_mean": 1524.5, + "valid_targets_min": 554 + }, + { + "epoch": 6.136720796228392, + "grad_norm": 0.7862694098761159, + "learning_rate": 1.8271423347116757e-06, + "loss": 0.1119, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05381157621741295, + "step": 11715, + "valid_targets_mean": 1367.2, + "valid_targets_min": 843 + }, + { + "epoch": 6.1393399685699315, + "grad_norm": 0.8073338604081094, + "learning_rate": 1.8162494110417683e-06, + "loss": 0.1106, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05907204747200012, + "step": 11720, + "valid_targets_mean": 1673.1, + "valid_targets_min": 849 + }, + { + "epoch": 6.141959140911472, + "grad_norm": 0.8167808150540459, + "learning_rate": 1.805387510155161e-06, + "loss": 0.1171, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05595570057630539, + "step": 11725, + "valid_targets_mean": 1509.0, + "valid_targets_min": 612 + }, + { + "epoch": 6.144578313253012, + "grad_norm": 0.856293701424457, + "learning_rate": 1.7945566505830325e-06, + "loss": 0.1175, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05260946974158287, + "step": 11730, + "valid_targets_mean": 1401.0, + "valid_targets_min": 841 + }, + { + "epoch": 6.147197485594552, + "grad_norm": 0.8906531417243976, + "learning_rate": 1.7837568508036108e-06, + "loss": 0.1158, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06653806567192078, + "step": 11735, + "valid_targets_mean": 1564.8, + "valid_targets_min": 746 + }, + { + "epoch": 6.149816657936092, + "grad_norm": 0.8176579226961042, + "learning_rate": 1.7729881292421236e-06, + "loss": 0.1118, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.053530290722846985, + "step": 11740, + "valid_targets_mean": 1293.1, + "valid_targets_min": 822 + }, + { + "epoch": 6.152435830277632, + "grad_norm": 0.7511511259946063, + "learning_rate": 1.7622505042707927e-06, + "loss": 0.1029, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.050591953098773956, + "step": 11745, + "valid_targets_mean": 1731.0, + "valid_targets_min": 670 + }, + { + "epoch": 6.155055002619172, + "grad_norm": 0.8166327313618861, + "learning_rate": 1.7515439942087597e-06, + "loss": 0.1177, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0659506767988205, + "step": 11750, + "valid_targets_mean": 1624.1, + "valid_targets_min": 647 + }, + { + "epoch": 6.157674174960713, + "grad_norm": 0.9273321820099081, + "learning_rate": 1.7408686173221179e-06, + "loss": 0.1177, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04893888160586357, + "step": 11755, + "valid_targets_mean": 1429.1, + "valid_targets_min": 952 + }, + { + "epoch": 6.160293347302252, + "grad_norm": 0.9048561020505893, + "learning_rate": 1.7302243918238137e-06, + "loss": 0.1145, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04985303804278374, + "step": 11760, + "valid_targets_mean": 1222.5, + "valid_targets_min": 746 + }, + { + "epoch": 6.162912519643792, + "grad_norm": 0.813391650304158, + "learning_rate": 1.7196113358736655e-06, + "loss": 0.1141, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0514526404440403, + "step": 11765, + "valid_targets_mean": 1417.8, + "valid_targets_min": 892 + }, + { + "epoch": 6.165531691985333, + "grad_norm": 0.8100378908596324, + "learning_rate": 1.7090294675783026e-06, + "loss": 0.1189, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06349000334739685, + "step": 11770, + "valid_targets_mean": 1636.0, + "valid_targets_min": 985 + }, + { + "epoch": 6.168150864326873, + "grad_norm": 0.8672363204516796, + "learning_rate": 1.6984788049911572e-06, + "loss": 0.1139, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.054531119763851166, + "step": 11775, + "valid_targets_mean": 1505.0, + "valid_targets_min": 636 + }, + { + "epoch": 6.170770036668412, + "grad_norm": 0.8618687495589307, + "learning_rate": 1.687959366112415e-06, + "loss": 0.112, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04755813628435135, + "step": 11780, + "valid_targets_mean": 1286.5, + "valid_targets_min": 641 + }, + { + "epoch": 6.173389209009953, + "grad_norm": 0.7778918855830956, + "learning_rate": 1.6774711688889933e-06, + "loss": 0.1137, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06086455285549164, + "step": 11785, + "valid_targets_mean": 1567.5, + "valid_targets_min": 1020 + }, + { + "epoch": 6.176008381351493, + "grad_norm": 0.7632153150912035, + "learning_rate": 1.667014231214512e-06, + "loss": 0.1095, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.048788003623485565, + "step": 11790, + "valid_targets_mean": 1252.4, + "valid_targets_min": 729 + }, + { + "epoch": 6.178627553693033, + "grad_norm": 0.8316843161980305, + "learning_rate": 1.6565885709292496e-06, + "loss": 0.1194, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06742323935031891, + "step": 11795, + "valid_targets_mean": 1518.2, + "valid_targets_min": 682 + }, + { + "epoch": 6.181246726034573, + "grad_norm": 0.8169650561144044, + "learning_rate": 1.6461942058201397e-06, + "loss": 0.1197, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0598052479326725, + "step": 11800, + "valid_targets_mean": 1619.2, + "valid_targets_min": 1260 + }, + { + "epoch": 6.183865898376113, + "grad_norm": 0.8353797928606886, + "learning_rate": 1.6358311536207084e-06, + "loss": 0.1151, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06587246060371399, + "step": 11805, + "valid_targets_mean": 1575.4, + "valid_targets_min": 906 + }, + { + "epoch": 6.186485070717653, + "grad_norm": 0.8979736643597953, + "learning_rate": 1.6254994320110707e-06, + "loss": 0.1149, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06438019871711731, + "step": 11810, + "valid_targets_mean": 1608.1, + "valid_targets_min": 801 + }, + { + "epoch": 6.189104243059194, + "grad_norm": 0.7569834562634008, + "learning_rate": 1.61519905861788e-06, + "loss": 0.1072, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.055120810866355896, + "step": 11815, + "valid_targets_mean": 1414.8, + "valid_targets_min": 564 + }, + { + "epoch": 6.191723415400733, + "grad_norm": 0.8072629139008018, + "learning_rate": 1.6049300510143173e-06, + "loss": 0.1085, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.056000012904405594, + "step": 11820, + "valid_targets_mean": 1512.5, + "valid_targets_min": 651 + }, + { + "epoch": 6.194342587742273, + "grad_norm": 0.8137590485392445, + "learning_rate": 1.5946924267200437e-06, + "loss": 0.1154, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04661045968532562, + "step": 11825, + "valid_targets_mean": 1262.4, + "valid_targets_min": 716 + }, + { + "epoch": 6.196961760083814, + "grad_norm": 0.7701490102572036, + "learning_rate": 1.584486203201181e-06, + "loss": 0.1075, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04992928355932236, + "step": 11830, + "valid_targets_mean": 1230.0, + "valid_targets_min": 704 + }, + { + "epoch": 6.199580932425354, + "grad_norm": 0.7514466436217656, + "learning_rate": 1.5743113978702807e-06, + "loss": 0.104, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05396423488855362, + "step": 11835, + "valid_targets_mean": 1497.5, + "valid_targets_min": 1251 + }, + { + "epoch": 6.202200104766893, + "grad_norm": 0.8670940282351024, + "learning_rate": 1.5641680280862947e-06, + "loss": 0.1112, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.056431740522384644, + "step": 11840, + "valid_targets_mean": 1470.8, + "valid_targets_min": 764 + }, + { + "epoch": 6.204819277108434, + "grad_norm": 0.9243653707102031, + "learning_rate": 1.5540561111545272e-06, + "loss": 0.1194, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06075423210859299, + "step": 11845, + "valid_targets_mean": 1469.4, + "valid_targets_min": 846 + }, + { + "epoch": 6.207438449449974, + "grad_norm": 0.8745717321879108, + "learning_rate": 1.5439756643266468e-06, + "loss": 0.107, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06556703895330429, + "step": 11850, + "valid_targets_mean": 1774.4, + "valid_targets_min": 1011 + }, + { + "epoch": 6.210057621791514, + "grad_norm": 0.7920889225831382, + "learning_rate": 1.5339267048006078e-06, + "loss": 0.1129, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05082762986421585, + "step": 11855, + "valid_targets_mean": 1558.9, + "valid_targets_min": 823 + }, + { + "epoch": 6.212676794133054, + "grad_norm": 0.7701394032471317, + "learning_rate": 1.5239092497206697e-06, + "loss": 0.0991, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05166442319750786, + "step": 11860, + "valid_targets_mean": 1687.6, + "valid_targets_min": 595 + }, + { + "epoch": 6.215295966474594, + "grad_norm": 0.9627179393614519, + "learning_rate": 1.5139233161773193e-06, + "loss": 0.1085, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05256475508213043, + "step": 11865, + "valid_targets_mean": 1336.9, + "valid_targets_min": 868 + }, + { + "epoch": 6.217915138816134, + "grad_norm": 0.8767320830018093, + "learning_rate": 1.5039689212072772e-06, + "loss": 0.1062, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05469423532485962, + "step": 11870, + "valid_targets_mean": 1266.6, + "valid_targets_min": 818 + }, + { + "epoch": 6.2205343111576745, + "grad_norm": 0.8010639984469596, + "learning_rate": 1.4940460817934587e-06, + "loss": 0.1114, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06903129816055298, + "step": 11875, + "valid_targets_mean": 1976.8, + "valid_targets_min": 1080 + }, + { + "epoch": 6.223153483499214, + "grad_norm": 0.8188843415246827, + "learning_rate": 1.4841548148649376e-06, + "loss": 0.1104, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.061441607773303986, + "step": 11880, + "valid_targets_mean": 1554.1, + "valid_targets_min": 658 + }, + { + "epoch": 6.225772655840754, + "grad_norm": 0.7992562221434741, + "learning_rate": 1.4742951372969262e-06, + "loss": 0.1131, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05371711403131485, + "step": 11885, + "valid_targets_mean": 1499.6, + "valid_targets_min": 1018 + }, + { + "epoch": 6.2283918281822945, + "grad_norm": 0.8391318946920864, + "learning_rate": 1.4644670659107419e-06, + "loss": 0.1117, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0553358718752861, + "step": 11890, + "valid_targets_mean": 1475.5, + "valid_targets_min": 897 + }, + { + "epoch": 6.231011000523835, + "grad_norm": 0.9655110948032307, + "learning_rate": 1.454670617473779e-06, + "loss": 0.1288, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08838294446468353, + "step": 11895, + "valid_targets_mean": 7107.2, + "valid_targets_min": 5295 + }, + { + "epoch": 6.233630172865374, + "grad_norm": 0.8958472755472283, + "learning_rate": 1.4449058086994839e-06, + "loss": 0.1636, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08870230615139008, + "step": 11900, + "valid_targets_mean": 7098.2, + "valid_targets_min": 5066 + }, + { + "epoch": 6.2362493452069145, + "grad_norm": 0.8201353608539739, + "learning_rate": 1.4351726562473166e-06, + "loss": 0.1602, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07592824101448059, + "step": 11905, + "valid_targets_mean": 6838.1, + "valid_targets_min": 4923 + }, + { + "epoch": 6.238868517548455, + "grad_norm": 0.7182641005412113, + "learning_rate": 1.4254711767227347e-06, + "loss": 0.1529, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07479575276374817, + "step": 11910, + "valid_targets_mean": 5701.2, + "valid_targets_min": 3922 + }, + { + "epoch": 6.241487689889995, + "grad_norm": 0.6340844273775583, + "learning_rate": 1.4158013866771624e-06, + "loss": 0.1498, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07615907490253448, + "step": 11915, + "valid_targets_mean": 7340.9, + "valid_targets_min": 4797 + }, + { + "epoch": 6.2441068622315345, + "grad_norm": 0.6199312834660536, + "learning_rate": 1.4061633026079501e-06, + "loss": 0.1651, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08893653750419617, + "step": 11920, + "valid_targets_mean": 6343.9, + "valid_targets_min": 3853 + }, + { + "epoch": 6.246726034573075, + "grad_norm": 0.5247604131189251, + "learning_rate": 1.3965569409583646e-06, + "loss": 0.1533, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0741259753704071, + "step": 11925, + "valid_targets_mean": 6566.2, + "valid_targets_min": 4586 + }, + { + "epoch": 6.249345206914615, + "grad_norm": 0.507275471084232, + "learning_rate": 1.3869823181175468e-06, + "loss": 0.1461, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08363064378499985, + "step": 11930, + "valid_targets_mean": 7153.6, + "valid_targets_min": 4728 + }, + { + "epoch": 6.2519643792561554, + "grad_norm": 0.6009936005906976, + "learning_rate": 1.3774394504204925e-06, + "loss": 0.172, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12445858865976334, + "step": 11935, + "valid_targets_mean": 6562.0, + "valid_targets_min": 5203 + }, + { + "epoch": 6.254583551597695, + "grad_norm": 0.45766553236629404, + "learning_rate": 1.3679283541480116e-06, + "loss": 0.1423, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07799802720546722, + "step": 11940, + "valid_targets_mean": 7098.9, + "valid_targets_min": 4561 + }, + { + "epoch": 6.257202723939235, + "grad_norm": 0.524128723453135, + "learning_rate": 1.3584490455267263e-06, + "loss": 0.1578, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1061946228146553, + "step": 11945, + "valid_targets_mean": 4960.2, + "valid_targets_min": 3439 + }, + { + "epoch": 6.2598218962807755, + "grad_norm": 0.4413781153928334, + "learning_rate": 1.349001540729009e-06, + "loss": 0.143, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06203271076083183, + "step": 11950, + "valid_targets_mean": 5384.2, + "valid_targets_min": 3635 + }, + { + "epoch": 6.262441068622316, + "grad_norm": 0.44634902795119863, + "learning_rate": 1.339585855872989e-06, + "loss": 0.1499, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0751538872718811, + "step": 11955, + "valid_targets_mean": 6940.2, + "valid_targets_min": 4393 + }, + { + "epoch": 6.265060240963855, + "grad_norm": 0.43672764749518056, + "learning_rate": 1.3302020070224942e-06, + "loss": 0.1393, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07703030109405518, + "step": 11960, + "valid_targets_mean": 6812.4, + "valid_targets_min": 4749 + }, + { + "epoch": 6.2676794133053955, + "grad_norm": 0.48392158271644026, + "learning_rate": 1.3208500101870446e-06, + "loss": 0.1364, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.029781676828861237, + "step": 11965, + "valid_targets_mean": 2363.0, + "valid_targets_min": 1062 + }, + { + "epoch": 6.270298585646936, + "grad_norm": 0.4393216070908655, + "learning_rate": 1.3115298813218201e-06, + "loss": 0.1372, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06820503622293472, + "step": 11970, + "valid_targets_mean": 5841.2, + "valid_targets_min": 3119 + }, + { + "epoch": 6.272917757988475, + "grad_norm": 0.4006964994183144, + "learning_rate": 1.302241636327628e-06, + "loss": 0.1475, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08046795427799225, + "step": 11975, + "valid_targets_mean": 5761.4, + "valid_targets_min": 3774 + }, + { + "epoch": 6.2755369303300155, + "grad_norm": 0.4525483967505272, + "learning_rate": 1.2929852910508811e-06, + "loss": 0.1439, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07478667795658112, + "step": 11980, + "valid_targets_mean": 6412.4, + "valid_targets_min": 5293 + }, + { + "epoch": 6.278156102671556, + "grad_norm": 0.40466175114045916, + "learning_rate": 1.2837608612835717e-06, + "loss": 0.1295, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07089799642562866, + "step": 11985, + "valid_targets_mean": 6709.1, + "valid_targets_min": 5665 + }, + { + "epoch": 6.280775275013096, + "grad_norm": 0.433406964654351, + "learning_rate": 1.274568362763231e-06, + "loss": 0.1363, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07706020772457123, + "step": 11990, + "valid_targets_mean": 7344.6, + "valid_targets_min": 4428 + }, + { + "epoch": 6.283394447354636, + "grad_norm": 0.424450344960714, + "learning_rate": 1.2654078111729318e-06, + "loss": 0.1549, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07545164227485657, + "step": 11995, + "valid_targets_mean": 5780.6, + "valid_targets_min": 4690 + }, + { + "epoch": 6.286013619696176, + "grad_norm": 0.391086310864684, + "learning_rate": 1.256279222141219e-06, + "loss": 0.1552, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06854374706745148, + "step": 12000, + "valid_targets_mean": 5854.5, + "valid_targets_min": 4335 + }, + { + "epoch": 6.288632792037716, + "grad_norm": 0.4395805926833709, + "learning_rate": 1.2471826112421348e-06, + "loss": 0.1385, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06968638300895691, + "step": 12005, + "valid_targets_mean": 6378.9, + "valid_targets_min": 5342 + }, + { + "epoch": 6.291251964379256, + "grad_norm": 0.44846829068853294, + "learning_rate": 1.238117993995136e-06, + "loss": 0.1459, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06752711534500122, + "step": 12010, + "valid_targets_mean": 5756.5, + "valid_targets_min": 3840 + }, + { + "epoch": 6.293871136720796, + "grad_norm": 0.44086127341386794, + "learning_rate": 1.2290853858651252e-06, + "loss": 0.1596, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08626071363687515, + "step": 12015, + "valid_targets_mean": 6438.6, + "valid_targets_min": 5104 + }, + { + "epoch": 6.296490309062336, + "grad_norm": 0.4560999311130661, + "learning_rate": 1.220084802262369e-06, + "loss": 0.176, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06795895099639893, + "step": 12020, + "valid_targets_mean": 5190.4, + "valid_targets_min": 4224 + }, + { + "epoch": 6.299109481403876, + "grad_norm": 0.43551584888346606, + "learning_rate": 1.211116258542513e-06, + "loss": 0.1651, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07206246256828308, + "step": 12025, + "valid_targets_mean": 5932.8, + "valid_targets_min": 4318 + }, + { + "epoch": 6.301728653745417, + "grad_norm": 0.41431914162984274, + "learning_rate": 1.202179770006533e-06, + "loss": 0.147, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07387147843837738, + "step": 12030, + "valid_targets_mean": 6348.5, + "valid_targets_min": 4783 + }, + { + "epoch": 6.304347826086957, + "grad_norm": 0.45201928195808644, + "learning_rate": 1.1932753519007246e-06, + "loss": 0.1485, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0748416930437088, + "step": 12035, + "valid_targets_mean": 7200.1, + "valid_targets_min": 4412 + }, + { + "epoch": 6.306966998428496, + "grad_norm": 0.45895603504767424, + "learning_rate": 1.18440301941666e-06, + "loss": 0.1551, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08404980599880219, + "step": 12040, + "valid_targets_mean": 6137.5, + "valid_targets_min": 5033 + }, + { + "epoch": 6.309586170770037, + "grad_norm": 0.40531811665772616, + "learning_rate": 1.1755627876911823e-06, + "loss": 0.1464, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06787222623825073, + "step": 12045, + "valid_targets_mean": 5695.5, + "valid_targets_min": 4822 + }, + { + "epoch": 6.312205343111577, + "grad_norm": 0.4505022302270149, + "learning_rate": 1.1667546718063493e-06, + "loss": 0.1497, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07829370349645615, + "step": 12050, + "valid_targets_mean": 5906.1, + "valid_targets_min": 2364 + }, + { + "epoch": 6.314824515453116, + "grad_norm": 0.4518121518021245, + "learning_rate": 1.1579786867894471e-06, + "loss": 0.1574, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08290734142065048, + "step": 12055, + "valid_targets_mean": 6359.0, + "valid_targets_min": 4793 + }, + { + "epoch": 6.317443687794657, + "grad_norm": 0.4299181018801878, + "learning_rate": 1.1492348476129323e-06, + "loss": 0.1495, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08029110729694366, + "step": 12060, + "valid_targets_mean": 6104.9, + "valid_targets_min": 4733 + }, + { + "epoch": 6.320062860136197, + "grad_norm": 0.3650039174519398, + "learning_rate": 1.1405231691944252e-06, + "loss": 0.1367, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06358305364847183, + "step": 12065, + "valid_targets_mean": 6780.8, + "valid_targets_min": 5388 + }, + { + "epoch": 6.322682032477737, + "grad_norm": 0.40302057029858435, + "learning_rate": 1.1318436663966703e-06, + "loss": 0.133, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07508301734924316, + "step": 12070, + "valid_targets_mean": 5956.2, + "valid_targets_min": 3182 + }, + { + "epoch": 6.325301204819277, + "grad_norm": 0.4250736175157111, + "learning_rate": 1.123196354027527e-06, + "loss": 0.1552, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08265276253223419, + "step": 12075, + "valid_targets_mean": 6389.4, + "valid_targets_min": 5077 + }, + { + "epoch": 6.327920377160817, + "grad_norm": 0.45821405058257997, + "learning_rate": 1.1145812468399274e-06, + "loss": 0.1536, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08668242394924164, + "step": 12080, + "valid_targets_mean": 5607.8, + "valid_targets_min": 3663 + }, + { + "epoch": 6.330539549502357, + "grad_norm": 0.4249903395916202, + "learning_rate": 1.1059983595318613e-06, + "loss": 0.1438, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06720085442066193, + "step": 12085, + "valid_targets_mean": 5616.4, + "valid_targets_min": 4105 + }, + { + "epoch": 6.333158721843898, + "grad_norm": 0.3896070204803804, + "learning_rate": 1.0974477067463552e-06, + "loss": 0.1446, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0791177898645401, + "step": 12090, + "valid_targets_mean": 7271.0, + "valid_targets_min": 5201 + }, + { + "epoch": 6.335777894185437, + "grad_norm": 0.421885075677326, + "learning_rate": 1.0889293030714288e-06, + "loss": 0.1361, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07875902950763702, + "step": 12095, + "valid_targets_mean": 6797.6, + "valid_targets_min": 5069 + }, + { + "epoch": 6.338397066526977, + "grad_norm": 0.4143888260982762, + "learning_rate": 1.0804431630401013e-06, + "loss": 0.145, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07206882536411285, + "step": 12100, + "valid_targets_mean": 5787.4, + "valid_targets_min": 4729 + }, + { + "epoch": 6.341016238868518, + "grad_norm": 0.4447957567250799, + "learning_rate": 1.071989301130325e-06, + "loss": 0.1525, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0739193931221962, + "step": 12105, + "valid_targets_mean": 5989.0, + "valid_targets_min": 4567 + }, + { + "epoch": 6.343635411210058, + "grad_norm": 0.4116999865777004, + "learning_rate": 1.0635677317650006e-06, + "loss": 0.1387, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06551603227853775, + "step": 12110, + "valid_targets_mean": 5873.4, + "valid_targets_min": 4464 + }, + { + "epoch": 6.346254583551597, + "grad_norm": 0.4261393249437143, + "learning_rate": 1.0551784693119281e-06, + "loss": 0.1549, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07234413921833038, + "step": 12115, + "valid_targets_mean": 5373.8, + "valid_targets_min": 4908 + }, + { + "epoch": 6.348873755893138, + "grad_norm": 0.3769429712793793, + "learning_rate": 1.0468215280837945e-06, + "loss": 0.1367, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.059860795736312866, + "step": 12120, + "valid_targets_mean": 5441.6, + "valid_targets_min": 4443 + }, + { + "epoch": 6.351492928234678, + "grad_norm": 0.3943897450855496, + "learning_rate": 1.038496922338137e-06, + "loss": 0.1258, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0633818507194519, + "step": 12125, + "valid_targets_mean": 6286.8, + "valid_targets_min": 3381 + }, + { + "epoch": 6.354112100576218, + "grad_norm": 0.41650678916559775, + "learning_rate": 1.0302046662773301e-06, + "loss": 0.1293, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06222138553857803, + "step": 12130, + "valid_targets_mean": 6162.8, + "valid_targets_min": 4790 + }, + { + "epoch": 6.356731272917758, + "grad_norm": 0.3995135580856778, + "learning_rate": 1.0219447740485622e-06, + "loss": 0.1321, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06467224657535553, + "step": 12135, + "valid_targets_mean": 6336.1, + "valid_targets_min": 5161 + }, + { + "epoch": 6.359350445259298, + "grad_norm": 0.4200816063818399, + "learning_rate": 1.0137172597438006e-06, + "loss": 0.1472, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06530135124921799, + "step": 12140, + "valid_targets_mean": 6038.0, + "valid_targets_min": 4491 + }, + { + "epoch": 6.361969617600838, + "grad_norm": 0.6366831964221076, + "learning_rate": 1.0055221373997704e-06, + "loss": 0.1752, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11287716031074524, + "step": 12145, + "valid_targets_mean": 1423.0, + "valid_targets_min": 817 + }, + { + "epoch": 6.3645887899423785, + "grad_norm": 0.44211213435952007, + "learning_rate": 9.973594209979475e-07, + "loss": 0.1572, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06968766450881958, + "step": 12150, + "valid_targets_mean": 5531.1, + "valid_targets_min": 3893 + }, + { + "epoch": 6.367207962283918, + "grad_norm": 0.4166404237161675, + "learning_rate": 9.892291244645014e-07, + "loss": 0.1399, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0780155211687088, + "step": 12155, + "valid_targets_mean": 6276.2, + "valid_targets_min": 4622 + }, + { + "epoch": 6.369827134625458, + "grad_norm": 0.40278586878859884, + "learning_rate": 9.811312616703072e-07, + "loss": 0.1455, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07156006246805191, + "step": 12160, + "valid_targets_mean": 8019.8, + "valid_targets_min": 6108 + }, + { + "epoch": 6.3724463069669985, + "grad_norm": 0.43210480480170727, + "learning_rate": 9.730658464309007e-07, + "loss": 0.1511, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07802318036556244, + "step": 12165, + "valid_targets_mean": 6822.1, + "valid_targets_min": 4253 + }, + { + "epoch": 6.375065479308539, + "grad_norm": 0.425610981171059, + "learning_rate": 9.650328925064545e-07, + "loss": 0.1588, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07639053463935852, + "step": 12170, + "valid_targets_mean": 6800.6, + "valid_targets_min": 4990 + }, + { + "epoch": 6.377684651650078, + "grad_norm": 0.43050386355730597, + "learning_rate": 9.570324136017683e-07, + "loss": 0.1494, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09192109107971191, + "step": 12175, + "valid_targets_mean": 6860.5, + "valid_targets_min": 4957 + }, + { + "epoch": 6.3803038239916186, + "grad_norm": 0.4091475548747802, + "learning_rate": 9.490644233662328e-07, + "loss": 0.1488, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06866734474897385, + "step": 12180, + "valid_targets_mean": 5820.2, + "valid_targets_min": 4775 + }, + { + "epoch": 6.382922996333159, + "grad_norm": 0.37973839807835397, + "learning_rate": 9.411289353938136e-07, + "loss": 0.1404, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05396395921707153, + "step": 12185, + "valid_targets_mean": 5628.8, + "valid_targets_min": 4098 + }, + { + "epoch": 6.385542168674699, + "grad_norm": 0.3950700056570422, + "learning_rate": 9.332259632230123e-07, + "loss": 0.1366, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07747262716293335, + "step": 12190, + "valid_targets_mean": 6170.6, + "valid_targets_min": 4801 + }, + { + "epoch": 6.388161341016239, + "grad_norm": 0.4635368797467224, + "learning_rate": 9.253555203368792e-07, + "loss": 0.1872, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18500551581382751, + "step": 12195, + "valid_targets_mean": 6196.0, + "valid_targets_min": 4734 + }, + { + "epoch": 6.390780513357779, + "grad_norm": 0.44116838575681694, + "learning_rate": 9.175176201629466e-07, + "loss": 0.1507, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08110781013965607, + "step": 12200, + "valid_targets_mean": 6086.4, + "valid_targets_min": 4400 + }, + { + "epoch": 6.393399685699319, + "grad_norm": 0.4394803002233574, + "learning_rate": 9.09712276073238e-07, + "loss": 0.1383, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07908235490322113, + "step": 12205, + "valid_targets_mean": 6544.9, + "valid_targets_min": 4919 + }, + { + "epoch": 6.3960188580408595, + "grad_norm": 0.4318114046998599, + "learning_rate": 9.019395013842303e-07, + "loss": 0.1465, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0808994323015213, + "step": 12210, + "valid_targets_mean": 6052.2, + "valid_targets_min": 4611 + }, + { + "epoch": 6.398638030382399, + "grad_norm": 0.43101304490405234, + "learning_rate": 8.941993093568314e-07, + "loss": 0.149, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06643542647361755, + "step": 12215, + "valid_targets_mean": 6934.9, + "valid_targets_min": 2275 + }, + { + "epoch": 6.401257202723939, + "grad_norm": 0.4130400097681656, + "learning_rate": 8.86491713196369e-07, + "loss": 0.1284, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06309416890144348, + "step": 12220, + "valid_targets_mean": 5878.5, + "valid_targets_min": 4826 + }, + { + "epoch": 6.4038763750654795, + "grad_norm": 0.39866053805511975, + "learning_rate": 8.788167260525537e-07, + "loss": 0.1424, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06360381841659546, + "step": 12225, + "valid_targets_mean": 6784.9, + "valid_targets_min": 4707 + }, + { + "epoch": 6.40649554740702, + "grad_norm": 0.3952513558012143, + "learning_rate": 8.7117436101946e-07, + "loss": 0.1313, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10245849192142487, + "step": 12230, + "valid_targets_mean": 7245.8, + "valid_targets_min": 5421 + }, + { + "epoch": 6.409114719748559, + "grad_norm": 0.3855066970646897, + "learning_rate": 8.635646311355206e-07, + "loss": 0.1371, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0684409886598587, + "step": 12235, + "valid_targets_mean": 7122.0, + "valid_targets_min": 4949 + }, + { + "epoch": 6.4117338920900995, + "grad_norm": 0.3819539134322198, + "learning_rate": 8.559875493834702e-07, + "loss": 0.1375, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0731293186545372, + "step": 12240, + "valid_targets_mean": 6444.5, + "valid_targets_min": 4831 + }, + { + "epoch": 6.41435306443164, + "grad_norm": 0.4052284152288746, + "learning_rate": 8.484431286903616e-07, + "loss": 0.1437, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08262995630502701, + "step": 12245, + "valid_targets_mean": 6454.9, + "valid_targets_min": 4018 + }, + { + "epoch": 6.41697223677318, + "grad_norm": 0.3474902598250319, + "learning_rate": 8.409313819275144e-07, + "loss": 0.1355, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0552181750535965, + "step": 12250, + "valid_targets_mean": 6851.4, + "valid_targets_min": 5034 + }, + { + "epoch": 6.4195914091147195, + "grad_norm": 0.5507816017274946, + "learning_rate": 8.334523219105084e-07, + "loss": 0.1383, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0801452100276947, + "step": 12255, + "valid_targets_mean": 6674.2, + "valid_targets_min": 4682 + }, + { + "epoch": 6.42221058145626, + "grad_norm": 0.447494323940838, + "learning_rate": 8.260059613991545e-07, + "loss": 0.1496, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07584092020988464, + "step": 12260, + "valid_targets_mean": 5518.1, + "valid_targets_min": 4764 + }, + { + "epoch": 6.4248297537978, + "grad_norm": 0.4725890617126325, + "learning_rate": 8.185923130974816e-07, + "loss": 0.1496, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08310903608798981, + "step": 12265, + "valid_targets_mean": 5329.2, + "valid_targets_min": 2481 + }, + { + "epoch": 6.42744892613934, + "grad_norm": 0.6737547623808363, + "learning_rate": 8.112113896537033e-07, + "loss": 0.1926, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11236198246479034, + "step": 12270, + "valid_targets_mean": 4792.6, + "valid_targets_min": 702 + }, + { + "epoch": 6.43006809848088, + "grad_norm": 0.6449972081489183, + "learning_rate": 8.038632036602068e-07, + "loss": 0.2083, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11374415457248688, + "step": 12275, + "valid_targets_mean": 5322.8, + "valid_targets_min": 1005 + }, + { + "epoch": 6.43268727082242, + "grad_norm": 0.5654573992879217, + "learning_rate": 7.965477676535216e-07, + "loss": 0.206, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07705260813236237, + "step": 12280, + "valid_targets_mean": 3584.6, + "valid_targets_min": 2054 + }, + { + "epoch": 6.43530644316396, + "grad_norm": 0.6863852664683533, + "learning_rate": 7.892650941143109e-07, + "loss": 0.2056, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09170589596033096, + "step": 12285, + "valid_targets_mean": 3685.6, + "valid_targets_min": 1751 + }, + { + "epoch": 6.437925615505501, + "grad_norm": 0.602298364243919, + "learning_rate": 7.820151954673316e-07, + "loss": 0.2036, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12648309767246246, + "step": 12290, + "valid_targets_mean": 5944.2, + "valid_targets_min": 1970 + }, + { + "epoch": 6.44054478784704, + "grad_norm": 0.5507065526632529, + "learning_rate": 7.747980840814384e-07, + "loss": 0.2099, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09939628094434738, + "step": 12295, + "valid_targets_mean": 5916.0, + "valid_targets_min": 920 + }, + { + "epoch": 6.44316396018858, + "grad_norm": 0.6006661949709525, + "learning_rate": 7.676137722695376e-07, + "loss": 0.2027, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09916333854198456, + "step": 12300, + "valid_targets_mean": 6475.4, + "valid_targets_min": 2231 + }, + { + "epoch": 6.445783132530121, + "grad_norm": 0.5738573068037527, + "learning_rate": 7.60462272288578e-07, + "loss": 0.201, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07840252667665482, + "step": 12305, + "valid_targets_mean": 4043.4, + "valid_targets_min": 467 + }, + { + "epoch": 6.44840230487166, + "grad_norm": 0.5439295935975441, + "learning_rate": 7.533435963395375e-07, + "loss": 0.212, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11592923104763031, + "step": 12310, + "valid_targets_mean": 5549.8, + "valid_targets_min": 3440 + }, + { + "epoch": 6.4510214772132, + "grad_norm": 0.8590229109445299, + "learning_rate": 7.462577565673835e-07, + "loss": 0.21, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10425989329814911, + "step": 12315, + "valid_targets_mean": 4736.9, + "valid_targets_min": 1697 + }, + { + "epoch": 6.453640649554741, + "grad_norm": 0.6337785584790162, + "learning_rate": 7.392047650610679e-07, + "loss": 0.2034, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11334839463233948, + "step": 12320, + "valid_targets_mean": 4838.2, + "valid_targets_min": 1223 + }, + { + "epoch": 6.456259821896281, + "grad_norm": 0.5547802198399892, + "learning_rate": 7.321846338535032e-07, + "loss": 0.204, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10477716475725174, + "step": 12325, + "valid_targets_mean": 5466.9, + "valid_targets_min": 1552 + }, + { + "epoch": 6.458878994237821, + "grad_norm": 0.5876783595854257, + "learning_rate": 7.251973749215357e-07, + "loss": 0.2041, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11823265999555588, + "step": 12330, + "valid_targets_mean": 5166.0, + "valid_targets_min": 1546 + }, + { + "epoch": 6.461498166579361, + "grad_norm": 0.5857999618397483, + "learning_rate": 7.182430001859253e-07, + "loss": 0.1984, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09447768330574036, + "step": 12335, + "valid_targets_mean": 3848.2, + "valid_targets_min": 1957 + }, + { + "epoch": 6.464117338920901, + "grad_norm": 0.6194569579809597, + "learning_rate": 7.113215215113456e-07, + "loss": 0.2007, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09726107120513916, + "step": 12340, + "valid_targets_mean": 3487.5, + "valid_targets_min": 1538 + }, + { + "epoch": 6.466736511262441, + "grad_norm": 0.6193271598241644, + "learning_rate": 7.044329507063241e-07, + "loss": 0.1939, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09087219834327698, + "step": 12345, + "valid_targets_mean": 3397.2, + "valid_targets_min": 1645 + }, + { + "epoch": 6.469355683603981, + "grad_norm": 0.6559474003243466, + "learning_rate": 6.975772995232621e-07, + "loss": 0.1986, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08520987629890442, + "step": 12350, + "valid_targets_mean": 2859.4, + "valid_targets_min": 935 + }, + { + "epoch": 6.471974855945521, + "grad_norm": 0.6428355270463898, + "learning_rate": 6.907545796583926e-07, + "loss": 0.2026, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10408250987529755, + "step": 12355, + "valid_targets_mean": 3490.6, + "valid_targets_min": 1269 + }, + { + "epoch": 6.474594028287061, + "grad_norm": 0.6780616244891007, + "learning_rate": 6.839648027517665e-07, + "loss": 0.2007, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09541037678718567, + "step": 12360, + "valid_targets_mean": 2860.0, + "valid_targets_min": 1173 + }, + { + "epoch": 6.477213200628602, + "grad_norm": 0.6127512057602541, + "learning_rate": 6.772079803872267e-07, + "loss": 0.1981, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09076771885156631, + "step": 12365, + "valid_targets_mean": 3480.9, + "valid_targets_min": 1392 + }, + { + "epoch": 6.479832372970141, + "grad_norm": 0.6625302661809119, + "learning_rate": 6.704841240924031e-07, + "loss": 0.2021, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1085045337677002, + "step": 12370, + "valid_targets_mean": 3878.6, + "valid_targets_min": 1883 + }, + { + "epoch": 6.482451545311681, + "grad_norm": 0.6526193395022808, + "learning_rate": 6.637932453386664e-07, + "loss": 0.1928, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11360698938369751, + "step": 12375, + "valid_targets_mean": 3721.4, + "valid_targets_min": 2106 + }, + { + "epoch": 6.485070717653222, + "grad_norm": 0.5927849705531022, + "learning_rate": 6.571353555411475e-07, + "loss": 0.1782, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07101786136627197, + "step": 12380, + "valid_targets_mean": 3868.5, + "valid_targets_min": 2222 + }, + { + "epoch": 6.487689889994762, + "grad_norm": 0.6476439861205255, + "learning_rate": 6.505104660586759e-07, + "loss": 0.1928, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09150652587413788, + "step": 12385, + "valid_targets_mean": 3010.1, + "valid_targets_min": 958 + }, + { + "epoch": 6.490309062336301, + "grad_norm": 0.6184049122484422, + "learning_rate": 6.439185881937949e-07, + "loss": 0.1963, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09595520049333572, + "step": 12390, + "valid_targets_mean": 3789.1, + "valid_targets_min": 771 + }, + { + "epoch": 6.492928234677842, + "grad_norm": 0.6302199004088047, + "learning_rate": 6.373597331927128e-07, + "loss": 0.1986, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06606753170490265, + "step": 12395, + "valid_targets_mean": 3578.9, + "valid_targets_min": 1774 + }, + { + "epoch": 6.495547407019382, + "grad_norm": 0.693365212113418, + "learning_rate": 6.308339122453189e-07, + "loss": 0.1908, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08515545725822449, + "step": 12400, + "valid_targets_mean": 2545.8, + "valid_targets_min": 997 + }, + { + "epoch": 6.498166579360922, + "grad_norm": 0.6048352005477383, + "learning_rate": 6.243411364851204e-07, + "loss": 0.1921, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09665270149707794, + "step": 12405, + "valid_targets_mean": 3667.1, + "valid_targets_min": 1741 + }, + { + "epoch": 6.500785751702462, + "grad_norm": 0.6792020303860473, + "learning_rate": 6.178814169892633e-07, + "loss": 0.1938, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09353077411651611, + "step": 12410, + "valid_targets_mean": 3606.1, + "valid_targets_min": 863 + }, + { + "epoch": 6.503404924044002, + "grad_norm": 0.6470828919156506, + "learning_rate": 6.114547647784941e-07, + "loss": 0.1894, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0979934111237526, + "step": 12415, + "valid_targets_mean": 3876.9, + "valid_targets_min": 1854 + }, + { + "epoch": 6.506024096385542, + "grad_norm": 0.5779518222287894, + "learning_rate": 6.0506119081714e-07, + "loss": 0.1819, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09203438460826874, + "step": 12420, + "valid_targets_mean": 4763.2, + "valid_targets_min": 2040 + }, + { + "epoch": 6.5086432687270825, + "grad_norm": 0.6346688915452731, + "learning_rate": 5.987007060130978e-07, + "loss": 0.1945, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08190780133008957, + "step": 12425, + "valid_targets_mean": 3521.9, + "valid_targets_min": 1036 + }, + { + "epoch": 6.511262441068622, + "grad_norm": 0.6318536696051502, + "learning_rate": 5.92373321217814e-07, + "loss": 0.1938, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10408752411603928, + "step": 12430, + "valid_targets_mean": 4304.8, + "valid_targets_min": 1279 + }, + { + "epoch": 6.513881613410162, + "grad_norm": 0.6421579092608279, + "learning_rate": 5.860790472262534e-07, + "loss": 0.186, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09606657922267914, + "step": 12435, + "valid_targets_mean": 3600.0, + "valid_targets_min": 1798 + }, + { + "epoch": 6.5165007857517026, + "grad_norm": 0.6457038058905296, + "learning_rate": 5.798178947769106e-07, + "loss": 0.188, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08636249601840973, + "step": 12440, + "valid_targets_mean": 3067.2, + "valid_targets_min": 1446 + }, + { + "epoch": 6.519119958093243, + "grad_norm": 0.6154324966048933, + "learning_rate": 5.735898745517499e-07, + "loss": 0.188, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0979316383600235, + "step": 12445, + "valid_targets_mean": 4183.2, + "valid_targets_min": 1270 + }, + { + "epoch": 6.521739130434782, + "grad_norm": 0.5862027446389466, + "learning_rate": 5.673949971762249e-07, + "loss": 0.1931, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10502250492572784, + "step": 12450, + "valid_targets_mean": 5485.8, + "valid_targets_min": 1216 + }, + { + "epoch": 6.524358302776323, + "grad_norm": 0.6376219612800321, + "learning_rate": 5.612332732192416e-07, + "loss": 0.1843, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10316480696201324, + "step": 12455, + "valid_targets_mean": 3994.0, + "valid_targets_min": 2028 + }, + { + "epoch": 6.526977475117863, + "grad_norm": 0.6787194184067051, + "learning_rate": 5.551047131931442e-07, + "loss": 0.195, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11441092193126678, + "step": 12460, + "valid_targets_mean": 3700.6, + "valid_targets_min": 2329 + }, + { + "epoch": 6.529596647459403, + "grad_norm": 0.6767800339802285, + "learning_rate": 5.490093275536934e-07, + "loss": 0.1916, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11958886682987213, + "step": 12465, + "valid_targets_mean": 4075.2, + "valid_targets_min": 1363 + }, + { + "epoch": 6.532215819800943, + "grad_norm": 0.6225915057487827, + "learning_rate": 5.429471267000552e-07, + "loss": 0.1814, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08626016974449158, + "step": 12470, + "valid_targets_mean": 3560.8, + "valid_targets_min": 1087 + }, + { + "epoch": 6.534834992142483, + "grad_norm": 0.6555202364215589, + "learning_rate": 5.36918120974781e-07, + "loss": 0.1948, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09971264004707336, + "step": 12475, + "valid_targets_mean": 3860.1, + "valid_targets_min": 2483 + }, + { + "epoch": 6.537454164484023, + "grad_norm": 0.6733343811998177, + "learning_rate": 5.309223206637826e-07, + "loss": 0.1956, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11346982419490814, + "step": 12480, + "valid_targets_mean": 4583.2, + "valid_targets_min": 2316 + }, + { + "epoch": 6.5400733368255635, + "grad_norm": 0.6473883245274624, + "learning_rate": 5.249597359963332e-07, + "loss": 0.1866, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09985611587762833, + "step": 12485, + "valid_targets_mean": 4198.9, + "valid_targets_min": 2022 + }, + { + "epoch": 6.542692509167103, + "grad_norm": 0.6039774253852044, + "learning_rate": 5.190303771450222e-07, + "loss": 0.1793, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07155510783195496, + "step": 12490, + "valid_targets_mean": 3228.9, + "valid_targets_min": 1294 + }, + { + "epoch": 6.545311681508643, + "grad_norm": 0.6989217643366192, + "learning_rate": 5.131342542257666e-07, + "loss": 0.1977, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11551254987716675, + "step": 12495, + "valid_targets_mean": 3846.8, + "valid_targets_min": 2716 + }, + { + "epoch": 6.5479308538501835, + "grad_norm": 0.6953253783559055, + "learning_rate": 5.072713772977711e-07, + "loss": 0.1892, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09119541943073273, + "step": 12500, + "valid_targets_mean": 3211.6, + "valid_targets_min": 2060 + }, + { + "epoch": 6.550550026191724, + "grad_norm": 0.6984431761510316, + "learning_rate": 5.014417563635276e-07, + "loss": 0.1887, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09894177317619324, + "step": 12505, + "valid_targets_mean": 3320.4, + "valid_targets_min": 2407 + }, + { + "epoch": 6.553169198533263, + "grad_norm": 0.611165944926459, + "learning_rate": 4.956454013687873e-07, + "loss": 0.1927, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10009843111038208, + "step": 12510, + "valid_targets_mean": 4165.1, + "valid_targets_min": 1533 + }, + { + "epoch": 6.5557883708748035, + "grad_norm": 0.6677128161368928, + "learning_rate": 4.898823222025462e-07, + "loss": 0.1964, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12110663950443268, + "step": 12515, + "valid_targets_mean": 5201.2, + "valid_targets_min": 2189 + }, + { + "epoch": 6.558407543216344, + "grad_norm": 0.6393601054937041, + "learning_rate": 4.841525286970327e-07, + "loss": 0.1871, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11260367929935455, + "step": 12520, + "valid_targets_mean": 4193.1, + "valid_targets_min": 1328 + }, + { + "epoch": 6.561026715557884, + "grad_norm": 0.6701988763152277, + "learning_rate": 4.784560306276875e-07, + "loss": 0.2032, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13839399814605713, + "step": 12525, + "valid_targets_mean": 4500.4, + "valid_targets_min": 1708 + }, + { + "epoch": 6.5636458878994235, + "grad_norm": 0.6291661582869631, + "learning_rate": 4.727928377131363e-07, + "loss": 0.1826, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07673248648643494, + "step": 12530, + "valid_targets_mean": 3494.0, + "valid_targets_min": 1912 + }, + { + "epoch": 6.566265060240964, + "grad_norm": 0.676320891906221, + "learning_rate": 4.6716295961520384e-07, + "loss": 0.1807, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11168824881315231, + "step": 12535, + "valid_targets_mean": 4145.2, + "valid_targets_min": 2606 + }, + { + "epoch": 6.568884232582504, + "grad_norm": 0.6125559428322571, + "learning_rate": 4.6156640593885805e-07, + "loss": 0.1812, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08832336217164993, + "step": 12540, + "valid_targets_mean": 4189.0, + "valid_targets_min": 1378 + }, + { + "epoch": 6.571503404924044, + "grad_norm": 0.6638100292937631, + "learning_rate": 4.560031862322278e-07, + "loss": 0.1901, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11195237934589386, + "step": 12545, + "valid_targets_mean": 3983.4, + "valid_targets_min": 1219 + }, + { + "epoch": 6.574122577265584, + "grad_norm": 0.6212782016254619, + "learning_rate": 4.504733099865566e-07, + "loss": 0.1963, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09998372197151184, + "step": 12550, + "valid_targets_mean": 3997.0, + "valid_targets_min": 2631 + }, + { + "epoch": 6.576741749607124, + "grad_norm": 0.6954308718876611, + "learning_rate": 4.4497678663621756e-07, + "loss": 0.1938, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11565820127725601, + "step": 12555, + "valid_targets_mean": 4167.4, + "valid_targets_min": 1423 + }, + { + "epoch": 6.579360921948664, + "grad_norm": 0.6549184271938823, + "learning_rate": 4.395136255586696e-07, + "loss": 0.1874, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07491223514080048, + "step": 12560, + "valid_targets_mean": 3381.9, + "valid_targets_min": 2320 + }, + { + "epoch": 6.581980094290204, + "grad_norm": 0.7132956672725176, + "learning_rate": 4.340838360744615e-07, + "loss": 0.1946, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09730696678161621, + "step": 12565, + "valid_targets_mean": 3174.9, + "valid_targets_min": 1188 + }, + { + "epoch": 6.584599266631744, + "grad_norm": 0.613721618741684, + "learning_rate": 4.286874274471986e-07, + "loss": 0.1968, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07196123898029327, + "step": 12570, + "valid_targets_mean": 3378.6, + "valid_targets_min": 618 + }, + { + "epoch": 6.587218438973284, + "grad_norm": 0.7250752630540884, + "learning_rate": 4.233244088835453e-07, + "loss": 0.1914, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10160218179225922, + "step": 12575, + "valid_targets_mean": 2988.1, + "valid_targets_min": 1364 + }, + { + "epoch": 6.589837611314825, + "grad_norm": 0.6503760009869628, + "learning_rate": 4.1799478953319814e-07, + "loss": 0.1826, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08129014819860458, + "step": 12580, + "valid_targets_mean": 3199.1, + "valid_targets_min": 1397 + }, + { + "epoch": 6.592456783656365, + "grad_norm": 0.6238635228912598, + "learning_rate": 4.1269857848886153e-07, + "loss": 0.1776, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10387745499610901, + "step": 12585, + "valid_targets_mean": 5348.0, + "valid_targets_min": 1778 + }, + { + "epoch": 6.595075955997904, + "grad_norm": 0.6460935080740302, + "learning_rate": 4.074357847862609e-07, + "loss": 0.1772, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09542147815227509, + "step": 12590, + "valid_targets_mean": 3444.9, + "valid_targets_min": 621 + }, + { + "epoch": 6.597695128339445, + "grad_norm": 0.6121163929342296, + "learning_rate": 4.022064174040918e-07, + "loss": 0.1722, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07590524852275848, + "step": 12595, + "valid_targets_mean": 3872.9, + "valid_targets_min": 1290 + }, + { + "epoch": 6.600314300680985, + "grad_norm": 0.7923605265608449, + "learning_rate": 3.9701048526403774e-07, + "loss": 0.1738, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08326010406017303, + "step": 12600, + "valid_targets_mean": 2546.6, + "valid_targets_min": 642 + }, + { + "epoch": 6.602933473022524, + "grad_norm": 0.6844825101895506, + "learning_rate": 3.9184799723072764e-07, + "loss": 0.1703, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09406258165836334, + "step": 12605, + "valid_targets_mean": 3428.2, + "valid_targets_min": 1978 + }, + { + "epoch": 6.605552645364065, + "grad_norm": 0.6745675038663468, + "learning_rate": 3.867189621117362e-07, + "loss": 0.1886, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12714041769504547, + "step": 12610, + "valid_targets_mean": 4160.0, + "valid_targets_min": 2642 + }, + { + "epoch": 6.608171817705605, + "grad_norm": 0.6502643748669914, + "learning_rate": 3.81623388657566e-07, + "loss": 0.1947, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07471387088298798, + "step": 12615, + "valid_targets_mean": 2937.1, + "valid_targets_min": 1510 + }, + { + "epoch": 6.610790990047145, + "grad_norm": 0.7399225689301697, + "learning_rate": 3.7656128556163407e-07, + "loss": 0.1815, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09238269180059433, + "step": 12620, + "valid_targets_mean": 2744.2, + "valid_targets_min": 987 + }, + { + "epoch": 6.613410162388686, + "grad_norm": 0.6197270407292439, + "learning_rate": 3.7153266146024547e-07, + "loss": 0.1857, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08794254064559937, + "step": 12625, + "valid_targets_mean": 3638.4, + "valid_targets_min": 1428 + }, + { + "epoch": 6.616029334730225, + "grad_norm": 0.6334397777503624, + "learning_rate": 3.6653752493259976e-07, + "loss": 0.1843, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10795360803604126, + "step": 12630, + "valid_targets_mean": 4731.5, + "valid_targets_min": 1700 + }, + { + "epoch": 6.618648507071765, + "grad_norm": 0.5566634348297339, + "learning_rate": 3.615758845007533e-07, + "loss": 0.1791, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08727572858333588, + "step": 12635, + "valid_targets_mean": 5699.6, + "valid_targets_min": 1767 + }, + { + "epoch": 6.621267679413306, + "grad_norm": 0.5570405375278416, + "learning_rate": 3.5664774862962605e-07, + "loss": 0.1838, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08419948816299438, + "step": 12640, + "valid_targets_mean": 4101.5, + "valid_targets_min": 2684 + }, + { + "epoch": 6.623886851754845, + "grad_norm": 0.6816645231727136, + "learning_rate": 3.5175312572696795e-07, + "loss": 0.1787, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08527840673923492, + "step": 12645, + "valid_targets_mean": 2761.2, + "valid_targets_min": 1542 + }, + { + "epoch": 6.626506024096385, + "grad_norm": 0.6537470489254144, + "learning_rate": 3.468920241433571e-07, + "loss": 0.1835, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07553485035896301, + "step": 12650, + "valid_targets_mean": 2765.8, + "valid_targets_min": 1476 + }, + { + "epoch": 6.629125196437926, + "grad_norm": 0.6249077159518814, + "learning_rate": 3.4206445217217944e-07, + "loss": 0.1839, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08840804547071457, + "step": 12655, + "valid_targets_mean": 3884.5, + "valid_targets_min": 1711 + }, + { + "epoch": 6.631744368779466, + "grad_norm": 0.6499343409410591, + "learning_rate": 3.3727041804962447e-07, + "loss": 0.1858, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09530726075172424, + "step": 12660, + "valid_targets_mean": 3235.6, + "valid_targets_min": 1669 + }, + { + "epoch": 6.634363541121006, + "grad_norm": 0.6919759268955735, + "learning_rate": 3.3250992995465416e-07, + "loss": 0.1928, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.092196524143219, + "step": 12665, + "valid_targets_mean": 3388.5, + "valid_targets_min": 1624 + }, + { + "epoch": 6.636982713462546, + "grad_norm": 0.6748818891045982, + "learning_rate": 3.277829960090073e-07, + "loss": 0.1874, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09625837206840515, + "step": 12670, + "valid_targets_mean": 3380.9, + "valid_targets_min": 1676 + }, + { + "epoch": 6.639601885804086, + "grad_norm": 0.6481965100625632, + "learning_rate": 3.230896242771642e-07, + "loss": 0.197, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07984872162342072, + "step": 12675, + "valid_targets_mean": 3148.4, + "valid_targets_min": 1500 + }, + { + "epoch": 6.642221058145626, + "grad_norm": 0.5984040546530887, + "learning_rate": 3.184298227663618e-07, + "loss": 0.1795, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08513247966766357, + "step": 12680, + "valid_targets_mean": 4343.5, + "valid_targets_min": 2556 + }, + { + "epoch": 6.644840230487166, + "grad_norm": 0.677679937873208, + "learning_rate": 3.13803599426552e-07, + "loss": 0.2025, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07720249146223068, + "step": 12685, + "valid_targets_mean": 3299.5, + "valid_targets_min": 1241 + }, + { + "epoch": 6.647459402828706, + "grad_norm": 0.7324573724604573, + "learning_rate": 3.092109621504058e-07, + "loss": 0.197, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1175050139427185, + "step": 12690, + "valid_targets_mean": 3547.0, + "valid_targets_min": 992 + }, + { + "epoch": 6.650078575170246, + "grad_norm": 0.6946700460208859, + "learning_rate": 3.0465191877329104e-07, + "loss": 0.1854, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10434059053659439, + "step": 12695, + "valid_targets_mean": 4328.6, + "valid_targets_min": 1133 + }, + { + "epoch": 6.6526977475117866, + "grad_norm": 0.6687980880353598, + "learning_rate": 3.001264770732615e-07, + "loss": 0.1854, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09853892028331757, + "step": 12700, + "valid_targets_mean": 4202.6, + "valid_targets_min": 2369 + }, + { + "epoch": 6.655316919853326, + "grad_norm": 0.6663236224684165, + "learning_rate": 2.9563464477104786e-07, + "loss": 0.1876, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07648585736751556, + "step": 12705, + "valid_targets_mean": 3563.0, + "valid_targets_min": 1919 + }, + { + "epoch": 6.657936092194866, + "grad_norm": 0.6637108325798059, + "learning_rate": 2.9117642953003564e-07, + "loss": 0.1919, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11010406911373138, + "step": 12710, + "valid_targets_mean": 3975.5, + "valid_targets_min": 2902 + }, + { + "epoch": 6.660555264536407, + "grad_norm": 0.7498564576579266, + "learning_rate": 2.867518389562629e-07, + "loss": 0.1909, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11214965581893921, + "step": 12715, + "valid_targets_mean": 2975.5, + "valid_targets_min": 617 + }, + { + "epoch": 6.663174436877947, + "grad_norm": 0.6239320454745892, + "learning_rate": 2.823608805983957e-07, + "loss": 0.1719, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0791563019156456, + "step": 12720, + "valid_targets_mean": 3290.4, + "valid_targets_min": 1349 + }, + { + "epoch": 6.665793609219486, + "grad_norm": 0.6505688926922241, + "learning_rate": 2.7800356194772836e-07, + "loss": 0.1837, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0979127585887909, + "step": 12725, + "valid_targets_mean": 3459.0, + "valid_targets_min": 1769 + }, + { + "epoch": 6.668412781561027, + "grad_norm": 0.6130763206181329, + "learning_rate": 2.7367989043815434e-07, + "loss": 0.18, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0859518051147461, + "step": 12730, + "valid_targets_mean": 4186.1, + "valid_targets_min": 2097 + }, + { + "epoch": 6.671031953902567, + "grad_norm": 0.682777529916058, + "learning_rate": 2.6938987344616864e-07, + "loss": 0.1875, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09927409142255783, + "step": 12735, + "valid_targets_mean": 3304.0, + "valid_targets_min": 1066 + }, + { + "epoch": 6.673651126244107, + "grad_norm": 0.6139750346228053, + "learning_rate": 2.651335182908499e-07, + "loss": 0.181, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09072718769311905, + "step": 12740, + "valid_targets_mean": 4457.9, + "valid_targets_min": 2635 + }, + { + "epoch": 6.676270298585647, + "grad_norm": 0.6688779633764557, + "learning_rate": 2.6091083223384496e-07, + "loss": 0.1931, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10317809879779816, + "step": 12745, + "valid_targets_mean": 4296.2, + "valid_targets_min": 981 + }, + { + "epoch": 6.678889470927187, + "grad_norm": 0.6153838140431476, + "learning_rate": 2.5672182247935773e-07, + "loss": 0.1818, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08931320160627365, + "step": 12750, + "valid_targets_mean": 4020.1, + "valid_targets_min": 2131 + }, + { + "epoch": 6.681508643268727, + "grad_norm": 0.6841531773090127, + "learning_rate": 2.525664961741403e-07, + "loss": 0.1821, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09330379217863083, + "step": 12755, + "valid_targets_mean": 3541.0, + "valid_targets_min": 1353 + }, + { + "epoch": 6.6841278156102675, + "grad_norm": 0.5892914974913471, + "learning_rate": 2.484448604074796e-07, + "loss": 0.1868, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07329745590686798, + "step": 12760, + "valid_targets_mean": 3362.0, + "valid_targets_min": 1509 + }, + { + "epoch": 6.686746987951807, + "grad_norm": 0.6057942078920835, + "learning_rate": 2.4435692221117966e-07, + "loss": 0.179, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08245901763439178, + "step": 12765, + "valid_targets_mean": 3918.9, + "valid_targets_min": 2128 + }, + { + "epoch": 6.689366160293347, + "grad_norm": 0.7912254274223812, + "learning_rate": 2.4030268855955495e-07, + "loss": 0.172, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07037973403930664, + "step": 12770, + "valid_targets_mean": 2919.0, + "valid_targets_min": 1687 + }, + { + "epoch": 6.6919853326348875, + "grad_norm": 0.6624467951019597, + "learning_rate": 2.362821663694237e-07, + "loss": 0.1815, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10190001875162125, + "step": 12775, + "valid_targets_mean": 3696.9, + "valid_targets_min": 1803 + }, + { + "epoch": 6.694604504976428, + "grad_norm": 0.6255604822386763, + "learning_rate": 2.32295362500079e-07, + "loss": 0.1771, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08623208105564117, + "step": 12780, + "valid_targets_mean": 4102.0, + "valid_targets_min": 2263 + }, + { + "epoch": 6.697223677317967, + "grad_norm": 0.6706980490532756, + "learning_rate": 2.2834228375330003e-07, + "loss": 0.1785, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10698755085468292, + "step": 12785, + "valid_targets_mean": 4621.4, + "valid_targets_min": 2232 + }, + { + "epoch": 6.6998428496595075, + "grad_norm": 0.6372593378139074, + "learning_rate": 2.2442293687331863e-07, + "loss": 0.1687, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10318998992443085, + "step": 12790, + "valid_targets_mean": 4051.6, + "valid_targets_min": 873 + }, + { + "epoch": 6.702462022001048, + "grad_norm": 0.6193928640374642, + "learning_rate": 2.2053732854682598e-07, + "loss": 0.1729, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07823237776756287, + "step": 12795, + "valid_targets_mean": 3340.1, + "valid_targets_min": 1942 + }, + { + "epoch": 6.705081194342588, + "grad_norm": 0.6780240423049211, + "learning_rate": 2.16685465402946e-07, + "loss": 0.179, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08720569312572479, + "step": 12800, + "valid_targets_mean": 3179.4, + "valid_targets_min": 897 + }, + { + "epoch": 6.7077003666841275, + "grad_norm": 0.659535201767842, + "learning_rate": 2.128673540132331e-07, + "loss": 0.193, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09473605453968048, + "step": 12805, + "valid_targets_mean": 3492.2, + "valid_targets_min": 1695 + }, + { + "epoch": 6.710319539025668, + "grad_norm": 0.6495919509093001, + "learning_rate": 2.090830008916589e-07, + "loss": 0.1735, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07860636711120605, + "step": 12810, + "valid_targets_mean": 4043.9, + "valid_targets_min": 1712 + }, + { + "epoch": 6.712938711367208, + "grad_norm": 0.611522543603785, + "learning_rate": 2.0533241249460545e-07, + "loss": 0.176, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07307950407266617, + "step": 12815, + "valid_targets_mean": 2987.9, + "valid_targets_min": 993 + }, + { + "epoch": 6.715557883708748, + "grad_norm": 0.5993522606495606, + "learning_rate": 2.0161559522084095e-07, + "loss": 0.1709, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08598138391971588, + "step": 12820, + "valid_targets_mean": 3854.8, + "valid_targets_min": 1679 + }, + { + "epoch": 6.718177056050288, + "grad_norm": 0.5714454997499965, + "learning_rate": 1.9793255541152633e-07, + "loss": 0.1803, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08323566615581512, + "step": 12825, + "valid_targets_mean": 3938.8, + "valid_targets_min": 2345 + }, + { + "epoch": 6.720796228391828, + "grad_norm": 0.6519650606498112, + "learning_rate": 1.9428329935018642e-07, + "loss": 0.1845, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09488783776760101, + "step": 12830, + "valid_targets_mean": 4507.9, + "valid_targets_min": 3068 + }, + { + "epoch": 6.723415400733368, + "grad_norm": 0.6573069225818161, + "learning_rate": 1.9066783326272098e-07, + "loss": 0.1821, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08799446374177933, + "step": 12835, + "valid_targets_mean": 4080.9, + "valid_targets_min": 2965 + }, + { + "epoch": 6.726034573074909, + "grad_norm": 0.6211160166989392, + "learning_rate": 1.870861633173693e-07, + "loss": 0.1795, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07835432887077332, + "step": 12840, + "valid_targets_mean": 2993.5, + "valid_targets_min": 1817 + }, + { + "epoch": 6.728653745416448, + "grad_norm": 0.6320423602834774, + "learning_rate": 1.8353829562471893e-07, + "loss": 0.1778, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0895933210849762, + "step": 12845, + "valid_targets_mean": 3795.2, + "valid_targets_min": 1727 + }, + { + "epoch": 6.731272917757988, + "grad_norm": 0.5841924116488029, + "learning_rate": 1.8002423623768584e-07, + "loss": 0.1771, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08804034441709518, + "step": 12850, + "valid_targets_mean": 4095.9, + "valid_targets_min": 2491 + }, + { + "epoch": 6.733892090099529, + "grad_norm": 0.5169148104446686, + "learning_rate": 1.7654399115150988e-07, + "loss": 0.1459, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09014087915420532, + "step": 12855, + "valid_targets_mean": 2046.1, + "valid_targets_min": 333 + }, + { + "epoch": 6.736511262441068, + "grad_norm": 0.38211913498028294, + "learning_rate": 1.7309756630373486e-07, + "loss": 0.0801, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04085535183548927, + "step": 12860, + "valid_targets_mean": 3455.9, + "valid_targets_min": 712 + }, + { + "epoch": 6.739130434782608, + "grad_norm": 0.4488289713041321, + "learning_rate": 1.6968496757421294e-07, + "loss": 0.0747, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0355193093419075, + "step": 12865, + "valid_targets_mean": 2452.6, + "valid_targets_min": 732 + }, + { + "epoch": 6.741749607124149, + "grad_norm": 0.5332516349959687, + "learning_rate": 1.663062007850824e-07, + "loss": 0.082, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03894609957933426, + "step": 12870, + "valid_targets_mean": 2228.9, + "valid_targets_min": 803 + }, + { + "epoch": 6.744368779465689, + "grad_norm": 0.3891080450363208, + "learning_rate": 1.6296127170075894e-07, + "loss": 0.0724, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.035704925656318665, + "step": 12875, + "valid_targets_mean": 3038.6, + "valid_targets_min": 818 + }, + { + "epoch": 6.746987951807229, + "grad_norm": 0.4282429329715162, + "learning_rate": 1.5965018602793315e-07, + "loss": 0.0767, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04017750546336174, + "step": 12880, + "valid_targets_mean": 3049.4, + "valid_targets_min": 1524 + }, + { + "epoch": 6.749607124148769, + "grad_norm": 0.802341758882023, + "learning_rate": 1.5637294941555526e-07, + "loss": 0.1187, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05328008532524109, + "step": 12885, + "valid_targets_mean": 1256.1, + "valid_targets_min": 539 + }, + { + "epoch": 6.752226296490309, + "grad_norm": 0.390005962090855, + "learning_rate": 1.5312956745482388e-07, + "loss": 0.0878, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03711675852537155, + "step": 12890, + "valid_targets_mean": 3597.0, + "valid_targets_min": 2920 + }, + { + "epoch": 6.754845468831849, + "grad_norm": 0.46639672819519007, + "learning_rate": 1.4992004567918383e-07, + "loss": 0.0844, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04318893328309059, + "step": 12895, + "valid_targets_mean": 2737.9, + "valid_targets_min": 1048 + }, + { + "epoch": 6.757464641173389, + "grad_norm": 0.30713773620726875, + "learning_rate": 1.4674438956430837e-07, + "loss": 0.1103, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.02616284415125847, + "step": 12900, + "valid_targets_mean": 4340.1, + "valid_targets_min": 962 + }, + { + "epoch": 6.760083813514929, + "grad_norm": 0.3858031244610261, + "learning_rate": 1.4360260452809472e-07, + "loss": 0.0646, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.041911303997039795, + "step": 12905, + "valid_targets_mean": 4283.1, + "valid_targets_min": 2091 + }, + { + "epoch": 6.762702985856469, + "grad_norm": 0.3659335945049293, + "learning_rate": 1.4049469593065524e-07, + "loss": 0.0727, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03540034592151642, + "step": 12910, + "valid_targets_mean": 4320.9, + "valid_targets_min": 3349 + }, + { + "epoch": 6.76532215819801, + "grad_norm": 0.4146819659753387, + "learning_rate": 1.3742066907430185e-07, + "loss": 0.0741, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03829266503453255, + "step": 12915, + "valid_targets_mean": 3895.9, + "valid_targets_min": 518 + }, + { + "epoch": 6.76794133053955, + "grad_norm": 0.5409036972770743, + "learning_rate": 1.3438052920354827e-07, + "loss": 0.1116, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04457290470600128, + "step": 12920, + "valid_targets_mean": 2219.6, + "valid_targets_min": 549 + }, + { + "epoch": 6.770560502881089, + "grad_norm": 0.35095890145217795, + "learning_rate": 1.313742815050878e-07, + "loss": 0.0665, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.029218202456831932, + "step": 12925, + "valid_targets_mean": 3700.2, + "valid_targets_min": 2724 + }, + { + "epoch": 6.77317967522263, + "grad_norm": 0.49776452924136344, + "learning_rate": 1.2840193110779776e-07, + "loss": 0.0782, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.039242640137672424, + "step": 12930, + "valid_targets_mean": 1672.5, + "valid_targets_min": 775 + }, + { + "epoch": 6.77579884756417, + "grad_norm": 0.3355855933765676, + "learning_rate": 1.2546348308271949e-07, + "loss": 0.0632, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.02106427773833275, + "step": 12935, + "valid_targets_mean": 3546.2, + "valid_targets_min": 3183 + }, + { + "epoch": 6.778418019905709, + "grad_norm": 0.4377025120082717, + "learning_rate": 1.2255894244305843e-07, + "loss": 0.0773, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03368924558162689, + "step": 12940, + "valid_targets_mean": 2473.2, + "valid_targets_min": 577 + }, + { + "epoch": 6.78103719224725, + "grad_norm": 0.5287519420200428, + "learning_rate": 1.1968831414416626e-07, + "loss": 0.0849, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.055708516389131546, + "step": 12945, + "valid_targets_mean": 1597.0, + "valid_targets_min": 557 + }, + { + "epoch": 6.78365636458879, + "grad_norm": 0.4376992157043782, + "learning_rate": 1.1685160308354315e-07, + "loss": 0.0806, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04162124544382095, + "step": 12950, + "valid_targets_mean": 3019.1, + "valid_targets_min": 774 + }, + { + "epoch": 6.78627553693033, + "grad_norm": 0.41988601074037835, + "learning_rate": 1.1404881410082002e-07, + "loss": 0.0823, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03479935973882675, + "step": 12955, + "valid_targets_mean": 1825.8, + "valid_targets_min": 680 + }, + { + "epoch": 6.7888947092718706, + "grad_norm": 0.49979181398974065, + "learning_rate": 1.1127995197775632e-07, + "loss": 0.1213, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0622258298099041, + "step": 12960, + "valid_targets_mean": 3686.9, + "valid_targets_min": 2819 + }, + { + "epoch": 6.79151388161341, + "grad_norm": 0.31947197879194844, + "learning_rate": 1.085450214382311e-07, + "loss": 0.0689, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.02941582351922989, + "step": 12965, + "valid_targets_mean": 4137.8, + "valid_targets_min": 3927 + }, + { + "epoch": 6.79413305395495, + "grad_norm": 0.552564569567585, + "learning_rate": 1.0584402714822972e-07, + "loss": 0.0794, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0524916835129261, + "step": 12970, + "valid_targets_mean": 1376.1, + "valid_targets_min": 714 + }, + { + "epoch": 6.796752226296491, + "grad_norm": 0.4017964533375128, + "learning_rate": 1.031769737158439e-07, + "loss": 0.1005, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03385963290929794, + "step": 12975, + "valid_targets_mean": 3432.0, + "valid_targets_min": 754 + }, + { + "epoch": 6.79937139863803, + "grad_norm": 0.39071375705825395, + "learning_rate": 1.0054386569126051e-07, + "loss": 0.0885, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.037942830473184586, + "step": 12980, + "valid_targets_mean": 3855.2, + "valid_targets_min": 3178 + }, + { + "epoch": 6.80199057097957, + "grad_norm": 0.7343800331543665, + "learning_rate": 9.79447075667439e-08, + "loss": 0.1086, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11189083755016327, + "step": 12985, + "valid_targets_mean": 1566.6, + "valid_targets_min": 920 + }, + { + "epoch": 6.804609743321111, + "grad_norm": 0.460517421977809, + "learning_rate": 9.53795037766514e-08, + "loss": 0.2418, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03707824647426605, + "step": 12990, + "valid_targets_mean": 3478.0, + "valid_targets_min": 2314 + }, + { + "epoch": 6.807228915662651, + "grad_norm": 0.40921888799466477, + "learning_rate": 9.284825869739999e-08, + "loss": 0.0848, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.031269654631614685, + "step": 12995, + "valid_targets_mean": 2561.1, + "valid_targets_min": 833 + }, + { + "epoch": 6.809848088004191, + "grad_norm": 0.4426077347230882, + "learning_rate": 9.035097664747972e-08, + "loss": 0.0825, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.049915894865989685, + "step": 13000, + "valid_targets_mean": 3509.2, + "valid_targets_min": 1803 + }, + { + "epoch": 6.812467260345731, + "grad_norm": 0.4285004055276, + "learning_rate": 8.788766188742914e-08, + "loss": 0.1731, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05492042750120163, + "step": 13005, + "valid_targets_mean": 4291.4, + "valid_targets_min": 3089 + }, + { + "epoch": 6.815086432687271, + "grad_norm": 0.2697662860913481, + "learning_rate": 8.545831861983989e-08, + "loss": 0.0619, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03071390651166439, + "step": 13010, + "valid_targets_mean": 4843.2, + "valid_targets_min": 2664 + }, + { + "epoch": 6.817705605028811, + "grad_norm": 0.3521097778524677, + "learning_rate": 8.306295098934991e-08, + "loss": 0.0851, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.023876160383224487, + "step": 13015, + "valid_targets_mean": 3042.1, + "valid_targets_min": 560 + }, + { + "epoch": 6.820324777370351, + "grad_norm": 0.4436727602143218, + "learning_rate": 8.070156308262356e-08, + "loss": 0.0817, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04059450328350067, + "step": 13020, + "valid_targets_mean": 3863.6, + "valid_targets_min": 1615 + }, + { + "epoch": 6.822943949711891, + "grad_norm": 0.37161958824132174, + "learning_rate": 7.837415892836264e-08, + "loss": 0.069, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.02635052613914013, + "step": 13025, + "valid_targets_mean": 3312.5, + "valid_targets_min": 2172 + }, + { + "epoch": 6.825563122053431, + "grad_norm": 0.3756347701876398, + "learning_rate": 7.608074249728204e-08, + "loss": 0.0676, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0313107855618, + "step": 13030, + "valid_targets_mean": 3059.9, + "valid_targets_min": 536 + }, + { + "epoch": 6.8281822943949715, + "grad_norm": 0.38514610915482933, + "learning_rate": 7.382131770211409e-08, + "loss": 0.0712, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03413877636194229, + "step": 13035, + "valid_targets_mean": 3881.0, + "valid_targets_min": 3295 + }, + { + "epoch": 6.830801466736511, + "grad_norm": 0.3701505847408979, + "learning_rate": 7.159588839760423e-08, + "loss": 0.0668, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.027802327647805214, + "step": 13040, + "valid_targets_mean": 3287.2, + "valid_targets_min": 820 + }, + { + "epoch": 6.833420639078051, + "grad_norm": 0.6436076477730783, + "learning_rate": 6.940445838049093e-08, + "loss": 0.1063, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10774976760149002, + "step": 13045, + "valid_targets_mean": 2566.6, + "valid_targets_min": 1046 + }, + { + "epoch": 6.8360398114195915, + "grad_norm": 0.3211581572540816, + "learning_rate": 6.724703138951017e-08, + "loss": 0.064, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.031185396015644073, + "step": 13050, + "valid_targets_mean": 3590.1, + "valid_targets_min": 2719 + }, + { + "epoch": 6.838658983761132, + "grad_norm": 0.6395463224449414, + "learning_rate": 6.5123611105391e-08, + "loss": 0.0663, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05162978917360306, + "step": 13055, + "valid_targets_mean": 1638.1, + "valid_targets_min": 699 + }, + { + "epoch": 6.841278156102671, + "grad_norm": 0.3482974711492975, + "learning_rate": 6.303420115083781e-08, + "loss": 0.063, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.02813403680920601, + "step": 13060, + "valid_targets_mean": 3621.6, + "valid_targets_min": 2353 + }, + { + "epoch": 6.8438973284442115, + "grad_norm": 0.3862083760665773, + "learning_rate": 6.097880509053467e-08, + "loss": 0.0641, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.02983633428812027, + "step": 13065, + "valid_targets_mean": 2328.1, + "valid_targets_min": 549 + }, + { + "epoch": 6.846516500785752, + "grad_norm": 0.4292286502108055, + "learning_rate": 5.8957426431136554e-08, + "loss": 0.1103, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.028507661074399948, + "step": 13070, + "valid_targets_mean": 3330.4, + "valid_targets_min": 908 + }, + { + "epoch": 6.849135673127292, + "grad_norm": 0.4010713221943791, + "learning_rate": 5.69700686212582e-08, + "loss": 0.0929, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06634754687547684, + "step": 13075, + "valid_targets_mean": 3458.4, + "valid_targets_min": 2196 + }, + { + "epoch": 6.8517548454688315, + "grad_norm": 0.3699757785067211, + "learning_rate": 5.5016735051474093e-08, + "loss": 0.0769, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.026269644498825073, + "step": 13080, + "valid_targets_mean": 1252.1, + "valid_targets_min": 598 + }, + { + "epoch": 6.854374017810372, + "grad_norm": 0.9234512573724675, + "learning_rate": 5.309742905431403e-08, + "loss": 0.0904, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08189341425895691, + "step": 13085, + "valid_targets_mean": 1353.1, + "valid_targets_min": 578 + }, + { + "epoch": 6.856993190151912, + "grad_norm": 0.6584269157012614, + "learning_rate": 5.121215390424761e-08, + "loss": 0.1143, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.06208275631070137, + "step": 13090, + "valid_targets_mean": 1974.2, + "valid_targets_min": 695 + }, + { + "epoch": 6.859612362493452, + "grad_norm": 0.4854169557630643, + "learning_rate": 4.9360912817695286e-08, + "loss": 0.0774, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03507557511329651, + "step": 13095, + "valid_targets_mean": 1724.5, + "valid_targets_min": 691 + }, + { + "epoch": 6.862231534834992, + "grad_norm": 0.3355601007497446, + "learning_rate": 4.7543708953003974e-08, + "loss": 0.0944, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.029666226357221603, + "step": 13100, + "valid_targets_mean": 3842.6, + "valid_targets_min": 2024 + }, + { + "epoch": 6.864850707176532, + "grad_norm": 0.5702376430529507, + "learning_rate": 4.576054541045149e-08, + "loss": 0.0772, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05020301789045334, + "step": 13105, + "valid_targets_mean": 1651.0, + "valid_targets_min": 523 + }, + { + "epoch": 6.867469879518072, + "grad_norm": 0.3188062480989316, + "learning_rate": 4.4011425232248774e-08, + "loss": 0.0713, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.02868589386343956, + "step": 13110, + "valid_targets_mean": 3532.5, + "valid_targets_min": 468 + }, + { + "epoch": 6.870089051859613, + "grad_norm": 0.288519923378264, + "learning_rate": 4.229635140251542e-08, + "loss": 0.0776, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.019699353724718094, + "step": 13115, + "valid_targets_mean": 5298.0, + "valid_targets_min": 1195 + }, + { + "epoch": 6.872708224201152, + "grad_norm": 0.3565904224985087, + "learning_rate": 4.061532684729308e-08, + "loss": 0.0679, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.022875187918543816, + "step": 13120, + "valid_targets_mean": 3562.6, + "valid_targets_min": 459 + }, + { + "epoch": 6.875327396542692, + "grad_norm": 0.36958882575456525, + "learning_rate": 3.896835443452762e-08, + "loss": 0.0673, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03134230524301529, + "step": 13125, + "valid_targets_mean": 3548.0, + "valid_targets_min": 981 + }, + { + "epoch": 6.877946568884233, + "grad_norm": 0.5216557128177458, + "learning_rate": 3.735543697407362e-08, + "loss": 0.077, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.047654591500759125, + "step": 13130, + "valid_targets_mean": 2130.1, + "valid_targets_min": 697 + }, + { + "epoch": 6.880565741225773, + "grad_norm": 0.3969544010234322, + "learning_rate": 3.577657721768546e-08, + "loss": 0.0844, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.041403673589229584, + "step": 13135, + "valid_targets_mean": 3661.6, + "valid_targets_min": 2759 + }, + { + "epoch": 6.883184913567312, + "grad_norm": 0.4335928920568747, + "learning_rate": 3.423177785900844e-08, + "loss": 0.0843, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04310900717973709, + "step": 13140, + "valid_targets_mean": 3909.5, + "valid_targets_min": 3391 + }, + { + "epoch": 6.885804085908853, + "grad_norm": 0.3516525920530094, + "learning_rate": 3.272104153358324e-08, + "loss": 0.069, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03035726025700569, + "step": 13145, + "valid_targets_mean": 3319.9, + "valid_targets_min": 1099 + }, + { + "epoch": 6.888423258250393, + "grad_norm": 0.38123268468604504, + "learning_rate": 3.12443708188348e-08, + "loss": 0.0712, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0375220850110054, + "step": 13150, + "valid_targets_mean": 3717.0, + "valid_targets_min": 1874 + }, + { + "epoch": 6.891042430591933, + "grad_norm": 0.3370066351747024, + "learning_rate": 2.9801768234065663e-08, + "loss": 0.0807, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.030697906389832497, + "step": 13155, + "valid_targets_mean": 3263.5, + "valid_targets_min": 724 + }, + { + "epoch": 6.893661602933473, + "grad_norm": 0.31056030103191984, + "learning_rate": 2.8393236240464862e-08, + "loss": 0.0595, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.027445081621408463, + "step": 13160, + "valid_targets_mean": 3707.5, + "valid_targets_min": 2769 + }, + { + "epoch": 6.896280775275013, + "grad_norm": 0.4350193105458767, + "learning_rate": 2.7018777241083484e-08, + "loss": 0.078, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03260853886604309, + "step": 13165, + "valid_targets_mean": 2815.8, + "valid_targets_min": 645 + }, + { + "epoch": 6.898899947616553, + "grad_norm": 0.3672746943249268, + "learning_rate": 2.5678393580852446e-08, + "loss": 0.0733, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.02962132729589939, + "step": 13170, + "valid_targets_mean": 3488.8, + "valid_targets_min": 600 + }, + { + "epoch": 6.901519119958094, + "grad_norm": 0.47663563451660984, + "learning_rate": 2.4372087546558064e-08, + "loss": 0.0882, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03674224019050598, + "step": 13175, + "valid_targets_mean": 3373.4, + "valid_targets_min": 1648 + }, + { + "epoch": 6.904138292299633, + "grad_norm": 0.46794766227137546, + "learning_rate": 2.309986136685316e-08, + "loss": 0.0759, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04254136234521866, + "step": 13180, + "valid_targets_mean": 2555.0, + "valid_targets_min": 821 + }, + { + "epoch": 6.906757464641173, + "grad_norm": 0.8481521508164337, + "learning_rate": 2.186171721225039e-08, + "loss": 0.0858, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.05657971277832985, + "step": 13185, + "valid_targets_mean": 867.1, + "valid_targets_min": 612 + }, + { + "epoch": 6.909376636982714, + "grad_norm": 0.5203667342062566, + "learning_rate": 2.0657657195106706e-08, + "loss": 0.0754, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.055201150476932526, + "step": 13190, + "valid_targets_mean": 2202.1, + "valid_targets_min": 830 + }, + { + "epoch": 6.911995809324253, + "grad_norm": 0.4604582895283477, + "learning_rate": 1.948768336963891e-08, + "loss": 0.0868, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.033401697874069214, + "step": 13195, + "valid_targets_mean": 3027.0, + "valid_targets_min": 1146 + }, + { + "epoch": 6.914614981665793, + "grad_norm": 0.4239609510185353, + "learning_rate": 1.8351797731908093e-08, + "loss": 0.075, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.043332524597644806, + "step": 13200, + "valid_targets_mean": 3296.6, + "valid_targets_min": 2760 + }, + { + "epoch": 6.917234154007334, + "grad_norm": 0.5935804080113309, + "learning_rate": 1.725000221981077e-08, + "loss": 0.0689, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04814621061086655, + "step": 13205, + "valid_targets_mean": 1469.5, + "valid_targets_min": 628 + }, + { + "epoch": 6.919853326348874, + "grad_norm": 0.6134461274577795, + "learning_rate": 1.61822987130944e-08, + "loss": 0.0897, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07188950479030609, + "step": 13210, + "valid_targets_mean": 1752.1, + "valid_targets_min": 691 + }, + { + "epoch": 6.922472498690414, + "grad_norm": 0.3179609176982656, + "learning_rate": 1.5148689033333e-08, + "loss": 0.0684, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0196039117872715, + "step": 13215, + "valid_targets_mean": 3863.9, + "valid_targets_min": 3613 + }, + { + "epoch": 6.925091671031954, + "grad_norm": 0.3614387988412621, + "learning_rate": 1.4149174943944854e-08, + "loss": 0.0663, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03423801809549332, + "step": 13220, + "valid_targets_mean": 4304.2, + "valid_targets_min": 1773 + }, + { + "epoch": 6.927710843373494, + "grad_norm": 0.374604024416944, + "learning_rate": 1.3183758150165926e-08, + "loss": 0.0728, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.039071012288331985, + "step": 13225, + "valid_targets_mean": 1971.9, + "valid_targets_min": 762 + }, + { + "epoch": 6.930330015715034, + "grad_norm": 0.3937368208843535, + "learning_rate": 1.2252440299072022e-08, + "loss": 0.0634, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04523179307579994, + "step": 13230, + "valid_targets_mean": 4554.1, + "valid_targets_min": 946 + }, + { + "epoch": 6.932949188056574, + "grad_norm": 0.3459868864418305, + "learning_rate": 1.1355222979556601e-08, + "loss": 0.061, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04321659356355667, + "step": 13235, + "valid_targets_mean": 5015.5, + "valid_targets_min": 4104 + }, + { + "epoch": 6.935568360398114, + "grad_norm": 0.37124590537719093, + "learning_rate": 1.049210772233522e-08, + "loss": 0.08, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03389116749167442, + "step": 13240, + "valid_targets_mean": 3064.4, + "valid_targets_min": 739 + }, + { + "epoch": 6.938187532739654, + "grad_norm": 0.6654117129434783, + "learning_rate": 9.663095999947746e-09, + "loss": 0.0895, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03874023258686066, + "step": 13245, + "valid_targets_mean": 3863.6, + "valid_targets_min": 3550 + }, + { + "epoch": 6.940806705081195, + "grad_norm": 0.4001454604435511, + "learning_rate": 8.868189226742818e-09, + "loss": 0.0715, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04071683809161186, + "step": 13250, + "valid_targets_mean": 3474.9, + "valid_targets_min": 704 + }, + { + "epoch": 6.943425877422735, + "grad_norm": 0.37231918968783745, + "learning_rate": 8.107388758893386e-09, + "loss": 0.0773, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.030651133507490158, + "step": 13255, + "valid_targets_mean": 2568.8, + "valid_targets_min": 774 + }, + { + "epoch": 6.946045049764274, + "grad_norm": 0.3178243411639312, + "learning_rate": 7.380695894376733e-09, + "loss": 0.0906, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.027471695095300674, + "step": 13260, + "valid_targets_mean": 3486.2, + "valid_targets_min": 888 + }, + { + "epoch": 6.948664222105815, + "grad_norm": 0.4390643538547763, + "learning_rate": 6.688111872983349e-09, + "loss": 0.0686, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03612307459115982, + "step": 13265, + "valid_targets_mean": 3371.6, + "valid_targets_min": 1048 + }, + { + "epoch": 6.951283394447355, + "grad_norm": 0.38238054940342986, + "learning_rate": 6.0296378763125e-09, + "loss": 0.0767, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0332840159535408, + "step": 13270, + "valid_targets_mean": 2941.5, + "valid_targets_min": 722 + }, + { + "epoch": 6.953902566788894, + "grad_norm": 0.4548474365698735, + "learning_rate": 5.405275027765555e-09, + "loss": 0.0739, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04574700817465782, + "step": 13275, + "valid_targets_mean": 2359.2, + "valid_targets_min": 865 + }, + { + "epoch": 6.956521739130435, + "grad_norm": 0.48640228468480634, + "learning_rate": 4.815024392552659e-09, + "loss": 0.1072, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.030867867171764374, + "step": 13280, + "valid_targets_mean": 1747.0, + "valid_targets_min": 570 + }, + { + "epoch": 6.959140911471975, + "grad_norm": 0.41893656806678314, + "learning_rate": 4.258886977683841e-09, + "loss": 0.0894, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.04409385845065117, + "step": 13285, + "valid_targets_mean": 3704.2, + "valid_targets_min": 2811 + }, + { + "epoch": 6.961760083813515, + "grad_norm": 0.42153506890974424, + "learning_rate": 3.7368637319690204e-09, + "loss": 0.0712, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.031005047261714935, + "step": 13290, + "valid_targets_mean": 1749.1, + "valid_targets_min": 635 + }, + { + "epoch": 6.9643792561550555, + "grad_norm": 0.44756068678422617, + "learning_rate": 3.2489555460157863e-09, + "loss": 0.0699, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0354573056101799, + "step": 13295, + "valid_targets_mean": 2985.1, + "valid_targets_min": 1591 + }, + { + "epoch": 6.966998428496595, + "grad_norm": 0.4244297106292505, + "learning_rate": 2.795163252231614e-09, + "loss": 0.0686, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.030690640211105347, + "step": 13300, + "valid_targets_mean": 2912.6, + "valid_targets_min": 800 + }, + { + "epoch": 6.969617600838135, + "grad_norm": 0.36870229760270784, + "learning_rate": 2.3754876248216484e-09, + "loss": 0.0621, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.033027928322553635, + "step": 13305, + "valid_targets_mean": 3084.9, + "valid_targets_min": 860 + }, + { + "epoch": 6.9722367731796755, + "grad_norm": 0.5218797174304519, + "learning_rate": 1.9899293797753792e-09, + "loss": 0.0865, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03889650106430054, + "step": 13310, + "valid_targets_mean": 2482.6, + "valid_targets_min": 878 + }, + { + "epoch": 6.974855945521215, + "grad_norm": 0.3670369079177163, + "learning_rate": 1.6384891748910669e-09, + "loss": 0.0615, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03365497291088104, + "step": 13315, + "valid_targets_mean": 3403.2, + "valid_targets_min": 1024 + }, + { + "epoch": 6.977475117862755, + "grad_norm": 0.44160164601539337, + "learning_rate": 1.3211676097446558e-09, + "loss": 0.0681, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.034843601286411285, + "step": 13320, + "valid_targets_mean": 2173.1, + "valid_targets_min": 786 + }, + { + "epoch": 6.9800942902042955, + "grad_norm": 0.43451913090030936, + "learning_rate": 1.0379652257141991e-09, + "loss": 0.0697, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0458085760474205, + "step": 13325, + "valid_targets_mean": 3233.9, + "valid_targets_min": 2573 + }, + { + "epoch": 6.982713462545836, + "grad_norm": 0.3746873455054217, + "learning_rate": 7.888825059576555e-10, + "loss": 0.0711, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.03752672299742699, + "step": 13330, + "valid_targets_mean": 3821.9, + "valid_targets_min": 2274 + }, + { + "epoch": 6.985332634887375, + "grad_norm": 0.4241442188246108, + "learning_rate": 5.739198754350916e-10, + "loss": 0.0626, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.039890218526124954, + "step": 13335, + "valid_targets_mean": 3791.2, + "valid_targets_min": 892 + }, + { + "epoch": 6.9879518072289155, + "grad_norm": 0.3639122279373955, + "learning_rate": 3.9307770088203855e-10, + "loss": 0.0675, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.027569664642214775, + "step": 13340, + "valid_targets_mean": 4820.4, + "valid_targets_min": 4491 + }, + { + "epoch": 6.990570979570456, + "grad_norm": 0.6518008964117099, + "learning_rate": 2.463562908316952e-10, + "loss": 0.1068, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08742758631706238, + "step": 13345, + "valid_targets_mean": 2159.1, + "valid_targets_min": 709 + }, + { + "epoch": 6.993190151911996, + "grad_norm": 0.33525197631159753, + "learning_rate": 1.3375589559938562e-10, + "loss": 0.1183, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.021990729495882988, + "step": 13350, + "valid_targets_mean": 3430.8, + "valid_targets_min": 1097 + }, + { + "epoch": 6.9958093242535355, + "grad_norm": 0.3826266404168604, + "learning_rate": 5.5276707291440637e-11, + "loss": 0.0714, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.029649188742041588, + "step": 13355, + "valid_targets_mean": 3032.0, + "valid_targets_min": 840 + }, + { + "epoch": 6.998428496595076, + "grad_norm": 0.3197481698629408, + "learning_rate": 1.0918859796316127e-11, + "loss": 0.0653, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.026989787817001343, + "step": 13360, + "valid_targets_mean": 3812.2, + "valid_targets_min": 3106 + }, + { + "epoch": 7.0, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.029614586383104324, + "step": 13363, + "total_flos": 4.5218040599627694e+18, + "train_loss": 0.07040505743371078, + "train_runtime": 148647.7084, + "train_samples_per_second": 1.438, + "train_steps_per_second": 0.09, + "valid_targets_mean": 2983.1, + "valid_targets_min": 791 + } + ], + "logging_steps": 5, + "max_steps": 13363, + "num_input_tokens_seen": 0, + "num_train_epochs": 7, + "save_steps": 200, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": true + }, + "attributes": {} + } + }, + "total_flos": 4.5218040599627694e+18, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +}